In [1]:
import base64

import numpy as np
import pandas as pd
from sklearn.datasets import load_iris

### Loading the original dataset:

In [2]:
# Load the Iris dataset bundled with scikit-learn.
iris = load_iris()

In [3]:
# Split the loaded dataset into its feature matrix and its target vector.
X, y = iris.data, iris.target

In [4]:
# Display the dimensions of the feature matrix.
X.shape

(150, 4)

In [5]:
# Display the dimensions of the target vector.
y.shape

(150,)

### Encrypting the data (X and y) using TenSEAL:

#### importing tenseal (for CKKS encryption):

In [6]:
import tenseal as ts
import utils

#### generating keys:

In [7]:
# Build a CKKS context with a polynomial modulus degree of 8192 and a
# coefficient-modulus chain of 60/40/40/60-bit primes.
context = ts.context(
    ts.SCHEME_TYPE.CKKS,
    poly_modulus_degree=8192,
    coeff_mod_bit_sizes=[60, 40, 40, 60],
)

In [8]:
# Generate the Galois keys on the context, then set the default encoding
# scale to 2**40 (the same bit width as the two middle primes chosen above).
context.generate_galois_keys()
context.global_scale = 2 ** 40

#### Storing Private key:

In [9]:
# Serialize the context together with its secret key and persist it.
# NOTE(review): this file contains the secret key -- keep it out of version
# control and away from any party that should only see ciphertexts.
secret_context = context.serialize(save_secret_key=True)
utils.write_data('keys1/secret.txt', secret_context)

#### Storing Public key:

In [10]:
# Derive the public context from a *copy* of `context`.
# make_context_public() drops the secret key in place; calling it on the
# shared `context` would silently turn it into a public-only context for every
# later cell and would make the "Storing Private key" cell fail if re-run.
public_ctx = context.copy()
public_ctx.make_context_public()

# Serialize the secret-key-free context and persist it for sharing.
public_context = public_ctx.serialize()
utils.write_data('keys1/public.txt', public_context)

### Encrypting X and y:

In [11]:
# Confirm the container type of the features before encrypting them.
type(X)

numpy.ndarray

In [12]:
# Confirm the container type of the targets before encrypting them.
type(y)

numpy.ndarray

#### A demo test:

##### Encrypting the salary variable using the secret-key context:

In [13]:
# Reload the context that was saved with its secret key.
context = ts.context_from(utils.read_data('keys1/secret.txt'))

# Encrypt a small sample vector as a CKKS vector and persist its serialized form.
salary = [1000, 2000, 3000]
salary_encrypted = ts.ckks_vector(context, salary)
utils.write_data(
    'demo_encrypted_objects/salary_encrypted.txt',
    salary_encrypted.serialize(),
)

#### Encrypting X and y:

In [14]:
from sklearn.model_selection import train_test_split

In [15]:
# Stratified 70/30 train/test split.
# A fixed random_state makes the split -- and therefore every encrypted
# artefact derived from it -- reproducible across kernel restarts.
RANDOM_STATE = 42
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.3, stratify=y, random_state=RANDOM_STATE
)
len(X_train), len(X_test), len(y_train), len(y_test)

(105, 45, 105, 45)

In [16]:
from time import time

# Encrypt the training set and report the elapsed wall-clock time.
# Each feature row becomes its own CKKS vector; the labels are packed
# together into a single CKKS vector.
t_start = time()
enc_x_train = list(ts.ckks_vector(context, row.tolist()) for row in X_train)
enc_y_train = ts.ckks_vector(context, y_train.tolist())
t_end = time()
print(f"Encryption of the training_set took {int(t_end - t_start)} seconds")

Encryption of the training_set took 0 seconds


In [17]:
# Encrypt the test set the same way as the training set: one CKKS vector per
# feature row, and a single CKKS vector holding all labels.
t_start = time()
enc_x_test = list(ts.ckks_vector(context, row.tolist()) for row in X_test)
enc_y_test = ts.ckks_vector(context, y_test.tolist())
t_end = time()
print(f"Encryption of the testing_set took {int(t_end-t_start)} seconds")

Encryption of the testing_set took 0 seconds


In [18]:
# The encrypted training features are held in a plain Python list.
type(enc_x_train)

list

In [19]:
# Inspect the first encrypted row; its repr shows only the object, not the plaintext values.
enc_x_train[0]

<tenseal.tensors.ckksvector.CKKSVector at 0x1c864695db0>

#### Storing the CKKS-encrypted variables in JSON files


In [20]:
import json

In [21]:
# Serialize every encrypted training row to raw bytes so it can be persisted.
# serialize() is a method of each CKKS vector, not of the Python list that
# collects the results, so nothing further is called on the list itself.
serialized_enc_x_train = [vec.serialize() for vec in enc_x_train]

In [22]:
# json cannot encode raw bytes, so each serialized vector is base64-encoded
# into an ASCII string first. Reverse with base64.b64decode() when loading.
encoded_enc_x_train = [
    base64.b64encode(blob).decode('ascii') for blob in serialized_enc_x_train
]
with open('encrypted_data_variables/enc_x_train.json', 'w') as f:
    json.dump(encoded_enc_x_train, f)

In [23]:
# A text-mode file accepts only str, not a list of bytes objects, so write one
# base64-encoded vector per line. Reverse with base64.b64decode() per line.
with open('encrypted_data_variables/enc_x_train.txt', 'w') as f:
    for blob in serialized_enc_x_train:
        f.write(base64.b64encode(blob).decode('ascii') + '\n')