### Imports and training configuration

In [1]:
import torch
import syft as sy
import argparse
import numpy as np
import pandas as pd

import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch.distributions import Categorical
from torchvision import transforms
from torchvision import datasets, transforms

import time
print("torch version:", torch.__version__)
print("syft version:", sy.__version__)

torch version: 1.3.0
syft version: 0.2.0a2


In [2]:
def getSamples(filename):
    """Load a tab-separated table and return it with one file column per row.

    The file is parsed by pandas (its first line is taken as the header),
    the first column is discarded and the remaining matrix is transposed,
    so each remaining column of the file becomes one row of the result.

    Args:
        filename: Path of the tab-separated text file to read.

    Returns:
        A 2-D NumPy array of shape (number of columns - 1, number of rows).
    """
    table = pd.read_csv(filename, sep="\t")
    # Convert first, slice second: the array dtype is decided on the whole
    # table, exactly as in a single `to_numpy()[:, 1:]` expression.
    matrix = table.to_numpy()
    without_first_column = matrix[:, 1:]
    return without_first_column.T

dim = 12634  # number of features per sample; samples are reshaped to (1, dim) below
data1 = getSamples("GSE2034-Normal-train.txt")
data2 = getSamples("GSE2034-Tumor-train.txt")

# Labels as column vectors: 0 for every row loaded from the "Normal" file,
# 1 for every row loaded from the "Tumor" file.
data1Label = np.zeros((len(data1), 1))
data2Label = np.ones((len(data2), 1))
x = np.concatenate((data1, data2))
y = np.concatenate((data1Label, data2Label))

# Fail early instead of letting the reshapes below silently regroup values
# into the wrong number of samples when the files do not match `dim`.
assert x.shape[1] == dim, f"expected {dim} features per sample, got {x.shape[1]}"

# Shuffle the data. A dedicated, seeded generator makes the train/test split
# reproducible across kernel restarts without touching NumPy's global RNG.
SPLIT_SEED = 0
idx = np.random.RandomState(SPLIT_SEED).permutation(len(x))
x, y = x[idx], y[idx]

# Features and label side by side, one row per sample.
z = np.concatenate((x, y), axis=1)

# We follow an 80/20 partitioning for the training and testing sets.
# The sizes are derived from the data rather than hard-coded, so the split
# stays consistent if the input files change.
n_train_items = int(0.8 * len(x))
n_test_items = len(x) - n_train_items

# Partition the shuffled data into training data and test data, shaped as
# (batch, channel=1, length=dim) for the features and (batch, 1) for labels.
x_train = x[:n_train_items].reshape((-1, 1, dim))
y_train = y[:n_train_items].reshape((-1, 1))

x_test = x[n_train_items:].reshape((-1, 1, dim))
y_test = y[n_train_items:].reshape((-1, 1))

In [3]:
# Whole (shuffled) data set as float32 tensors:
# features as (batch, channel=1, length=dim), labels as (batch, 1, 1).
data_torch = torch.from_numpy(x).float().view(-1, 1, dim)
label_torch = torch.from_numpy(y).float().view(-1, 1, 1)

### Deep Learning Model applied to GSE2034

In [4]:
dim = 12634  # input length per sample (same value as in the data-loading cell); read by Net for its first Linear layer

class Res1d(nn.Module):
    """Residual 1-D convolution block: ``ReLU(left(x) + right(x))``.

    * left  (``self.l``): ``Conv1d`` with the given kernel and stride,
      followed by ``InstanceNorm1d``.
    * right (``self.r``): ``AvgPool1d(strides)`` when ``strides > 1``
      (otherwise an identity), then a 1x1 ``Conv1d`` and ``InstanceNorm1d``.

    Both branches must produce the same length so they can be added.  For a
    kernel of 3 and a stride of 2 the convolution yields
    ``floor((L + 2*pad - 3) / 2) + 1`` positions while ``AvgPool1d(2)``
    yields ``floor(L / 2)``; these agree with ``pad=1`` when ``L`` is even
    and with ``pad=0`` when ``L`` is odd.  The padding is therefore chosen
    from a hard-coded list of input channel counts: for the network in this
    notebook (input length 12634) those are the strided stages that receive
    an odd length.

    Args:
        inSize: Number of input channels.
        outSize: Number of output channels.
        kernel: Kernel size of the left convolution.
        strides: Stride of the left convolution and pooling size of the
            right branch.
    """

    def __init__(self, inSize, outSize, kernel=(3,), strides=1,):
        super(Res1d, self).__init__()

        # Left, kernel size 3.
        # Hard-coded so that both branches end up with the same length
        # (see the class docstring).
        if inSize in (16,64,128,512) and strides > 1:
            pding = 0
        else:
            pding = 1

        self.l = nn.Sequential(
            nn.Conv1d(inSize, outSize, kernel, stride=strides, padding=pding, bias=False),
            nn.InstanceNorm1d(outSize)
        )

        # Right, kernel size 1.
        # `r1` is always assigned.  It used to be set only when the block
        # changed the channel count or the length, so a shape-preserving
        # block (inSize == outSize, strides == 1) crashed with an
        # AttributeError while building `self.r` below.
        if strides > 1:
            self.r1 = nn.AvgPool1d(strides)
        else:
            self.r1 = nn.Identity()

        self.r = nn.Sequential(
            self.r1,
            nn.Conv1d(inSize, outSize, 1, bias=False),
            nn.InstanceNorm1d(outSize)
        )

        self.relu = nn.ReLU()

    def forward(self, x):
        """Apply both branches to ``x`` (batch, inSize, length), add them, apply ReLU."""
        x = self.l(x) + self.r(x)
        return self.relu(x)
    


class Net(nn.Module):
    """Two-branch binary classifier for inputs of shape (batch, 1, dim).

    * ``self.l``: dense branch, ``Linear(dim, 64)`` + ReLU on the last axis.
    * ``self.r``: convolutional branch, a stack of 17 ``Res1d`` blocks
      (channels 1 -> 4 -> 8 -> ... -> 1024, every second block with stride
      2) followed by ``Flatten``.
    * ``self.last``: head applied to the concatenation of both branches,
      ``Linear(50240, 32)`` + ReLU + ``Linear(32, 1)`` + Sigmoid.
    """

    def __init__(self):
        super(Net, self).__init__()

        # Dense branch.
        self.l = nn.Sequential(nn.Linear(dim, 64), nn.ReLU())

        # Convolutional branch: after the stem, each step first widens the
        # channels at stride 1 and then halves the length at stride 2.
        stages = [Res1d(1, 4, 3)]
        channel_steps = (
            (4, 8), (8, 16), (16, 32), (32, 64),
            (64, 128), (128, 256), (256, 512), (512, 1024),
        )
        for narrow, wide in channel_steps:
            stages.append(Res1d(narrow, wide, 3))
            stages.append(Res1d(wide, wide, 3, strides=2))
        stages.append(nn.Flatten())
        self.r = nn.Sequential(*stages)

        # Head. The input size is hard-coded and was found by experiment:
        # 64 dense features plus the flattened convolutional output.
        self.last = nn.Sequential(
            nn.Linear(50240, 32),
            nn.ReLU(),
            nn.Linear(32, 1),
            nn.Sigmoid(),
        )

    def forward(self, x):
        """Return one sigmoid score per sample; ``x`` is (batch, channel, time)."""
        dense = self.l(x)
        conv = self.r(x)
        conv.unsqueeze_(-2)  # re-insert the channel axis removed by Flatten
        merged = torch.cat((dense, conv), dim=-1)
        return self.last(merged)


In [5]:
# Use the GPU when one is available; fall back to the CPU instead of failing
# at model creation on machines without CUDA.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
net = Net().to(device)

#from torchsummary import summary
#summary(net,(1,12634))

In [6]:
# `optim` is already imported in the first cell; this repeats that import.
import torch.optim as optim
# Binary cross entropy on probabilities: Net ends with a Sigmoid, so its
# outputs can be fed to BCELoss directly.
criterion = nn.BCELoss() # Binary Cross Entropy 
# Plain SGD with momentum over all parameters of the plain-data model `net`.
optimizer = optim.SGD(net.parameters(), lr=0.001, momentum=0.9)

### Training on plain data

In [7]:
# Held-out split on the same device as the model.
# NOTE(review): these two tensors are not used anywhere in this cell.
test_inputs = torch.from_numpy(x_test).view([-1, 1, dim]).float().to(device)
test_labels = torch.from_numpy(y_test).view([-1, 1]).float().to(device)

for batch in range(100):  # 100 optimisation steps, one random mini-batch each
    # Draw 30 training rows; np.random.choice samples with replacement by default.
    indices = np.random.choice(len(x_train), size=(30))

    # Move the mini-batch to the device the model lives on (`device` from the
    # model-creation cell) rather than assuming CUDA.
    inputs = torch.from_numpy(x_train[indices]).float().to(device)
    labels = torch.from_numpy(y_train[indices]).float().to(device)

    # zero the parameter gradients
    optimizer.zero_grad()

    # forward + backward + optimize
    # The model output and the loss are already on `device`, so no further
    # transfer is needed; the output (batch, 1, 1) is flattened to (batch, 1)
    # to match the label shape.
    outputs = net(inputs).view([-1,1])
    loss = criterion(outputs, labels)
    loss.backward()
    optimizer.step()

    print(batch, "% Trained", "loss = ", loss.item())

print('Finished Training')

0 % Trained loss =  0.7175427675247192
1 % Trained loss =  0.5960087180137634
2 % Trained loss =  0.8237826228141785
3 % Trained loss =  0.6514562964439392
4 % Trained loss =  0.5533632636070251
5 % Trained loss =  0.6631456017494202
6 % Trained loss =  0.644184947013855
7 % Trained loss =  0.6296128630638123
8 % Trained loss =  0.5669456720352173
9 % Trained loss =  0.5513830780982971
10 % Trained loss =  0.5824121832847595
11 % Trained loss =  0.5907394289970398
12 % Trained loss =  0.4805615544319153
13 % Trained loss =  0.47551998496055603
14 % Trained loss =  0.43236055970191956
15 % Trained loss =  0.442240834236145
16 % Trained loss =  0.4249318242073059
17 % Trained loss =  0.4000908434391022
18 % Trained loss =  0.5188621878623962
19 % Trained loss =  0.37506961822509766
20 % Trained loss =  0.2837182581424713
21 % Trained loss =  0.28202465176582336
22 % Trained loss =  0.43621012568473816
23 % Trained loss =  0.20410969853401184
24 % Trained loss =  0.17711634933948517
25 % 

In [8]:
# Display the module tree of the trained plain-data model.
net

Net(
  (l): Sequential(
    (0): Linear(in_features=12634, out_features=64, bias=True)
    (1): ReLU()
  )
  (r): Sequential(
    (0): Res1d(
      (l): Sequential(
        (0): Conv1d(1, 4, kernel_size=(3,), stride=(1,), padding=(1,), bias=False)
        (1): InstanceNorm1d(4, eps=1e-05, momentum=0.1, affine=False, track_running_stats=False)
      )
      (r1): Identity()
      (r): Sequential(
        (0): Identity()
        (1): Conv1d(1, 4, kernel_size=(1,), stride=(1,), bias=False)
        (2): InstanceNorm1d(4, eps=1e-05, momentum=0.1, affine=False, track_running_stats=False)
      )
      (relu): ReLU()
    )
    (1): Res1d(
      (l): Sequential(
        (0): Conv1d(4, 8, kernel_size=(3,), stride=(1,), padding=(1,), bias=False)
        (1): InstanceNorm1d(8, eps=1e-05, momentum=0.1, affine=False, track_running_stats=False)
      )
      (r1): Identity()
      (r): Sequential(
        (0): Identity()
        (1): Conv1d(4, 8, kernel_size=(1,), stride=(1,), bias=False)
        (2

In [9]:
# Score the whole data set with the trained plain-data model.
# Inference needs no gradients: running under no_grad avoids building an
# autograd graph for every sample in the data set.
input_data = data_torch.to(device)
with torch.no_grad():
    predictions = net(input_data)
predictions

tensor([[[0.0041]],

        [[0.0057]],

        [[0.9967]],

        [[0.9970]],

        [[0.9970]],

        [[0.0034]],

        [[0.9967]],

        [[0.9995]],

        [[0.9969]],

        [[0.0047]],

        [[0.9980]],

        [[0.9965]],

        [[0.9975]],

        [[0.0035]],

        [[0.0029]],

        [[0.9978]],

        [[0.9969]],

        [[0.9961]],

        [[0.0083]],

        [[0.9970]],

        [[0.9966]],

        [[0.9983]],

        [[0.9961]],

        [[0.9991]],

        [[0.9986]],

        [[0.9973]],

        [[0.0016]],

        [[0.9979]],

        [[0.9971]],

        [[0.0041]],

        [[0.0053]],

        [[0.9978]],

        [[0.9987]],

        [[0.0107]],

        [[0.0046]],

        [[0.0041]],

        [[0.9974]],

        [[0.9979]],

        [[0.9960]],

        [[0.9982]],

        [[0.9965]],

        [[0.0100]],

        [[0.9897]],

        [[0.9972]],

        [[0.9982]],

        [[0.0061]],

        [[0.9977]],

        [[0.0

### Setup of the secure environment

In [10]:
# PySyft hook around torch; it is passed to every VirtualWorker created below.
hook = sy.TorchHook(torch)

def connect_to_workers(n_workers):
    """Create `n_workers` virtual workers with ids "worker1", "worker2", ...

    Args:
        n_workers: Number of workers to create.

    Returns:
        A list of `sy.VirtualWorker` objects in id order.
    """
    created = []
    for position in range(1, n_workers + 1):
        created.append(sy.VirtualWorker(hook, id=f"worker{position}"))
    return created

def connect_to_crypto_provider():
    """Create and return the virtual worker with id "crypto_provider"."""
    provider = sy.VirtualWorker(hook, id="crypto_provider")
    return provider

# Two workers that will hold the secret shares, plus a separate worker that
# is passed as `crypto_provider` whenever tensors or the model are shared.
workers = connect_to_workers(n_workers=2)
crypto_provider = connect_to_crypto_provider()

def get_private_data_loaders(precision_fractional, workers, crypto_provider):
    """Build secret-shared mini-batches of the training and test splits.

    Reads the module-level arrays `x_train`, `y_train`, `x_test`, `y_test`
    and cuts each split into consecutive batches of 5 samples (the last
    batch of a split may be smaller).  Every batch is converted to fixed
    precision and secret-shared among `workers`.

    Each split is batched over its own length.  The test split used to be
    indexed with the training-set size, which appended batches sliced past
    the end of `x_test`, i.e. empty batches.

    Args:
        precision_fractional: Number of fractional digits kept by the
            fixed-precision encoding.
        workers: Workers that receive the shares.
        crypto_provider: Worker passed to `share` as crypto provider.

    Returns:
        A tuple `(private_train_loader, private_test_loader)`; each element
        is a list of `(shared_features, shared_labels)` pairs.
    """
    batch_size = 5

    def secret_share(tensor):
        # Transform to fixed precision, then secret-share the tensor.
        return (
            tensor
            .fix_precision(precision_fractional=precision_fractional)
            .share(*workers, crypto_provider=crypto_provider, requires_grad=True)
        )

    def private_batches(features, labels):
        # One (features, labels) pair of shared tensors per consecutive slice.
        return [
            (
                secret_share(torch.Tensor(features[start:start + batch_size])),
                secret_share(torch.Tensor(labels[start:start + batch_size])),
            )
            for start in range(0, len(features), batch_size)
        ]

    private_train_loader = private_batches(x_train, y_train)
    private_test_loader = private_batches(x_test, y_test)
    return private_train_loader, private_test_loader
    
    
# Secret-share both splits, keeping 3 fractional digits in the
# fixed-precision encoding.
private_train_loader, private_test_loader = get_private_data_loaders(
    precision_fractional=3,
    workers=workers,
    crypto_provider=crypto_provider
)

### Model for encrypted data

In [11]:
class Res1d(nn.Module):
    """Residual 1-D convolution block used by the encrypted model.

    Computes ``relu(left(x) + right(x))`` where

    * left  = ``l1`` (``Conv1d`` with the given kernel/stride) then ``l2``,
    * right = ``r1`` then ``r2`` (``AvgPool1d(strides)``; both only when
      ``strides > 1``), then ``r3`` (1x1 ``Conv1d``) then ``r4``.

    ``l2``, ``r1`` and ``r4`` are ``nn.Identity`` layers; this block contains
    no normalisation layer.

    Args:
        inSize: Number of input channels.
        outSize: Number of output channels.
        kernel: Kernel size of the left convolution.
        strides: Stride of the left convolution and pooling size of the
            right branch.
    """

    def __init__(self, inSize, outSize, kernel=(3,), strides=1,):
        super(Res1d, self).__init__()
        self.inSize = inSize
        self.outSize = outSize

        # Hard-coded so that the strided convolution and the average pooling
        # produce the same length: padding 0 for the listed channel counts,
        # padding 1 otherwise.  Compared by value (`==`); `is` on an int
        # tests object identity and only works by implementation accident.
        if inSize in (16,64,128,512) and strides == 2:
            pding = 0
        else:
            pding = 1
        self.l1 = nn.Conv1d(inSize, outSize, kernel, stride=strides, padding=pding, bias=False)
        self.l2 = nn.Identity()

        # The right branch is always fully defined.  It used to be skipped
        # for shape-preserving blocks (inSize == outSize, strides == 1),
        # which made forward() fail with an AttributeError.
        if strides > 1:
            self.r1 = nn.Identity()
            self.r2 = nn.AvgPool1d(strides)
        else:
            # No pooling needed at stride 1; forward() checks r1 for None.
            self.r1 = None
            self.r2 = None
        self.r3 = nn.Conv1d(inSize, outSize, 1, bias=False)
        self.r4 = nn.Identity()

    def forward(self, x):
        """Apply both branches to ``x`` (batch, inSize, length) and add them."""
        l = self.l2(self.l1(x))

        r = x
        if self.r1 is not None:
            r = self.r2(self.r1(r))
        r = self.r4(self.r3(r))

        x = l + r
        # Progress trace: one line per block and forward pass.
        print("forwarding: ", self.inSize, self.outSize)
        return F.relu(x)
    
class Net(nn.Module):
    """Two-branch binary classifier written with individually named layers.

    * dense branch: ``l1`` (``Linear(dim, 64)``) followed by ``l2`` (ReLU),
      applied to the flattened input;
    * convolutional branch: ``r1`` ... ``r17``, seventeen ``Res1d`` blocks
      (channels 1 -> 4 -> 8 -> ... -> 1024, every second block with stride
      2), applied to the (batch, channel, time) input;
    * head: ``lastLinear`` -> ReLU -> ``lastAgg`` -> ``lastSigmoid`` on the
      concatenation of both branches.
    """

    # (in_channels, out_channels, stride) of r1 ... r17, in order.
    _BLOCK_SPECS = (
        (1, 4, 1),
        (4, 8, 1), (8, 8, 2),
        (8, 16, 1), (16, 16, 2),
        (16, 32, 1), (32, 32, 2),
        (32, 64, 1), (64, 64, 2),
        (64, 128, 1), (128, 128, 2),
        (128, 256, 1), (256, 256, 2),
        (256, 512, 1), (512, 512, 2),
        (512, 1024, 1), (1024, 1024, 2),
    )

    def __init__(self):
        super(Net, self).__init__()
        self.l1 = nn.Linear(dim, 64)
        self.l2 = F.relu

        # Registers the blocks under the attribute names r1 ... r17.
        for number, (c_in, c_out, stride) in enumerate(self._BLOCK_SPECS, start=1):
            setattr(self, f"r{number}", Res1d(c_in, c_out, 3, strides=stride))

        # The input size of the head is hard-coded and was found by experiment.
        self.lastLinear = nn.Linear(50240, 32)
        self.lastRelu = F.relu
        self.lastAgg = nn.Linear(32, 1)
        self.lastSigmoid = nn.Sigmoid()

    def forward(self, x):
        """Return one sigmoid score per sample; ``x`` is (batch, channel, time)."""
        n_samples = x.shape[0]

        # Dense branch on the flattened input.
        dense = self.l2(self.l1(x.view(n_samples, -1)))

        # Convolutional branch: the blocks operate along the time axis.
        conv = x
        for number in range(1, len(self._BLOCK_SPECS) + 1):
            conv = getattr(self, f"r{number}")(conv)

        # Flatten both branches to (batch, features) and join them.
        conv = conv.view(n_samples, -1)
        dense = dense.view(n_samples, -1)
        merged = torch.cat((dense, conv), dim=1)

        hidden = self.lastRelu(self.lastLinear(merged))
        return self.lastSigmoid(self.lastAgg(hidden))

### Private Training of the model

In [12]:
def train(model, private_train_loader, optimizer, epoch):
    """Run one pass of gradient steps over the private training batches.

    For every `(data, target)` pair the mean squared error between the
    model output and the target is minimised: gradients are reset, the loss
    is back-propagated and the optimizer takes one step.

    Args:
        model: Model to train; switched to training mode first.
        private_train_loader: Iterable of `(data, target)` batches.
        optimizer: Optimizer bound to the model parameters.
        epoch: Epoch number (accepted but not used in the body).
    """
    model.train()
    for data, target in private_train_loader:  # batches of the private dataset
        print('training...')
        start_time = time.time()  # taken per batch; not read afterwards
        optimizer.zero_grad()

        prediction = model(data)

        # Sum of squared errors, refreshed, then averaged over the batch.
        squared_error = (prediction - target) ** 2
        total_error = squared_error.sum().refresh()
        loss = total_error / prediction.shape[0]

        loss.backward()
        optimizer.step()

        
#Although the aim of this project was to provide private training, we prepared code for testing as well
def test(model, private_test_loader):
    """Run the model over the private test batches and count matching predictions.

    Args:
        model: Model to evaluate; switched to evaluation mode first.
        private_test_loader: Iterable of `(data, target)` batches.

    Returns:
        None.  NOTE(review): the decoded `correct` count is assigned on the
        last line but neither returned nor printed, so callers never see it.
    """
    print('testing...')
    model.eval()
    test_loss = 0  # never updated or read below
    correct = 0
    with torch.no_grad():
        for data, target in private_test_loader:
            start_time = time.time()  # not read afterwards
            
            output = model(data)
            # NOTE(review): the encrypted Net ends with Linear(32, 1) + Sigmoid,
            # so `output` presumably has a single column; argmax over dim=1
            # would then be 0 for every sample regardless of the score.
            # Confirm, and consider thresholding the score instead.
            pred = output.argmax(dim=1)
            correct += pred.eq(target.view_as(pred)).sum()

    # Fetch the accumulated count from the workers and decode it from fixed
    # precision.  NOTE(review): with an empty loader `correct` is still the
    # int 0 here, which has no `.get()`.
    correct = correct.get().float_precision()

In [13]:
# `Net` resolves to the most recent definition in the notebook, i.e. the
# encrypted-data variant defined after the secure-environment setup.
model = Net()
# Encode the parameters in fixed precision and secret-share them among the workers.
model = model.fix_precision().share(*workers, crypto_provider=crypto_provider, requires_grad=True)

# Plain SGD (no momentum), converted to fixed precision like the model.
optimizer = optim.SGD(model.parameters(), lr=0.001)
optimizer = optimizer.fix_precision() 
for epoch in range(1, 2):  # a single epoch (epoch == 1)
    train(model, private_train_loader, optimizer, epoch)
    test(model, private_test_loader)

training...
forwarding:  1 4
forwarding:  4 8
forwarding:  8 8
forwarding:  8 16
forwarding:  16 16
forwarding:  16 32
forwarding:  32 32
forwarding:  32 64
forwarding:  64 64
forwarding:  64 128
forwarding:  128 128
forwarding:  128 256
forwarding:  256 256
forwarding:  256 512
forwarding:  512 512
forwarding:  512 1024
forwarding:  1024 1024
training...
forwarding:  1 4
forwarding:  4 8
forwarding:  8 8
forwarding:  8 16
forwarding:  16 16
forwarding:  16 32
forwarding:  32 32
forwarding:  32 64
forwarding:  64 64
forwarding:  64 128
forwarding:  128 128
forwarding:  128 256
forwarding:  256 256
forwarding:  256 512
forwarding:  512 512
forwarding:  512 1024
forwarding:  1024 1024
training...
forwarding:  1 4
forwarding:  4 8
forwarding:  8 8
forwarding:  8 16
forwarding:  16 16
forwarding:  16 32
forwarding:  32 32
forwarding:  32 64
forwarding:  64 64
forwarding:  64 128
forwarding:  128 128
forwarding:  128 256
forwarding:  256 256
forwarding:  256 512
forwarding:  512 512
forward

forwarding:  256 256
forwarding:  256 512
forwarding:  512 512
forwarding:  512 1024
forwarding:  1024 1024
training...
forwarding:  1 4
forwarding:  4 8
forwarding:  8 8
forwarding:  8 16
forwarding:  16 16
forwarding:  16 32
forwarding:  32 32
forwarding:  32 64
forwarding:  64 64
forwarding:  64 128
forwarding:  128 128
forwarding:  128 256
forwarding:  256 256
forwarding:  256 512
forwarding:  512 512
forwarding:  512 1024
forwarding:  1024 1024
training...
forwarding:  1 4
forwarding:  4 8
forwarding:  8 8
forwarding:  8 16
forwarding:  16 16
forwarding:  16 32
forwarding:  32 32
forwarding:  32 64
forwarding:  64 64
forwarding:  64 128
forwarding:  128 128
forwarding:  128 256
forwarding:  256 256
forwarding:  256 512
forwarding:  512 512
forwarding:  512 1024
forwarding:  1024 1024
training...
forwarding:  1 4
forwarding:  4 8
forwarding:  8 8
forwarding:  8 16
forwarding:  16 16
forwarding:  16 32
forwarding:  32 32
forwarding:  32 64
forwarding:  64 64
forwarding:  64 128
forw

RuntimeError: shape '[1]' is invalid for input of size 5