In [10]:
import argparse
import numpy as np
from itertools import count

import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch.distributions import Categorical

In [11]:
import syft as sy

hook = sy.TorchHook(torch)

def connect_to_workers(n_workers):
    return [
        sy.VirtualWorker(hook, id=f"worker{i+1}")
        for i in range(n_workers)
    ]
def connect_to_crypto_provider():
    return sy.VirtualWorker(hook, id="crypto_provider")

workers = connect_to_workers(n_workers=2)
crypto_provider = connect_to_crypto_provider()



In [12]:
import pandas as pd
import numpy as np

def getSamples(filename):
    data = pd.read_csv(filename, sep='\t')
    return data.values[:,1:].transpose()

data1 = getSamples("GSE2034-Normal-train.txt")
data2 = getSamples("GSE2034-Tumor-train.txt")

data1Label = np.zeros(len(data1)).reshape((-1, 1))
data2Label = np.ones(len(data2)).reshape((-1, 1))
x = np.concatenate((data1, data2))
y = np.concatenate((data1Label, data2Label))

In [13]:
# We don't use the whole dataset for efficiency purpose, but feel free to increase these numbers
n_train_items = 181
n_test_items = 46

# partition the data into training data and test data
x_train = x[:n_train_items]
y_train = y[:n_train_items]

x_test = x[n_train_items:]
y_test = x[n_train_items:]            

In [4]:

def get_private_data_loaders(precision_fractional, workers, crypto_provider):
    
    def one_hot_of(index_tensor):#Transforms to one hot tensor
     
        onehot_tensor = torch.zeros(*index_tensor.shape, 2) # 2 Output classes
        onehot_tensor = onehot_tensor.scatter(1, index_tensor.view(-1, 1), 1)
        return onehot_tensor
        
    def secret_share(tensor): #Transforms to fixed precision and secret share a tensor

        return (
            tensor
            .fix_precision(precision_fractional=precision_fractional)
            .share(*workers, crypto_provider=crypto_provider, requires_grad=True)
        )
    
    transformation = transforms.Compose([
        transforms.ToTensor(),
        transforms.Normalize((0.1307,), (0.3081,))
    ])
    
    private_train_loader = [
        (secret_share(data), secret_share(one_hot_of(target)))
        for i, (data, target) in enumerate(#Training Set)
        if i < n_train_items / args.batch_size
    ]
    
    private_test_loader = [
        (secret_share(data), secret_share(target.float()))
        for i, (data, target) in enumerate(#Testing Set)
        if i < n_test_items / args.test_batch_size
    ]
    
    return private_train_loader, private_test_loader
    
    
private_train_loader, private_test_loader = get_private_data_loaders(
    precision_fractional=args.precision_fractional,
    workers=workers,
    crypto_provider=crypto_provider
)

SyntaxError: invalid syntax (<ipython-input-4-67515ade8122>, line 29)

In [14]:
dim = 12634

class Res1d(nn.Module):
    # the conv layers
    def __init__(self, inSize, outSize, kernel=(3,), strides=1,):
        super(Res1d, self).__init__()
        # hard-coded to do the padding correctly
        if inSize in (16,64,128,512) and strides is 2:
            pding = 0
        else:
            pding = 1
        self.l1 = nn.Conv1d(inSize, outSize, kernel, stride=strides, padding=pding, bias=False)
        self.l2 = nn.InstanceNorm1d(outSize)
        
        if strides > 1 or inSize != outSize:
            if strides > 1:
                self.r1 = nn.Identity()
                self.r2 = nn.AvgPool1d(strides)
            else:
                self.r1 = None
                self.r2 = None
            self.r3 = nn.Conv1d(inSize, outSize, 1, bias=False)
            self.r4 = nn.InstanceNorm1d(outSize)
    
        self.relu = nn.ReLU()
        
    def forward(self, x):
        l = self.l1(x)
        l = self.l2(l)
        
        if self.r1 is not None:
            r = self.r1(x)
            r = self.r2(r)
            r = self.r3(r)
            r = self.r4(r)
        else:
            r = self.r3(x)
            r = self.r4(r)
            
        x = l + r
        return self.relu(x)
    
class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.l1 = nn.Linear(dim, 64)
        self.l2 = nn.ReLU()
        
        self.r1 = Res1d(1, 4, 3)
        
        self.r2 = Res1d(4, 8, 3)
        self.r3 = Res1d(8, 8, 3, strides=2)
        
        self.r4 = Res1d(8, 16, 3)
        self.r5 = Res1d(16, 16, 3, strides=2)
        
        self.r6 = Res1d(16, 32, 3)
        self.r7 = Res1d(32, 32, 3, strides=2)
        
        self.r8 = Res1d(32, 64, 3)
        self.r9 = Res1d(64, 64, 3, strides=2)
        
        self.r10 = Res1d(64, 128, 3)
        self.r11 = Res1d(128, 128, 3, strides=2)
        
        self.r12 = Res1d(128, 256, 3)
        self.r13 = Res1d(256, 256, 3, strides=2)
        
        self.r14 = Res1d(256, 512, 3)
        self.r15 = Res1d(512, 512, 3, strides=2)
        
        self.r16 = Res1d(512, 1024, 3)
        self.r17 = Res1d(1024, 1024, 3, strides=2)
        
        # size is by experiment and hardcode
        self.lastLinear = nn.Linear(50240,32)
        self.lastRelu = nn.ReLU()
        self.lastAgg = nn.Linear(32,1)
        self.lastSigmoid = nn.Sigmoid()
    
    def forward(self, x):
        # shape is (batch, channel, time)
        l = x
        l = self.l2(self.l1(l))
        
        # conv layers should operate on time
        r = x
        r = self.r4(self.r3(self.r2(self.r1(r))))
        r = self.r8(self.r7(self.r6(self.r5(r))))
        r = self.r12(self.r11(self.r10(self.r9(r))))
        r = self.r16(self.r15(self.r14(self.r13(r))))
        r = self.r17(r)
        
        # flatten l
        r = r.view(x.shape[0],1, -1)
        y = torch.cat((l,r),-1)
        y = self.lastLinear(y)
        y = self.lastRelu(y)
        y = self.lastAgg(y)
        y = self.lastSigmoid(y)
        return y

In [15]:
device = torch.device("cuda")
net = Net().to(device)


RuntimeError: CUDA error: out of memory

In [16]:
input_test = torch.randn(80, 1, dim).float().cuda()
out = net(input_test).cuda()
out.shape

RuntimeError: CUDA error: out of memory

# Train the model

In [17]:
# get the data into (batch, channel = 1, length=dim)
data_torch = torch.from_numpy(x).view([-1, 1, dim]).float()
label_torch = torch.from_numpy(y).view([-1,1,1]).float()

In [18]:
import torch.optim as optim
criterion = nn.BCELoss() # Binary Cross Entropy 
optimizer = optim.SGD(net.parameters(), lr=0.001, momentum=0.9)

NameError: name 'net' is not defined

In [19]:
test_inputs = torch.from_numpy(x_test).view([-1, 1, dim]).float().cuda()
test_labels = torch.from_numpy(y_test).view([-1, 1]).float().cuda()

for batch in range(1000):  # loop over the dataset multiple times
    # get the inputs; data is a list of [inputs, labels]
    indices = np.random.choice(len(x_train), size=(30))
    inputs = x_train[indices]
    labels = x_train[indices]
    
    inputs = torch.from_numpy(inputs).view([-1, 1, dim]).float().cuda()
    labels = torch.from_numpy(labels).view([-1, 1]).float().cuda()
    
    # zero the parameter gradients
    optimizer.zero_grad()

    # forward + backward + optimize
    outputs = net(inputs).view([-1,1]).cuda()
    loss = criterion(outputs, labels).cuda()
    loss.backward()
    optimizer.step()
    
    if batch % 10 == 0:
        outputs = net(test_inputs).view([-1,1]).cuda()
        loss = criterion(outputs, labels).cuda()
        print(batch / 10 + 1, "% Trained", "loss = ", loss)

print('Finished Training')

RuntimeError: CUDA error: out of memory

In [20]:
# MPC learning
net

NameError: name 'net' is not defined

In [10]:
net(data_torch.cuda())

tensor([[[4.0814e-04]],

        [[5.1038e-04]],

        [[3.8278e-04]],

        [[5.1896e-04]],

        [[2.9317e-04]],

        [[5.0704e-04]],

        [[3.5465e-04]],

        [[4.4371e-04]],

        [[2.9039e-04]],

        [[2.7970e-04]],

        [[3.3898e-04]],

        [[3.3784e-04]],

        [[4.0894e-04]],

        [[4.3664e-04]],

        [[4.4219e-04]],

        [[2.9098e-04]],

        [[3.6885e-04]],

        [[2.3485e-04]],

        [[2.8562e-04]],

        [[2.7229e-04]],

        [[3.4142e-04]],

        [[9.8182e-05]],

        [[4.3720e-04]],

        [[3.4343e-04]],

        [[3.3708e-04]],

        [[2.5448e-04]],

        [[4.7543e-04]],

        [[3.2778e-04]],

        [[4.2785e-04]],

        [[3.9049e-04]],

        [[3.3560e-04]],

        [[4.1627e-04]],

        [[1.9340e-04]],

        [[3.6553e-04]],

        [[1.3619e-04]],

        [[3.9539e-04]],

        [[1.6606e-04]],

        [[3.8498e-04]],

        [[3.8387e-04]],

        [[3.4144e-04]],

