In [1]:
import numpy as np
import h5py
import torch
import torch.utils.data as data_utils
from torch.utils.data.dataset import random_split
import numpy as np
from torch.autograd import Variable
import torch.nn as nn
import torch.optim as optim

  from ._conv import register_converters as _register_converters


# Helper Clases / Functions

In [2]:
def Load_Data(num):
    if (num == -1): # All data
        X_all = []
        y_all = []
        for i in range(8):
            file_path = './../project_datasets/A0' + str(i+1) + 'T_slice.mat'
            data = h5py.File(file_path, 'r')
            X = np.copy(data['image'])
            y = np.copy(data['type'])
            X = X[:, 0:23, :]
            X_all.append(X)
            y = y[0,0:X.shape[0]:1]
            y_all.append(y)
        A, N, E, T = np.shape(X_all)
        X_all = np.reshape(X_all, (A*N, E, T))
        y_all = np.reshape(y_all, (-1))
        y_all = y_all - 769
        ## Remove NAN
        index_Nan = []
        for i in range(A*N):
            for j in range(E):
                if (any(np.isnan(X_all[i,j])) == True):
                    index_Nan.append(i)
        index_Nan = list(set(index_Nan))
        X_all = np.delete(X_all, index_Nan, axis=0)
        y_all = np.delete(y_all, index_Nan)
        return (X_all, y_all)
    else:
        file_path = './../project_datasets/A0' + str(num) + 'T_slice.mat'
        data = h5py.File(file_path, 'r')
        X = np.copy(data['image'])
        y = np.copy(data['type'])
        X = X[:, 0:23, :]
        y = y[0,0:X.shape[0]:1]
        y = y - 769
         ## Remove NAN
        N, E, T = np.shape(X)
        index_Nan = []
        for i in range(N):
            for j in range(E):
                if (any(np.isnan(X[i,j])) == True):
                    index_Nan.append(i)
        index_Nan = list(set(index_Nan))
        X = np.delete(X, index_Nan, axis=0)
        y = np.delete(y, index_Nan)
        return (X, y)

# Load Data

In [3]:
X, y = Load_Data(-1) # -1 to load all datas
N, E, T = np.shape(X)
print (np.shape(X))

(2280, 23, 1000)


# Make DataLoaders

In [4]:
bs_train = 200
bs_val = 100
bs_test = 100
data = data_utils.TensorDataset(torch.Tensor(X), torch.Tensor(y))
dset = {}
dataloaders = {}
dset['train'], dset['val'], dset['test'] = random_split(data, [N-bs_val-bs_test, bs_val, bs_test])
dataloaders['train'] = data_utils.DataLoader(dset['train'], batch_size=bs_train, shuffle=True, num_workers=1)
dataloaders['val'] = data_utils.DataLoader(dset['val'], batch_size=bs_val, shuffle=True, num_workers=1)
dataloaders['test'] = data_utils.DataLoader(dset['test'], batch_size=bs_test, shuffle=True, num_workers=1)

# Define Model

In [92]:
class myGRU(nn.Module):
    def __init__(self, input_dim, hidden_dim, num_layer, num_class):
        super(myGRU, self).__init__()
        self.num_layer = num_layer
        self.hidden_dim = hidden_dim
        # First Inception layer
        self.conv11 = nn.Conv1d(23, 32, 2, stride=2)
        self.conv12 = nn.Conv1d(23, 32, 4, stride=2, padding=1)
        self.conv13 = nn.Conv1d(23, 32, 8, stride=2, padding=3)
        # Second Inception layer
        self.conv21 = nn.Conv1d(96, 32, 2, stride=2)
        self.conv22 = nn.Conv1d(96, 32, 4, stride=2, padding=1)
        self.conv23 = nn.Conv1d(96, 32, 8, stride=2, padding=3)
        # Third Inception layer
        self.conv31 = nn.Conv1d(96, 32, 2, stride=2)
        self.conv32 = nn.Conv1d(96, 32, 4, stride=2, padding=1)
        self.conv33 = nn.Conv1d(96, 32, 8, stride=2, padding=3)
        #self.conv_13 = nn.Conv2d()
        self.conv_elec = nn.Conv3d(1,23,tuple([40, 23, 1]))
        self.gru1 = nn.GRU(32*3, hidden_dim, num_layer)
        self.gru2 = nn.GRU(hidden_dim, hidden_dim, num_layer)
        self.gru3 = nn.GRU(hidden_dim, hidden_dim, num_layer)
        self.gru4 = nn.GRU(hidden_dim, hidden_dim, num_layer)
        self.classifier = nn.Linear(hidden_dim, num_class)
    def forward(self, x):
        out_conv11 = self.conv11(x)
        out_conv12 = self.conv12(x)
        out_conv13 = self.conv13(x)
        out_conv1 = torch.cat((out_conv11, out_conv12, out_conv13), 1)
        out_conv21 = self.conv21(out_conv1)
        out_conv22 = self.conv22(out_conv1)
        out_conv23 = self.conv23(out_conv1)
        out_conv2 = torch.cat((out_conv21, out_conv22, out_conv23), 1)
        out_conv31 = self.conv31(out_conv2)
        out_conv32 = self.conv32(out_conv2)
        out_conv33 = self.conv33(out_conv2)
        out_conv3 = torch.cat((out_conv31, out_conv32, out_conv33), 1)
        # N, C, L --> L, N, C
        out_conv3 = out_conv3.permute(2,0,1)
        out_gru1, _ = self.gru1(out_conv3)
        out_gru2, _ = self.gru2(out_gru1)
        out_gru3, _ = self.gru3(out_gru2)
        out_gru4, _ = self.gru4(out_gru3)
        out_gru4 = out_gru4[-1, :, :] # taking the last time seq
        out = self.classifier(out_gru4)
        return out
    def check_accuracy(self, dataloader):
        total_correct = 0
        total_label = 0
        for i_batch, sample_batched in enumerate(dataloader):
            X_sample, y_sample = sample_batched
            X_sample, y_sample = Variable(X_sample), Variable(y_sample)
            out = self.forward(X_sample.cuda())
            _, pred = torch.max(out, 1)
            num_correct = np.sum(pred.data.cpu().numpy() == y_sample.data.cpu().numpy())
            total_correct += num_correct
            total_label += len(pred)
        return  total_correct / total_label

In [99]:
dtype = torch.cuda.FloatTensor
hidden_dim = 128
num_classes = 4
num_epoches = 100
model = myGRU(E, hidden_dim, 1, num_classes)
model.type(dtype)
loss_fn = nn.CrossEntropyLoss().type(dtype)
optimizer = optim.Adam(model.parameters(), lr=1e-3)

# Conv Training

In [100]:
best_acc = 0.35

In [101]:
for epoch in range(num_epoches):
    for i, data in enumerate(dataloaders['train'], 0):
        X_train, y_train = data
        # Wrap them in Variable
        X_train, y_train = Variable(X_train), Variable(y_train)
        # forward + backward + optimize
        out = model(X_train.cuda())
        # print (out)
        loss = loss_fn(out, y_train.long().cuda())
        print('(%d batch) loss: %f' % (i, loss))
        # zero the parameter gradients
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
    train_acc = model.check_accuracy(dataloaders['train'])
    val_acc = model.check_accuracy(dataloaders['val'])
    print('(Epoch %d / %d) train_acc: %f; val_acc: %f' % (epoch+1, num_epoches, train_acc, val_acc))
    if (val_acc > best_acc):
        best_acc = val_acc
        torch.save(model, 'best_CHRONET.pt')

(0 batch) loss: 1.380186


RuntimeError: cuda runtime error (2) : out of memory at /pytorch/torch/lib/THC/generic/THCStorage.cu:58

# Best Model Test

In [10]:
best_model = torch.load('best_CHRONET.pt')
print (best_model.check_accuracy(dataloaders['val']))

0.35


