# Experiment 5: Scattering Features + CNN Model




In [250]:
import sys
sys.path.append('../src')

from utils.reduce import reduce_pca
from utils.split import train_test_split, train_test_split_pytorch
from utils.UltrasoundDataset import UltrasoundDataset
from utils.Networks import  BasicBlock, Scattering2dResNet
from torch.utils.data import Dataset, DataLoader
import torch.nn.functional as F
from torch.autograd import Variable
from kymatio.torch import Scattering2D
import argparse
import torch.nn as nn
import torch.nn.functional as F
import torchvision.transforms as transforms
import torch.optim
import pickle
import pandas as pd
import numpy as np
import mlflow
import matplotlib.pyplot as plt

In [251]:
#mlflow.set_experiment('scattering_linear_experiment')

## Upload Ultrasound images

In [252]:
with open('../data/02_interim/bmodes_steatosis_assessment_IJCARS.pickle', 'rb') as handle:
    df = pickle.load(handle)

In [253]:
M, N= 434, 636 # ultrasound image dimension

In [254]:
def resize2d(img, size):
    return (F.adaptive_avg_pool2d(Variable(img,volatile=True), size)).data
# downsampling
df['img'] = df['img'].apply(lambda x: resize2d(x, (32,32)))
df['img'] = df['img'].apply(lambda x: x.expand(3,32,32))


# np.nan
# for i in range(len(df['img'])):
#     new_df['img'].iloc[i] = resize2d(df['img'].iloc[i], (32,32))


  


In [255]:
df['img'][0].shape

torch.Size([3, 32, 32])

In [256]:
# split training and test (by making sure the 10 ultrasound images of one patient is in the same set)
train_data, test_data = train_test_split(df)

In [257]:
###############################################################################
# If a GPU is available, let's use it!
use_cuda = torch.cuda.is_available()
device = torch.device("cuda" if use_cuda else "cpu")
###############################################################################

# Create dataloader

In [258]:
# create dataset
# from https://github.com/python-engineer/pytorchTutorial/blob/master/09_dataloader.py

train_dataset = UltrasoundDataset(train_data)
test_dataset  = UltrasoundDataset(test_data)

# Load whole dataset with DataLoader
# shuffle: shuffle data, good for training
# num_workers: faster loading with multiple subprocesses
# !!! IF YOU GET AN ERROR DURING LOADING, SET num_workers TO 0 !!!
train_loader = DataLoader(dataset=train_dataset,
                          batch_size=128,
                          shuffle=True,
                          num_workers=2)
test_loader = DataLoader(dataset=test_dataset,
                          batch_size=5,
                          shuffle=True,
                          num_workers=2)


In [259]:
dataiter = iter(train_loader)
data1 = dataiter.next()
data2 = dataiter.next()
data3 = dataiter.next()
features, labels = data3
print(features.shape, labels.shape)

torch.Size([128, 3, 32, 32]) torch.Size([128])


In [260]:
features[0].shape

torch.Size([3, 32, 32])

# Defining scattering transformations

In [261]:
parser = argparse.ArgumentParser(description='CIFAR scattering  + hybrid examples')
parser.add_argument('--mode', type=int, default=1,help='scattering 1st or 2nd order')
parser.add_argument('--width', type=int, default=2,help='width factor for resnet')
args = parser.parse_args(args=[])

use_cuda = torch.cuda.is_available()
device = torch.device("cuda" if use_cuda else "cpu")
number_channels = 3
if args.mode == 1:
    scattering = Scattering2D(J=2, shape=(32, 32), max_order=1)
    K = 17*number_channels
else:
    scattering = Scattering2D(J=2, shape=(32, 32))
    K = 81*number_channels
if use_cuda:
    scattering = scattering.cuda()


In [262]:
def conv3x3(in_planes, out_planes, stride=1):
    "3x3 convolution with padding"
    # in_planes = in_channels
    # out_planes = out_channels
    return nn.Conv2d(in_planes, out_planes, kernel_size=3, stride=stride,
                     padding=1, bias=False)

## Training and Testing Functions

In [263]:
def train(model, device, train_loader, optimizer, epoch, scattering):
    model.train()
    for batch_idx, (data, target) in enumerate(train_loader):
        data, target = data.to(device), target.to(device)
        optimizer.zero_grad()
        output = model(scattering(data))
        loss = F.cross_entropy(output, target)
        loss.backward()
        optimizer.step()
        if batch_idx % 50 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader), loss.item()))

def test(model, device, test_loader, scattering):
    model.eval()
    test_loss = 0
    correct = 0
    with torch.no_grad():
        for data, target in test_loader:
            data, target = data.to(device), target.to(device)
            output = model(scattering(data))
            test_loss += F.cross_entropy(output, target, reduction='sum').item() # sum up batch loss
            pred = output.max(1, keepdim=True)[1] # get the index of the max log-probability
            correct += pred.eq(target.view_as(pred)).sum().item()

    test_loss /= len(test_loader.dataset)
    print('\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.2f}%)\n'.format(
        test_loss, correct, len(test_loader.dataset),
        100. * correct / len(test_loader.dataset)))

# Optimization

In [264]:
class BasicBlock(nn.Module):
    def __init__(self, inplanes, planes, stride=1, downsample=None):
        super(BasicBlock, self).__init__()
        self.conv1 = conv3x3(inplanes, planes, stride)
        self.bn1 = nn.BatchNorm2d(planes)
        self.relu = nn.ReLU(inplace=True)
        self.conv2 = conv3x3(planes, planes)
        self.bn2 = nn.BatchNorm2d(planes)
        self.downsample = downsample
        self.stride = stride

    def forward(self, x):
        print(type(x))
        residual = x
        out = self.conv1(x)
        out = self.bn1(out)
        out = self.relu(out)
        out = self.conv2(out)
        out = self.bn2(out)
        

        if self.downsample is not None:
            residual = self.downsample(x)

        out += residual
        out = self.relu(out)

In [270]:
class Scattering2dResNet(nn.Module):
    def __init__(self, in_channels,  k=2, n=4, num_classes=2):
        super(Scattering2dResNet, self).__init__()
        self.inplanes = 16 * k
        self.ichannels = 16 * k
        self.K = in_channels
        self.init_conv = nn.Sequential(
            nn.BatchNorm2d(in_channels, eps=1e-5, affine=False),
            nn.Conv2d(in_channels, self.ichannels,
                  kernel_size=3, stride=1, padding=1, bias=False),
            nn.BatchNorm2d(self.ichannels),
            nn.ReLU(True)
        )

        self.layer2 = self._make_layer(BasicBlock, 32 * k, n)
        self.layer3 = self._make_layer(BasicBlock, 64 * k, n)
        self.avgpool = nn.AdaptiveAvgPool2d(2)
        self.fc = nn.Linear(64 * k * 4, num_classes)

    def _make_layer(self, block, planes, blocks, stride=1):
        downsample = None
        print('here')
        if stride != 1 or self.inplanes != planes:
            downsample = nn.Sequential(
                nn.Conv2d(self.inplanes, planes,
                          kernel_size=1, stride=stride, bias=False),
                nn.BatchNorm2d(planes),
            )
       
        layers = []
        
        layers.append(block(self.inplanes, planes, stride, downsample))
        self.inplanes = planes
        for i in range(1, blocks):
            layers.append(block(self.inplanes, planes))
        return nn.Sequential(*layers)

    def forward(self, x):
        print(1)
        x = x.view(x.size(0), self.K, 8, 8)
        print(2)
        x = self.init_conv(x)
        print(3)
        print(x.shape)
        x = self.layer2(x)
        print(4)
        x = self.layer3(x)
        print(5)
        x = self.avgpool(x)
        print(6)
        x = x.view(x.size(0), -1)
        print(7)
        x = self.fc(x)
        print(8)
        return x

In [271]:
model = Scattering2dResNet(K, args.width).to(device)
# Optimizer
lr = 0.1
for epoch in range(0, 90):
  if epoch%20==0:
      optimizer = torch.optim.SGD(model.parameters(), lr=lr, momentum=0.9,
                                  weight_decay=0.0005)
      lr*=0.2

train(model, device, train_loader, optimizer, epoch+1, scattering)
test(model, device, test_loader, scattering)

1
2
3
torch.Size([128, 32, 8, 8])
<class 'torch.Tensor'>
<class 'NoneType'>


TypeError: conv2d(): argument 'input' (position 1) must be Tensor, not NoneType

# Run Mlflow to see results

`!mlflow ui`

Should launch something like this:



In [None]:
# !mlflow ui