In [1]:
import torch
import torchvision
import torch.nn as nn
import time
import json
import datetime
from DeepLearning.Project1.data import *

In [2]:
# File based on https://github.com/huyvnphan/PyTorch_CIFAR10/
class VGG(nn.Module):
    def __init__(self, features, num_classes=10, avgpool_size=(1,1)):
        super(VGG, self).__init__()
        self.features = features

        self.avgpool = nn.AdaptiveAvgPool2d(avgpool_size)

        self.classifier = nn.Sequential(
            nn.Linear(512 * avgpool_size[0] * avgpool_size[1], 4096),
            nn.ReLU(True),
            nn.Dropout(),
            nn.Linear(4096, 4096),
            nn.ReLU(True),
            nn.Dropout(),
            nn.Linear(4096, num_classes),
        )

    def forward(self, x):
        x = self.features(x)
        x = self.avgpool(x)
        x = torch.flatten(x, 1)
        x = self.classifier(x)
        return x

 # Create convolution part of VGG11_bn archhitecture
def make_vgg11_bn_layers(cfg = None):
    if cfg == None:
        cfg = [64, "M", 128, "M", 256, 256, "M", 512, 512, "M", 512, 512, "M"]
    layers = []
    in_channels = 3
    for v in cfg:
        if v == "M":
            layers += [nn.MaxPool2d(kernel_size=2, stride=2)]
        else:
            conv2d = nn.Conv2d(in_channels, v, kernel_size=3, padding=1)
            layers += [conv2d, nn.BatchNorm2d(v), nn.ReLU(inplace=True)]
            in_channels = v
    return nn.Sequential(*layers)

 # Create VGG11_bn model
def vgg11_bn(device="cpu", num_classes=10):
    model = VGG(make_vgg11_bn_layers(), num_classes=num_classes)
    return model

vgg_cfg = {
    '8':  [64, 'M', 128, 'M', 256, 'M', 512, 'M', 512, 'M'],
    '11': [64, 'M', 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M'],
    '13': [64, 64, 'M', 128, 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M'],
    '16': [64, 64, 'M', 128, 128, 'M', 256, 256, 256, 'M', 512, 512, 512, 'M', 512, 512, 512, 'M'],
    '19': [64, 64, 'M', 128, 128, 'M', 256, 256, 256, 256, 'M', 512, 512, 512, 512, 'M', 
          512, 512, 512, 512, 'M'],
}



def eval_accuracy(model, dataloader, training_device='cpu'):
    with torch.no_grad():
        model.to(training_device)
        correct = 0
        all_so_far = 0
        for inputs, labels in dataloader:
            inputs, labels = inputs.to(training_device), labels.to(training_device)
            pred = torch.argmax(model(inputs), dim=1)

            all_so_far += labels.size().numel()
            correct += torch.sum(pred.eq(labels)).item()
    return correct/all_so_far

In [3]:
def backup_to_ram(model):
    from copy import deepcopy
    return deepcopy(model).cpu()

class EarlyStopper:
    def __init__(self, patience = 3, backup_method=backup_to_ram):
        self.patience = patience
        self.current = 0
        
        self.backup_method = backup_method
        
        self.best_backup = None
        self.best_accuracy = 0.

    def should_continue(self, accuracy, model = None):
        if self.best_accuracy < accuracy:
            self.current = 0
            self.best_accuracy = accuracy
            if model is not None:
                self.best_backup = self.backup_method(model)
            return True
        
        self.current += 1
        
        if self.current >= self.patience:
            return False
        return True

In [4]:
def train_one_epoch(model, optimizer, criterion, dataloader_train, training_device):
    for inputs, labels in dataloader_train:
        inputs, labels = inputs.to(training_device), labels.to(training_device)
        optimizer.zero_grad()
        loss = criterion(model(inputs), labels)
        loss.backward()
        optimizer.step()

def train_one_run(model, optimizer, criterion, dataloader_train, dataloader_val, max_epochs, early_stopper, trajectory, training_device='cuda', *_args, **_kwargs):
    model.train()
    model.to(training_device)
    for epoch in range(max_epochs):
        start_time = time.time()
        
        train_one_epoch(model, optimizer, criterion, dataloader_train, training_device)
        
        end_time = time.time()
        
        training_accuracy = eval_accuracy(model, dataloader_train, training_device)
        validation_accuracy = eval_accuracy(model, dataloader_val, training_device)
        print("Epoch: {}, Accuracy on validation set: {}".format(epoch, validation_accuracy))
        
        trajectory.append({
            "epoch": epoch,
            "train": training_accuracy,
            "validation": validation_accuracy,
            "start_time": start_time,
            "duration": end_time - start_time,
            "memory_allocated_mb": torch.cuda.memory_allocated()/1024/1024,
            "memory_reserved_mb": torch.cuda.memory_reserved()/1024/1024,
        })
        
        
        if not early_stopper.should_continue(validation_accuracy, model):
            print("Early stop")
            return early_stopper.best_backup
    
    return model

In [5]:
def run_aug_experiment(arch_name, model_factory, aug_name, aug_factory, run):
    path = "experiments/aug_" + aug_name + "_arch" + arch_name + "_" + run + "_"
    
    # 
    import os
    try:
        if os.stat(path + "report.json").st_size != 0:
            print("Report exists already for " + path[:-1] + ". Skipping...")
            return
    except OSError:
        pass
    
    train, test, val = aug_factory()
    print("data loaded")
    model = model_factory()
    criterion = torch.nn.CrossEntropyLoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=1e-3)
    early_stopper = EarlyStopper(patience = 5)
    trajectory = []
    print("experiment initialized")
    model = train_one_run(model, optimizer, criterion, train, val, 200, early_stopper, trajectory)
    validation_accuracy = eval_accuracy(model, val, "cuda")
    
    with open(path + "report.json", "w") as f:
        json.dump(
            {
                "name": arch_name,
                "run": run,
                "best_accuracy_validation": validation_accuracy,
                "time_generated": datetime.datetime.now().isoformat(),
                "trajectory": trajectory
            },
            f
        )
    torch.save(model, path + "model.pt")

In [6]:
def vgg_from_cfg(cfg_key):
    return VGG(
        make_vgg11_bn_layers(cfg=vgg_cfg[cfg_key]),
        num_classes=10,
        avgpool_size=(1,1)
    ).to("cuda")

def vgg11():
    return vgg_from_cfg("11")

def vgg13():
    return vgg_from_cfg("13")

def vgg16():
    return vgg_from_cfg("16")

In [7]:
def flip():
    return augmented_cifar10_dataset_randomflip(bs=128)

def small_rotate():
    return augmented_cifar10_dataset_randomrotate(5, bs=128)

def medium_rotate():
    return augmented_cifar10_dataset_randomrotate(45, bs=128)

def full_rotate():
    return augmented_cifar10_dataset_randomrotate(180, bs=128)

def fliprotate():
    return augmented_cifar10_dataset_randomflip_rotate(5, bs=128)

def noise():
    return augmented_cifar10_dataset_gauss_noise(0.05, bs=128)

def cutout():
    return augmented_cifar10_dataset_cutout(5, bs=128)

In [8]:
experiment_list = [
    (archfactory.__name__, archfactory, augfactory.__name__, augfactory, str(run))
    for run in range(1, 11)
    for archfactory in [vgg13, vgg16]
    for augfactory in [cutout]
] 

In [10]:
for experiment in experiment_list:
    print(
        "Time:", datetime.datetime.now().isoformat(), 
        "Arch: ", experiment[0], 
        "Aug: ", experiment[2],
        "Run: ", experiment[4]
    )
    run_aug_experiment(*experiment)

Time: 2023-03-25T14:10:46.231156 Arch:  vgg13 Aug:  cutout Run:  1
Report exists already for experiments/aug_cutout_archvgg13_1. Skipping...
Time: 2023-03-25T14:10:46.232285 Arch:  vgg16 Aug:  cutout Run:  1
Report exists already for experiments/aug_cutout_archvgg16_1. Skipping...
Time: 2023-03-25T14:10:46.232458 Arch:  vgg13 Aug:  cutout Run:  2
Report exists already for experiments/aug_cutout_archvgg13_2. Skipping...
Time: 2023-03-25T14:10:46.233836 Arch:  vgg16 Aug:  cutout Run:  2
Report exists already for experiments/aug_cutout_archvgg16_2. Skipping...
Time: 2023-03-25T14:10:46.234007 Arch:  vgg13 Aug:  cutout Run:  3
Report exists already for experiments/aug_cutout_archvgg13_3. Skipping...
Time: 2023-03-25T14:10:46.234071 Arch:  vgg16 Aug:  cutout Run:  3
Report exists already for experiments/aug_cutout_archvgg16_3. Skipping...
Time: 2023-03-25T14:10:46.234176 Arch:  vgg13 Aug:  cutout Run:  4
Report exists already for experiments/aug_cutout_archvgg13_4. Skipping...
Time: 2023-03

Epoch: 39, Accuracy on validation set: 0.8522
Epoch: 40, Accuracy on validation set: 0.8462
Early stop
Time: 2023-03-25T15:12:23.182483 Arch:  vgg16 Aug:  cutout Run:  9
Files already downloaded and verified
Files already downloaded and verified
data loaded
experiment initialized
Epoch: 0, Accuracy on validation set: 0.2736
Epoch: 1, Accuracy on validation set: 0.4128
Epoch: 2, Accuracy on validation set: 0.5168
Epoch: 3, Accuracy on validation set: 0.601
Epoch: 4, Accuracy on validation set: 0.6516
Epoch: 5, Accuracy on validation set: 0.709
Epoch: 6, Accuracy on validation set: 0.7336
Epoch: 7, Accuracy on validation set: 0.7658
Epoch: 8, Accuracy on validation set: 0.7756
Epoch: 9, Accuracy on validation set: 0.7922
Epoch: 10, Accuracy on validation set: 0.799
Epoch: 11, Accuracy on validation set: 0.8074
Epoch: 12, Accuracy on validation set: 0.8202
Epoch: 13, Accuracy on validation set: 0.8226
Epoch: 14, Accuracy on validation set: 0.8326
Epoch: 15, Accuracy on validation set: 0.8

In [None]:
len(experiment_list)