In [1]:
# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python
# For example, here's several helpful packages to load

import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

# Input data files are available in the read-only "../input/" directory
# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory

import os
for dirname, _, filenames in os.walk('/kaggle/input'):
    for filename in filenames:
        print(os.path.join(dirname, filename))

# You can write up to 20GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using "Save & Run All" 
# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session

/kaggle/input/test-cifar100/test
/kaggle/input/cifar10-test-data-sp24-npy/cifar10_test_data_sp24.npy


# Data Preprocessing

In [2]:
# Imports for pytorch
import numpy as np
import torch
import torchvision
from torch import nn
import matplotlib
from matplotlib import pyplot as plt
import tqdm
import copy
import torch.utils.data as data

SEED = 1234

torch.manual_seed(SEED)
torch.cuda.manual_seed(SEED)
torch.backends.cudnn.deterministic = True

In [3]:
transform = torchvision.transforms.ToTensor()

unprocessed_train_data = torchvision.datasets.CIFAR100(
    root="data",
    train=True,
    download=True
)

"""
    
                           torchvision.transforms.ColorJitter(brightness = 0.1,
                                                              contrast = 0.1, 
                                                              saturation = 0.1), 
                           torchvision.transforms.RandomAdjustSharpness(sharpness_factor = 2,
                                                                        p = 0.1),
                           torchvision.transforms.RandomErasing(p=0.75,
                                                                scale=(0.02, 0.1),
                                                                value=1.0, 
                                                                inplace=False),
                            """


arr_mean = np.mean(unprocessed_train_data.data, axis=(0, 1, 2)) / 255
arr_sd = np.std(unprocessed_train_data.data, axis=(0, 1, 2)) / 255

SIZE = 112


train_transforms = torchvision.transforms.Compose([
                           torchvision.transforms.Resize(SIZE),
                           torchvision.transforms.RandomRotation(20),
                           torchvision.transforms.RandomHorizontalFlip(0.5),
                           torchvision.transforms.RandomCrop(SIZE, padding=10),
                           torchvision.transforms.ColorJitter(brightness = 0.1,
                                                              contrast = 0.1, 
                                                              saturation = 0.1), 
                           torchvision.transforms.RandomAdjustSharpness(sharpness_factor = 2,
                                                                        p = 0.1),
                           
                           torchvision.transforms.ToTensor(),
                           torchvision.transforms.Normalize(mean=arr_mean,
                                                std=arr_sd)
                       ])


test_transforms = torchvision.transforms.Compose([
                           torchvision.transforms.Resize(SIZE),
                           torchvision.transforms.ToTensor(),
                           torchvision.transforms.Normalize(mean=arr_mean,
                                                std=arr_sd)
                           ])

training_data = torchvision.datasets.CIFAR10(root = 'data',
                              train=True,
                              download=True,
                              transform=train_transforms)

test_data = torchvision.datasets.CIFAR10(root = 'data',
                             train=False,
                             download=True,
                             transform=test_transforms)

Files already downloaded and verified
Files already downloaded and verified
Files already downloaded and verified


In [4]:
test_data

Dataset CIFAR10
    Number of datapoints: 10000
    Root location: data
    Split: Test
    StandardTransform
Transform: Compose(
               Resize(size=112, interpolation=bilinear, max_size=None, antialias=True)
               ToTensor()
               Normalize(mean=[0.50707516 0.48654887 0.44091784], std=[0.26733429 0.25643846 0.27615047])
           )

In [5]:
train_data, val_data = data.random_split(training_data,
                                           [int(training_data.data.shape[0] * 0.9), int(training_data.data.shape[0] * 0.1)])


In [6]:
val_data = copy.deepcopy(val_data)
val_data.dataset.transform = test_transforms #make sure the val data uses test transform

# **Build Model Architecture**


In [7]:
class NormalizedLayer(nn.Module):
    def __init__(self, size):
        super().__init__()
        self.linear1 = nn.Linear(size, size)
        self.linear2 = nn.Linear(size, size)
        self.layer = nn.RMSNorm(size)
        self.dropout = nn.Dropout(0.4)


    def forward(self, input):
        x = input
        x = self.dropout(x)
        x = self.linear1(x)
        x = nn.functional.relu(x)
        x = torch.square(x)
        x = self.layer(x)
        x = self.linear2(x)
        x = x + input
        return x

class Classifier(nn.Module):
    def __init__(self, output_dim, hidden_dim = 512, layer_count = 32):
        super().__init__()

        self.dropout = nn.Dropout(.5)
        self.reduction = nn.Linear(25088, hidden_dim)
        #self.reduction = nn.Linear(6272, hidden_dim)
        self.layer = nn.RMSNorm(hidden_dim)
        
        self.layers = []
        for i in range(layer_count):
            layer = NormalizedLayer(hidden_dim)
            self.layers.append(layer)
            self.register_module('layer' + str(i), layer)
        self.linearOutput = nn.Linear(hidden_dim, output_dim)
        

    def forward(self, x):

        x = self.dropout(x)
        x = self.reduction(x)
        x = self.layer(x)

        for layer in self.layers:
            x = layer(x)

        x = self.linearOutput(x)
        
        return x

In [8]:


class VGG(nn.Module):
    def __init__(self, features, output_dim):
        super().__init__()

        self.features = features

        self.avgpool = nn.AdaptiveAvgPool2d((7,7))

        self.classifier = Classifier(output_dim)
    

    def forward(self, x):
        x = self.features(x)
        #x = self.avgpool(x)
        h = x.view(x.shape[0], -1)
        x = self.classifier(h)
        return x, h

 
                
def design_layers(config, batch_norm):

    layers = []
    in_channels = 3

    for c in config:

        if c == 'M':
            #layers += [nn.Conv2d(in_channels, in_channels, kernel_size=2, stride = 2)]
            layers += [nn.MaxPool2d(kernel_size=2, stride = 2)]

        else:
        
            conv2d = nn.Conv2d(in_channels, c, kernel_size=3, padding=1)
            if batch_norm:
                layers += [conv2d, nn.BatchNorm2d(c), nn.ReLU(inplace=True)]
            else:
                layers += [conv2d, nn.ReLU(inplace=True)]
            in_channels = c

    return nn.Sequential(*layers)
seq = [64, 'M', 128, 'M', 256, 256, 'M', 512, 512, 'M', 512, 512, 'M']







"\n64, 64, 'M', \n       64, 64, 'M',  \n       64, 64, 'M',  \n       64, 512, 'M']\n"

In [9]:
vgg1_layers = design_layers(seq, batch_norm=True)
model = VGG(vgg1_layers, 10)
vgg1_layers

Sequential(
  (0): Conv2d(3, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (2): ReLU(inplace=True)
  (3): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (4): Conv2d(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (5): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (6): ReLU(inplace=True)
  (7): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_mode=False)
  (8): Conv2d(32, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (9): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (10): ReLU(inplace=True)
  (11): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (12): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (13): ReLU(inplace=True)
  (14): MaxPool2d(kernel_size=2, stride=2, padding=0, dilation=1, ceil_m

In [10]:
BATCH_SIZE = 64

training_data = torchvision.datasets.CIFAR10(root = 'data',
                              train=True,
                              download=True,
                              transform=train_transforms)


train_iterator = data.DataLoader(train_data,
                                 shuffle=True,
                                 batch_size=BATCH_SIZE)

val_iterator = data.DataLoader(val_data,
                                 batch_size=BATCH_SIZE)



Files already downloaded and verified


In [11]:
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')


model = model.to(device)
CEL = nn.CrossEntropyLoss().to(device)

In [12]:
import torch.optim as optim


params = [
          {'params': model.features.parameters()}, #, 'lr': 5e-4 / 10},
          {'params': model.classifier.parameters()}
         ]

optimizer = optim.AdamW(params, lr= 5e-3, weight_decay = 1e-4)



In [13]:
from tqdm.notebook import trange, tqdm

def train(model, iterator, optimizer, CEL, device):

    epoch_loss = 0
    epoch_accuracy = 0

    model.train()

    for (x, y) in tqdm(iterator, desc="Training", leave=False):

        x = x.to(device)
        y = y.to(device)

        optimizer.zero_grad()

        y_pred,_ = model(x)

        loss = CEL(y_pred, y)

        accuracy = calculate_accuracy(y_pred, y)

        loss.backward()

        optimizer.step()

        epoch_loss += loss.item()
        epoch_accuracy += accuracy.item()

    return epoch_loss / len(iterator), epoch_accuracy / len(iterator)


def evaluate(model, iterator, CEL, device):

    epoch_loss = 0
    epoch_accuracy = 0

    model.eval()

    with torch.no_grad():

        for (x, y) in tqdm(iterator, desc="Evaluating", leave=False):

            x = x.to(device)
            y = y.to(device)

            y_pred,_ = model(x)

            loss = CEL(y_pred, y)

            accuracy = calculate_accuracy(y_pred, y)

            epoch_loss += loss.item()
            epoch_accuracy += accuracy.item()

    return epoch_loss / len(iterator), epoch_accuracy / len(iterator)

def calculate_accuracy(y_pred, y):
    first_pred = y_pred.argmax(1, keepdim=True)
    correct = first_pred.eq(y.view_as(first_pred)).sum()
    accuracy = correct.float() / y.shape[0]
    return accuracy

In [None]:
EPOCHS = 20
BATCH_SIZE = 64


best_val_loss = float('inf')

train_accuracies = []
val_accuracies = []
train_losses = []
val_losses = []

val_iterator = data.DataLoader(val_data,
                                 batch_size=BATCH_SIZE)

for epoch in trange(EPOCHS):
    
    training_data = torchvision.datasets.CIFAR10(root = 'data',
                              train=True,
                              download=False,
                              transform=train_transforms)
    train_iterator = data.DataLoader(train_data,
                                 shuffle=True,
                                 batch_size=BATCH_SIZE)

    train_loss, train_accuracy = train(model, train_iterator, optimizer, CEL, device)
    val_loss, val_accuracy = evaluate(model, val_iterator, CEL, device)

    train_accuracies.append(train_accuracy)
    val_accuracies.append(val_accuracy)
    train_losses.append(train_loss)
    val_losses.append(val_loss)

    if val_loss < best_val_loss:
        best_val_loss = val_loss
        torch.save(model.state_dict(), 'tut1-model.pt')

    print(f'\tTrain Loss: {train_loss:.3f} | Train Acc: {train_accuracy*100:.2f}%')
    print(f'\t Val. Loss: {val_loss:.3f} |  Val. Acc: {val_accuracy*100:.2f}%')


plt.plot(range(1, EPOCHS + 1), train_accuracies, label='Train Accuracy')
plt.plot(range(1, EPOCHS + 1), val_accuracies, label='Validation Accuracy')
plt.xlabel('Epoch')
plt.ylabel('Accuracy')
plt.title('Train/Validation Accuracy')
plt.legend()
plt.show()

plt.plot(range(1, EPOCHS + 1), train_losses, label='Train Loss')
plt.plot(range(1, EPOCHS + 1), val_losses, label='Validation Loss')
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.title('Train/Validation Loss')
plt.legend()
plt.show()

  0%|          | 0/20 [00:00<?, ?it/s]

Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 4.472 | Train Acc: 24.35%
	 Val. Loss: 1.806 |  Val. Acc: 35.82%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 1.413 | Train Acc: 48.20%
	 Val. Loss: 1.093 |  Val. Acc: 60.27%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 1.057 | Train Acc: 62.27%
	 Val. Loss: 0.903 |  Val. Acc: 68.43%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 0.889 | Train Acc: 68.67%
	 Val. Loss: 0.731 |  Val. Acc: 74.74%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 0.784 | Train Acc: 72.58%
	 Val. Loss: 0.628 |  Val. Acc: 78.03%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 0.714 | Train Acc: 75.36%
	 Val. Loss: 0.646 |  Val. Acc: 77.77%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 0.655 | Train Acc: 77.27%
	 Val. Loss: 0.639 |  Val. Acc: 77.97%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

Evaluating:   0%|          | 0/79 [00:00<?, ?it/s]

	Train Loss: 0.616 | Train Acc: 78.57%
	 Val. Loss: 0.597 |  Val. Acc: 78.84%


Training:   0%|          | 0/704 [00:00<?, ?it/s]

In [None]:
from PIL import Image
import os

class CIFAR10Test(torchvision.datasets.VisionDataset):

    def __init__(self, transform=None, target_transform=None):
        super(CIFAR10Test, self).__init__(None, transform=transform,
                                      target_transform=target_transform)
        assert os.path.exists("/kaggle/input/cifar10-test-data-sp24-npy/cifar10_test_data_sp24.npy"), "You must upload the test data to the file system."
        self.data = [np.load("/kaggle/input/cifar10-test-data-sp24-npy/cifar10_test_data_sp24.npy", allow_pickle=False)]

        self.data = np.vstack(self.data).reshape(-1, 3, 32, 32)
        self.data = self.data.transpose((0, 2, 3, 1))  # convert to HWC

    def __getitem__(self, index: int):
        img = self.data[index]
        img = Image.fromarray(img)
        if self.transform is not None:
            img = self.transform(img)
        return img

    def __len__(self) -> int:
        return len(self.data)

# Create the test dataset
testing_data = CIFAR10Test(
    transform=test_transforms # NOTE: Make sure transform is the same as used in the training dataset.
)

test_data = torchvision.datasets.CIFAR10(root = 'data',
                             train=False,
                             download=True,
                             transform=test_transforms)

In [None]:
test_iterator = data.DataLoader(testing_data,
                                batch_size=BATCH_SIZE,
                               shuffle = False)


In [None]:
model

In [None]:


def get_predictions(model, iterator):

    model.eval()
    model = model.to(device)
    labels = []

    with torch.no_grad():
        for x in tqdm(iterator):
            x = x.to(device)

            y_pred, _ = model(x)
            
            _, predicted_labels = torch.max(y_pred, 1)
            
            labels.extend(predicted_labels.tolist())
    

    return labels


predictions = get_predictions(model, test_iterator)
len(predictions)

In [None]:
import pandas as pd

if isinstance(predictions, np.ndarray):
    predictions = predictions.astype(int)
else:
    predictions = np.array(predictions, dtype=int)
assert predictions.shape == (len(testing_data),), "Predictions were not the correct shape"
df = pd.DataFrame({'Category': predictions})
df.index += 1  # Ensures that the index starts at 1.
df.to_csv('submission.csv', index_label='Id')

In [None]:
def unpickle(file):
    import pickle
    with open(file, 'rb') as fo:
        dict = pickle.load(fo, encoding='bytes')
    return dict
df