In [None]:
import sys
import os

current_dir = os.getcwd()  
util_dir = os.path.join(current_dir, '../util')
sys.path.append(util_dir)

  from .autonotebook import tqdm as notebook_tqdm


In [None]:
from helpers import *
from warnings import filterwarnings

import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F

filterwarnings('ignore')

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

In [2]:
print(f'Using device: {device}')

Using device: cuda


In [3]:
positive_encodings, negative_encodings = load_complete_dataset(n_files=10)

Loading checkpoint shards: 100%|██████████| 2/2 [00:02<00:00,  1.00s/it]
100%|██████████| 10/10 [00:03<00:00,  3.14it/s]
100%|██████████| 10/10 [00:01<00:00,  6.04it/s]
100%|██████████| 10/10 [00:01<00:00,  6.53it/s]
100%|██████████| 10/10 [00:02<00:00,  4.07it/s]
100%|██████████| 10/10 [00:02<00:00,  4.73it/s]
100%|██████████| 10/10 [00:01<00:00,  6.30it/s]
100%|██████████| 10/10 [00:02<00:00,  4.36it/s]
100%|██████████| 10/10 [00:02<00:00,  4.42it/s]
100%|██████████| 10/10 [00:03<00:00,  2.92it/s]
100%|██████████| 10/10 [00:02<00:00,  4.44it/s]


In [4]:
class MLPClassifier(nn.Module):
    def __init__(self, input_size, hidden_size, output_size):
        super(MLPClassifier, self).__init__()
        self.fc1 = nn.Linear(input_size, hidden_size)
        self.fc2 = nn.Linear(hidden_size, hidden_size)
        self.fc3 = nn.Linear(hidden_size, output_size)
        self.dropout = nn.Dropout(0.01)
        self.sinu = nn.SiLU()
        self.batchnorm = nn.BatchNorm1d(hidden_size)
        self.softmax = nn.Softmax(dim=1)

    def forward(self, x):
        x = self.fc1(x)
        x = self.batchnorm(x)
        x = self.sinu(x)
        x = self.dropout(x)
        x = self.fc2(x)
        x = self.batchnorm(x)
        x = self.sinu(x)
        x = self.dropout(x)
        x = self.fc3(x)
        x = self.softmax(x)
        return x

In [5]:
batch_size = 16

dataset = torch.concat([positive_encodings, negative_encodings], dim=0)
labels = torch.tensor([1] * len(positive_encodings) + [0] * len(negative_encodings))

dataset = torch.utils.data.TensorDataset(dataset, labels)

train_dataset, test_dataset = torch.utils.data.random_split(dataset, [int(0.8 * len(dataset)), len(dataset) - int(0.8 * len(dataset))])

train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

In [6]:
learning_rate = 1e-5
num_epochs = 15
input_size = 3072
hidden_size = 1024
n_classes = 2

model = MLPClassifier(input_size, hidden_size, n_classes)
model = model.to(device)

criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

for epoch in range(num_epochs):
    for i, (data, labels) in enumerate(train_loader):

        data = data.to(device).float()
        labels = labels.to(device).long()

        optimizer.zero_grad()
        outputs = model(data)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

    print(f'[Epoch {epoch + 1}] | Loss: {round(loss.item(), 3)}')

[Epoch 1] | Loss: 0.631
[Epoch 2] | Loss: 0.546
[Epoch 3] | Loss: 0.391
[Epoch 4] | Loss: 0.486
[Epoch 5] | Loss: 0.41
[Epoch 6] | Loss: 0.487
[Epoch 7] | Loss: 0.347
[Epoch 8] | Loss: 0.343
[Epoch 9] | Loss: 0.381
[Epoch 10] | Loss: 0.436
[Epoch 11] | Loss: 0.548
[Epoch 12] | Loss: 0.406
[Epoch 13] | Loss: 0.381
[Epoch 14] | Loss: 0.436
[Epoch 15] | Loss: 0.325


In [7]:
train_acc = 0

with torch.no_grad():
    for data, labels in test_loader:
        data = data.to(device).float()
        labels = labels.to(device).long()

        outputs = model(data)
        _, predicted = torch.max(outputs.data, 1)
        train_acc += (predicted == labels).sum().item()

print(f'Test Accuracy: {round(train_acc / len(test_dataset), 3)}')

Test Accuracy: 0.88


In [8]:
test_acc = 0
with torch.no_grad():
    for data, labels in test_loader:
        data = data.to(device).float()
        labels = labels.to(device).long()

        outputs = model(data)
        _, predicted = torch.max(outputs.data, 1)
        test_acc += (predicted == labels).sum().item()

print(f'Test Accuracy: {round(test_acc / len(test_dataset), 3)}')

Test Accuracy: 0.881
