# Training MNIST Model

The goal of this is to create a larger-than-necessary model for classifying handwritten MNIST digits. After training, the model will be serialized in a binary format to later be run using **raw** CUDA and OpenCL.

In [12]:
# required imports
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms
from torch.utils.data import DataLoader 
from torchvision.datasets import MNIST
import numpy as np

## seed for reproducibility
torch.manual_seed(0)

<torch._C.Generator at 0x7f4ea4b71bd0>

In [2]:
# Define the neural network model
class SimpleNN(nn.Module):
    def __init__(self):
        super(SimpleNN, self).__init__()
        self.fc1 = nn.Linear(28 * 28, 128)
        self.fc2 = nn.Linear(128, 64)
        self.fc3 = nn.Linear(64, 10) # 0 - 9 digits
    
    def forward(self, x):
        x = x.view(-1, 28 * 28)
        x = torch.relu(self.fc1(x))
        x = torch.relu(self.fc2(x))
        x = self.fc3(x)
        return x

model = SimpleNN()

In [3]:
# Hyperparameters
batch_size = 64
learning_rate = 0.001
epochs = 5
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

In [4]:
# data loading
transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))])

# Datasets and DataLoaders
train_dataset = datasets.MNIST(root='./data', train=True, download=True, transform=transform)
test_dataset = datasets.MNIST(root='./data', train=False, download=True, transform=transform)
train_loader = DataLoader(train_dataset, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(test_dataset, batch_size=batch_size, shuffle=False)

In [5]:
# training the model
model.train()
for epoch in range(epochs):
    running_loss = 0.0
    for images, labels in train_loader:
        optimizer.zero_grad()
        outputs = model(images)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        running_loss += loss.item()
    print(f'Epoch {epoch+1}/{epochs}, Loss: {running_loss/len(train_loader)}')

Epoch 1/5, Loss: 0.40121362450471054
Epoch 2/5, Loss: 0.19369668023053135
Epoch 3/5, Loss: 0.14247536396425067
Epoch 4/5, Loss: 0.11517478759958545
Epoch 5/5, Loss: 0.09768994483299481


In [18]:
model.eval()
correct = 0
total = 0
with torch.no_grad():
    for images, labels in test_loader:
        outputs = model(images)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
print(f'Accuracy of the model on the test images: {100 * correct / total}%')

Accuracy of the model on the test images: 96.52%


In [19]:
# rather sloppy section to save model weights in a binary format
# somewhat difficult for some reason

import glob
import os

os.system('rm *.bin')

rm: cannot remove '*.bin': No such file or directory


256

In [20]:
# checking the distribution of weights

# this comes after seeing the bill daily talk where weights are: normally distributed **before** pruning and non-normally distributed after pruning
i = 0
for layer in model.children():
    if isinstance(layer, nn.Linear):
        state = layer.state_dict()
        state['weight'].flatten().data.cpu().numpy().tofile(f'weights{i}.bin')
        state['bias'].flatten().data.cpu().numpy().tofile(f'bias{i}.bin')
        i += 1

In [21]:
# appending all the model weights to a single binary file
with open('model', 'wb') as f:
    for file in glob.glob('*.bin'):
        with open(file, 'rb') as f2:
            f.write(f2.read())

os.system('rm *.bin')

0

## Saving MNIST Outputs

Save the MNIST and model outputs as a position-dependent pair.

In [None]:
transform = transforms.Compose([transforms.ToTensor()])
mnist_train = MNIST(root='./data', train=True, download=True, transform=transform)
mnist_test = MNIST(root='./data', train=False, download=True, transform=transform)

def flatten_and_convert_to_numpy(dataset):
    images = []
    labels = []
    for img, label in dataset:
        images.append(img.view(-1).numpy())
        labels.append(label)
    return np.array(images), np.array(labels)

train_images, train_labels = flatten_and_convert_to_numpy(mnist_train)
test_images, test_labels = flatten_and_convert_to_numpy(mnist_test)

# Step 4: Save the flattened data in a binary format
train_images.tofile('mnist_train_images.bin')
train_labels.tofile('mnist_train_labels.bin')
test_images.tofile('mnist_test_images.bin')
test_labels.tofile('mnist_test_labels.bin')

print("MNIST dataset saved as flattened binary format.")



# Generating Outputs

This section seeks to match outputs from PyTorch to real data.

In [22]:
# generating sample outputs for the model

# generate the outputs for each mnist image
model.eval()
outputs = []
with torch.no_grad():
    for images, labels in test_loader:
        outputs.append(model(images).numpy())

outputs

[array([[-3.84305739e+00, -6.96367931e+00,  4.26903677e+00,
          1.58622944e+00, -1.00826817e+01, -6.90857589e-01,
         -1.88668499e+01,  1.23242245e+01, -3.35564971e+00,
         -4.76819158e-01],
        [-3.17163157e+00,  3.17657900e+00,  1.07219229e+01,
          1.97508609e+00, -1.50801525e+01, -1.28383875e+00,
         -3.79964662e+00, -1.13140535e+01, -4.25785875e+00,
         -1.35257730e+01],
        [-4.75522995e+00,  6.85870075e+00, -7.09604621e-01,
         -1.37461233e+00, -1.60529363e+00, -2.13369441e+00,
         -4.14791012e+00, -8.77739310e-01,  2.88579941e-01,
         -1.57263720e+00],
        [ 5.80550432e+00, -5.79681349e+00,  1.79512167e+00,
         -4.56232357e+00, -8.08167648e+00, -1.95451808e+00,
         -4.52850294e+00, -1.13939202e+00, -6.62702894e+00,
         -1.74032733e-01],
        [-4.61704540e+00, -9.28204823e+00, -2.25462294e+00,
         -1.09925079e+01,  7.76164627e+00, -3.84284711e+00,
         -5.20674467e+00, -2.52163142e-01, -4.788426

In [23]:
# save the outputs to a binary file
for i, output in enumerate(outputs):
    output.tofile(f'output{i}.bin')

# appending all the model outputs to a single binary file
with open('model_outputs', 'ab') as f:
    for file in glob.glob('output*.bin'):
        with open(file, 'rb') as f2:
            f.write(f2.read())

# clean up
os.system('rm output*.bin')

0