<a href="https://colab.research.google.com/github/srishti-git1110/Simple_NN_in_PyTorch/blob/main/FFNN.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

This notebook is a hands-on PyTorch demo for readers who already understand, in theory, what neural networks are and how they work, and who want to put that knowledge into practice in PyTorch.
You can run this notebook on either a GPU or a CPU.

Here we build a very small network and train it on the MNIST dataset.

In [1]:
import torch.nn as nn #ffnn, cnn, rnn etc
import torch.optim as optim #optimisers like sgd etc
import torch.nn.functional as f #activ funcs
from torch.utils.data import DataLoader #minibatch train test etc
import torchvision.datasets as datasets #std datasets
import torchvision.transforms as transforms #transformations to perform on dataset


In [10]:
import torch

In [14]:
class NN(nn.Module):
  """Feed-forward classifier with one hidden layer.

  Structure: input layer -> hidden layer (ReLU) -> output layer.

  Args:
    input_size: number of features per example (784 for the flattened
      1x28x28 images used in this notebook).
    num_classes: number of scores produced per example.
    hidden_size: width of the hidden layer. Defaults to 50, the value that
      was previously hard-coded, so existing two-argument calls are unchanged.
  """

  def __init__(self, input_size, num_classes, hidden_size=50):
    super().__init__()

    #input layer - hidden layer - output layer; This is our network structure
    self.fc1 = nn.Linear(in_features=input_size, out_features=hidden_size)
    self.fc2 = nn.Linear(in_features=hidden_size, out_features=num_classes)

  def forward(self, x):
    """Compute class scores for a batch.

    Args:
      x: batch of flattened examples, shape (batch, input_size),
        e.g. 64*784 in this notebook.

    Returns:
      Tensor of shape (batch, num_classes), e.g. 64*10. These are the raw
      outputs of the last linear layer; no softmax is applied here.
    """
    #(batch, input_size) -> (batch, hidden_size)
    x = f.relu(self.fc1(x))
    #(batch, hidden_size) -> (batch, num_classes)
    x = self.fc2(x)
    return x

#configuration: use the gpu when one is available, otherwise fall back to the cpu
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
input_size = 784 #1*28*28, the length of one image after flattening (see the reshape in the loop)
num_classes = 10
learning_rate = .001
batch_size = 64
epochs = 1

#load data
#both splits are stored under dataset/ (downloaded if needed) and converted to tensors
train_set = datasets.MNIST(root='dataset/', train=True, transform=transforms.ToTensor(), download=True)
train_loader = DataLoader(dataset=train_set, batch_size=batch_size, shuffle=True)
test_set = datasets.MNIST(root='dataset/', train=False, transform=transforms.ToTensor(), download=True)
#NOTE(review): shuffle=True is not needed for evaluation; check_accuracy only counts correct predictions
test_loader = DataLoader(dataset=test_set, batch_size=batch_size, shuffle=True)

#initialize
model = NN(input_size, num_classes).to(device)

#loss is computed directly on the scores returned by the model
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

#train
for epoch in range(epochs):
  #NOTE(review): batch_num is not used inside the loop body
  for batch_num, (data, targets) in enumerate(train_loader):
    #move the batch to the same device as the model
    data = data.to(device=device)
    targets = targets.to(device=device)
    data = data.reshape(data.shape[0], -1) #original was (64, 1, 28, 28) we want (64, 784); the last batch may hold fewer than 64 examples
    
    #calls the forward, returns 64*10
    scores = model(data) 
    loss = criterion(scores, targets)
    
    #backward
    optimizer.zero_grad() #clears old gradients from the last step (otherwise you'd just accumulate the gradients from all loss.backward() calls).
    loss.backward() #computes the derivative of the loss w.r.t. the parameters (or anything requiring gradients) using backpropagation.
    optimizer.step() #causes the optimizer to take a step based on the gradients of the parameters

def check_accuracy(loader, model):
  """Print the classification accuracy (in percent) of `model` over `loader`.

  Each batch is flattened to (batch, features), passed through the model, and
  the index of the highest score is compared with the label.

  Args:
    loader: iterable of (x, y) batches that exposes a `dataset` attribute.
      If the dataset has a `train` flag (as the MNIST datasets here do), it
      selects the "train"/"test" header line; otherwise a generic header is
      printed.
    model: the network to evaluate. Batches are moved to the device of the
      model's first parameter, so no global `device` variable is required.

  Returns:
    None. The result is printed.

  The model is switched to eval mode for the duration of the check and is then
  put back into whatever mode (train or eval) it was in when called.
  """
  dataset = loader.dataset
  if not hasattr(dataset, "train"):
    print("checking accuracy")
  elif dataset.train:
    print("checking accuracy on train data")
  else:
    print("checking accuracy on test data")

  #follow the model's own device; a model without parameters leaves the data where it is
  first_param = next(model.parameters(), None)
  model_device = None if first_param is None else first_param.device

  num_correct = 0
  num_samples = 0
  was_training = model.training
  model.eval() #some training only operations turned off like dropout etc

  try:
    with torch.no_grad():
      for x, y in loader: #loops over batches in a loader
        if model_device is not None:
          x = x.to(device=model_device)
          y = y.to(device=model_device)
        x = x.reshape(x.shape[0], -1)

        scores = model(x) #batch*num_classes
        _, predictions = scores.max(1) #max values, indices
        num_correct += (predictions == y).sum().item()
        num_samples += predictions.size(0)
  finally:
    #restore the caller's mode even if evaluation raised
    model.train(was_training)

  if num_samples == 0:
    #an empty loader would otherwise divide by zero
    print("Accuracy n/a (no samples)")
  else:
    print(f'Accuracy {num_correct / num_samples * 100:.2f}')
  

#report accuracy of the trained model on the train loader, then on the test loader
check_accuracy(train_loader, model)
check_accuracy(test_loader, model)

Batch no:  0
Batch no:  1
torch.Size([64, 10])
torch.Size([64])
torch.Size([])
Batch no:  2
Batch no:  3
Batch no:  4
Batch no:  5
Batch no:  6
Batch no:  7
Batch no:  8
Batch no:  9
Batch no:  10
Batch no:  11
Batch no:  12
Batch no:  13
Batch no:  14
Batch no:  15
Batch no:  16
Batch no:  17
Batch no:  18
Batch no:  19
Batch no:  20
Batch no:  21
Batch no:  22
Batch no:  23
Batch no:  24
Batch no:  25
Batch no:  26
Batch no:  27
Batch no:  28
Batch no:  29
Batch no:  30
Batch no:  31
Batch no:  32
Batch no:  33
Batch no:  34
Batch no:  35
Batch no:  36
Batch no:  37
Batch no:  38
Batch no:  39
Batch no:  40
Batch no:  41
Batch no:  42
Batch no:  43
Batch no:  44
Batch no:  45
Batch no:  46
Batch no:  47
Batch no:  48
Batch no:  49
Batch no:  50
Batch no:  51
Batch no:  52
Batch no:  53
Batch no:  54
Batch no:  55
Batch no:  56
Batch no:  57
Batch no:  58
Batch no:  59
Batch no:  60
Batch no:  61
Batch no:  62
Batch no:  63
Batch no:  64
Batch no:  65
Batch no:  66
Batch no:  67
Batch

In [12]:
#scratch inspection: shows the repr of the DataLoader object built in the training cell
train_loader

<torch.utils.data.dataloader.DataLoader at 0x7fbca9913950>

In [13]:
#scratch inspection: `targets` still holds the labels of the last batch seen by the training loop
print(targets.shape)

torch.Size([32])
