In [3]:
import torch, numpy as np, torch.nn as nn
from torch.autograd import variable
import torchvision.transforms as transforms, torchvision.datasets as dsets

# Mini-batch size and the target number of optimizer steps for the whole run.
batch_size = 100
n_iters = 3000

# MNIST splits stored under ./data; every image is converted with ToTensor().
# Only the training split is constructed with download=True.
train_dataset = dsets.MNIST(
    root="./data",
    train=True,
    transform=transforms.ToTensor(),
    download=True,
)
test_dataset = dsets.MNIST(
    root="./data",
    train=False,
    transform=transforms.ToTensor(),
)

# Epoch count = requested steps / batches per epoch, truncated to an int.
num_epochs = int(n_iters / (len(train_dataset) / batch_size))

# Training batches are reshuffled on each pass; test batches keep dataset order.
train_loader = torch.utils.data.DataLoader(
    dataset=train_dataset,
    batch_size=batch_size,
    shuffle=True,
)
test_loader = torch.utils.data.DataLoader(
    dataset=test_dataset,
    batch_size=batch_size,
    shuffle=False,
)

class FeedforwardNeuralNetModel(nn.Module):
    """One-hidden-layer feed-forward network: Linear -> Tanh -> Linear.

    The final layer's raw outputs are returned without any activation.
    """

    def __init__(self, input_size: int, hidden_size: int, num_classes: int) -> None:
        """Build the two linear layers.

        Args:
            input_size: Number of features in each input row.
            hidden_size: Width of the hidden layer.
            num_classes: Number of output values produced per input row.
        """
        super().__init__()
        # Size the layers from the constructor arguments rather than from
        # module-level globals, so the model can be built with any dimensions
        # and does not fail when those globals are absent.
        self.fc1 = nn.Linear(input_size, hidden_size)
        self.tanh = nn.Tanh()
        self.fc2 = nn.Linear(hidden_size, num_classes)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Apply fc1, tanh, then fc2 to ``x`` and return the result."""
        hidden = self.tanh(self.fc1(x))
        return self.fc2(hidden)

# Layer widths handed to the model constructor.
input_dim = 28 * 28
hidden_dim = 100
output_dim = 10
model = FeedforwardNeuralNetModel(input_dim, hidden_dim, output_dim)

# Cross-entropy objective optimised with plain SGD at a fixed learning rate.
learning_rate = 0.1
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

# Report the number of parameter tensors, then the size of each, one per line.
# The model defined in this file has exactly four (weight and bias of each
# linear layer), so this prints the same lines as indexing entries 0..3.
print(len(list(model.parameters())))
print(*(weights.size() for weights in model.parameters()), sep="\n")

# Train for `num_epochs` passes over `train_loader`; after every 500th
# optimizer step, measure accuracy over `test_loader` and print a status line.
iteration = 0  # step counter (not named `iter`, which would shadow the builtin)
for epoch in range(num_epochs):
    for images, labels in train_loader:
        # Flatten each batch to rows of 28*28 values for the first linear layer.
        # Tensors take part in autograd directly, so the deprecated
        # torch.autograd.variable(...) wrapper is not used.
        images = images.view(-1, 28*28)

        optimizer.zero_grad()  # clear gradients left over from the previous step
        outputs = model(images)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()

        iteration += 1

        if iteration % 500 == 0:
            correct = 0
            total = 0

            # Evaluation only needs forward passes, so gradient tracking is
            # switched off while scoring the test batches.
            with torch.no_grad():
                for test_images, test_labels in test_loader:
                    test_outputs = model(test_images.view(-1, 28*28))
                    # Predicted class = index of the largest output per row.
                    predicted = test_outputs.argmax(dim=-1)
                    total += test_labels.size(0)
                    # .item() keeps `correct` a Python int instead of a tensor.
                    correct += (predicted == test_labels).sum().item()

            # Whole-percent accuracy; explicit floor division so the result
            # does not depend on tensor-division semantics.
            accuracy = 100 * correct // total

            print("Iteration: {}. loss: {}. accuracy: {} ".format(iteration, loss.item(), accuracy))

4
torch.Size([100, 784])
torch.Size([100])
torch.Size([10, 100])
torch.Size([10])
Iteration: 500. loss: 0.3723928928375244. accuracy: 91 
Iteration: 1000. loss: 0.30961447954177856. accuracy: 92 
Iteration: 1500. loss: 0.34778961539268494. accuracy: 93 
Iteration: 2000. loss: 0.22718468308448792. accuracy: 94 
Iteration: 2500. loss: 0.18948039412498474. accuracy: 94 
Iteration: 3000. loss: 0.17092649638652802. accuracy: 94 
