# Feedforward Neural Network

### Problems with Logistic Regression

In [2]:
import torch
import torch.nn as nn

In [3]:
class LogisticRegressionModel(nn.Module):
    def __init__(self, input_size, num_classes):
        super(LogisticRegressionModel, self).__init__()
        self.linear = nn.Linear(input_dim, output_dim)
        
    def forward(self, x):
        out = self.linear(x)

In [4]:
input_dim = 28*28
output_dim = 10

model = LogisticRegressionModel(input_dim, output_dim)

In [5]:
print(model)

LogisticRegressionModel(
  (linear): Linear(in_features=784, out_features=10, bias=True)
)


### Building a feedforward Neural Network with Pytorch

#### Model A: 1 Hidden layer Feedforward Neural Network (Sigmoid Activation)

##### Steps

<li> Step 1: Load Dataset
<li> Step 2: Make Dataset Iterable
<li> Step 3: Create Model Class
<li> Step 4: Instantiate Model Class
<li> Step 5: Instantiate Loss Class
<li> Step 6: Instantiate Optimizer Class
<li> Step 7: Train Model


###### Step 1: Load Dataset


In [6]:
import torch
import torch.nn as nn
import torchvision.transforms as transforms
import torchvision.datasets as dsets
from torch.autograd import Variable


In [7]:
train_dataset = dsets.MNIST(root = './data',
                            train = True,
                            transform = transforms.ToTensor(),
                            download = True)

test_dataset = dsets.MNIST(root = './data',
                           train = False,
                           transform = transforms.ToTensor())

###### Step 2: Make Dataset Iterable

In [31]:
batch_size = 100
n_iters = 3000

num_epochs = n_iters / (len(train_dataset) / batch_size)
num_epochs = int(num_epochs)

train_loader = torch.utils.data.DataLoader(dataset=train_dataset,
                                           batch_size=batch_size,
                                           shuffle=True)

test_loader = torch.utils.data.DataLoader(dataset=test_dataset,
                                        batch_size=batch_size,
                                        shuffle=False)

###### Step 3: Create Model Class

In [32]:
class FeedforwardNeuralNetModel(nn.Module):
    def __init__(self, input_size, hidden_size, num_classes):
        super(FeedforwardNeuralNetModel, self).__init__()
        # Linear fnction
        self.fn1 = nn.Linear(input_dim, hidden_dim)
        # Non-linearity
        self.sigmoid = nn.Sigmoid()
        # Linear Function (Readout)
        self.fn2 = nn.Linear(hidden_dim, output_dim)
        
    def forward(self, x):
        out = self.fn1(x)
        out = self.sigmoid(out)
        out = self.fn2(out)
        return out

###### Step 4: Instantiate Model Class

In [33]:
input_dim = 28 * 28
hidden_dim = 100
output_dim = 10

model = FeedforwardNeuralNetModel(input_dim, hidden_dim, output_dim)

###### Step 5: Instantiate Loss Class

In [34]:
criterion = nn.CrossEntropyLoss()

###### Step 6: Instantiate Optimizer Class

In [35]:
learning_rate = 0.1
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

**Parameters In-Depth**



In [36]:
print(model.parameters())

print(len(list(model.parameters())))

print(list(model.parameters())[0].size())

print(list(model.parameters())[1].size())

print(list(model.parameters())[2].size())

print(list(model.parameters())[3].size())

<generator object Module.parameters at 0x000001DA33041F68>
4
torch.Size([100, 784])
torch.Size([100])
torch.Size([10, 100])
torch.Size([10])


###### Step 7: Train Model

Process
1. Convert input/labels to variables
2. Clear gradient buffers
3. Get output given inputs
4. Get loss
5. Get gradients w.r.t. parameters
6. Update parameters using gradients
    * parameters = parameters - leaarning_rate * parameter_gradients
7. Repeat

In [41]:
iter = 0

for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        
        images = Variable(images.view(-1, 28 * 28))
        labels = Variable(labels)
        
        optimizer.zero_grad()
        
        outputs = model(images)
        
        loss = criterion(outputs, labels)
        
        loss.backward()
        
        optimizer.step()
        
        iter += 1
        
        if iter % 500 == 0:
            correct = 0
            total = 0
            
            for images, labels in test_loader:
                
                images = Variable(images.view(-1, 28 * 28))
                outputs = model(images)
                
                _, predicted = torch.max(outputs.data, 1)
                
                total += labels.size(0)
                
                correct += (predicted == labels).sum()
                
            accuracy = 100 * correct / total
            
            print('Iterations: {}, Loss: {}, Accuracy: {}'.format(iter, loss.data, accuracy.float()))

Iterations: 500, Loss: 0.3565400242805481, Accuracy: 93.0
Iterations: 1000, Loss: 0.214106485247612, Accuracy: 93.0
Iterations: 1500, Loss: 0.25565993785858154, Accuracy: 93.0
Iterations: 2000, Loss: 0.14567551016807556, Accuracy: 93.0
Iterations: 2500, Loss: 0.3261256515979767, Accuracy: 94.0
Iterations: 3000, Loss: 0.16373074054718018, Accuracy: 94.0


#### Model B: 1 Hidden layer Feedforward Neural Network (TanH Activation)

##### Steps

<li> Step 1: Load Dataset
<li> Step 2: Make Dataset Iterable
    <b><li> Step 3: Create Model Class</b>
<li> Step 4: Instantiate Model Class
<li> Step 5: Instantiate Loss Class
<li> Step 6: Instantiate Optimizer Class
<li> Step 7: Train Model

In [None]:
import torch
import torch.nn as nn
import torchvision.transforms as transforms
import torchvision.datasets as dsets
from torch.autograd import Variable

'''
Step 1: Load Dataset
'''
train_dataset = dsets.MNIST(root = './data',
                            train = True,
                            transform = transforms.ToTensor(),
                            download = True)

test_dataset = dsets.MNIST(root = './data',
                           train = False,
                           transform = transforms.ToTensor())

'''
Step 2: Make Dataset Iterable
'''
batch_size = 100
n_iters = 3000

num_epochs = n_iters / (len(train_dataset) / batch_size)
num_epochs = int(num_epochs)

train_loader = torch.utils.data.DataLoader(dataset=train_dataset,
                                           batch_size=batch_size,
                                           shuffle=True)

test_loader = torch.utils.data.DataLoader(dataset=test_dataset,
                                        batch_size=batch_size,
                                        shuffle=False)
'''
Step 3: Create Model Class
'''
class FeedforwardNeuralNetModel(nn.Module):
    def __init__(self, input_size, hidden_size, num_classes):
        super(FeedforwardNeuralNetModel, self).__init__()
        # Linear fnction
        self.fn1 = nn.Linear(input_dim, hidden_dim)
        # Non-linearity
        self.sigmoid = nn.Tanh()
        # Linear Function (Readout)
        self.fn2 = nn.Linear(hidden_dim, output_dim)
        
    def forward(self, x):
        out = self.fn1(x)
        out = self.sigmoid(out)
        out = self.fn2(out)
        return out
'''
Step 4: Instantiate Model Class
'''
input_dim = 28 * 28
hidden_dim = 100
output_dim = 10

model = FeedforwardNeuralNetModel(input_dim, hidden_dim, output_dim)
'''
Step 5: Instantiate Loss Class
'''
criterion = nn.CrossEntropyLoss()

'''
Step 6: Instantiate Optimizer Class
'''
learning_rate = 0.1
optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

'''
Step 7: Train Model
'''
iter = 0

for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        
        images = Variable(images.view(-1, 28 * 28))
        labels = Variable(labels)
        
        optimizer.zero_grad()
        
        outputs = model(images)
        
        loss = criterion(outputs, labels)
        
        loss.backward()
        
        optimizer.step()
        
        iter += 1
        
        if iter % 500 == 0:
            correct = 0
            total = 0
            
            for images, labels in test_loader:
                
                images = Variable(images.view(-1, 28 * 28))
                outputs = model(images)
                
                _, predicted = torch.max(outputs.data, 1)
                
                total += labels.size(0)
                
                correct += (predicted == labels).sum()
                
            accuracy = 100 * correct / total
            
            print('Iterations: {}, Loss: {}, Accuracy: {}'.format(iter, loss.data, accuracy.float()))