# Tutorial pytorch (DNN Feedfoward)

## Importando dependências

In [4]:
import torch
import torch.nn as nn
import torchvision.transforms as transforms
import torchvision.datasets as dsets
from torch.autograd import Variable

## Carregando dataset

In [5]:
train_dataset = dsets.MNIST(root='./data', 
                            train=True, 
                            transform=transforms.ToTensor(),
                            download=True)

test_dataset = dsets.MNIST(root='./data', 
                           train=False, 
                           transform=transforms.ToTensor())

## Preparando dataset (Interativo)

In [6]:
batch_size = 100
n_iters = 3000
num_epochs = n_iters / (len(train_dataset) / batch_size)
num_epochs = int(num_epochs)

train_loader = torch.utils.data.DataLoader(dataset=train_dataset, 
                                           batch_size=batch_size, 
                                           shuffle=True)

test_loader = torch.utils.data.DataLoader(dataset=test_dataset, 
                                          batch_size=batch_size, 
                                          shuffle=False)

## Criando classe do modelo

In [7]:
class FeedforwardNeuralNetModel(nn.Module):
    def __init__(self, input_dim, hidden_dim, output_dim):
        super(FeedforwardNeuralNetModel, self).__init__()
        
        self.fc1 = nn.Linear(input_dim, hidden_dim) 
        self.relu1 = nn.ReLU()
        
        self.fc2 = nn.Linear(hidden_dim, hidden_dim)
        self.relu2 = nn.ReLU()
        
        self.fc3 = nn.Linear(hidden_dim, hidden_dim)
        self.relu3 = nn.ReLU()
        
        self.fc4 = nn.Linear(hidden_dim, output_dim)  
    
    def forward(self, x):
        out = self.fc1(x)
        out = self.relu1(out)
        
        out = self.fc2(out)
        out = self.relu2(out)
        
        out = self.fc3(out)
        out = self.relu3(out)
        
        out = self.fc4(out)
        return out

## Inicializando o modelo

- Input dims: 784
    - Tamanho da imagem: 28 x 28 = 784
- Saida dims: 10 (digitos)
- Hidden: 100 (neuronios)
    - Número de ativações

In [8]:
input_dim = 28*28
hidden_dim = 100
output_dim = 10

model = FeedforwardNeuralNetModel(input_dim, hidden_dim, output_dim)

## Inicializando medida de erro (Entropia Cruzada)

In [9]:
criterion = nn.CrossEntropyLoss()

## Inicializando o otimizado (Gradiente Descendente Estocástico)

In [10]:
learning_rate = 0.1

optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

In [19]:
print(model.parameters())
print(len(list(model.parameters())))
print(list(model.parameters())[0].size())
print(list(model.parameters())[1].size())
print(list(model.parameters())[2].size())
print(list(model.parameters())[3].size())
print(list(model.parameters())[4].size())
print(list(model.parameters())[5].size())
print(list(model.parameters())[6].size())
print(list(model.parameters())[7].size())

<generator object Module.parameters at 0x7fdda47fdf10>
8
torch.Size([100, 784])
torch.Size([100])
torch.Size([100, 100])
torch.Size([100])
torch.Size([100, 100])
torch.Size([100])
torch.Size([10, 100])
torch.Size([10])


## Treinando o modelo

In [11]:
iter = 0
for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        

        if torch.cuda.is_available():
            images = Variable(images.view(-1, 28*28))
            labels = Variable(labels)
        else:
            images = Variable(images.view(-1, 28*28))
            labels = Variable(labels)
        

        optimizer.zero_grad()
        outputs = model(images)
        
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        
        iter += 1
        
        if iter % 500 == 0: 
            correct = 0
            total = 0
            for images, labels in test_loader:
                images = Variable(images.view(-1, 28*28))
                
                
                outputs = model(images)
                _, predicted = torch.max(outputs.data, 1)
                total += labels.size(0)
                
                correct += (predicted.cpu() == labels.cpu()).sum()
            
            accuracy = 100 * correct / total
            
            print('Iteration: {}. Loss: {}. Accuracy: {}'.format(iter, loss.data[0], accuracy))



Iteration: 500. Loss: 0.2674975097179413. Accuracy: 90
Iteration: 1000. Loss: 0.131819948554039. Accuracy: 94
Iteration: 1500. Loss: 0.18804334104061127. Accuracy: 95
Iteration: 2000. Loss: 0.02799047902226448. Accuracy: 96
Iteration: 2500. Loss: 0.03164204582571983. Accuracy: 96
Iteration: 3000. Loss: 0.06487608700990677. Accuracy: 96
