# LABORATORIO 02
## Nombre: Tumiri Huanca Alex
### Desarrolle lo siguiente:
- Busque un dataset con datos suficientemente complejos como para ser procesados por una CNN, que condicione una clasificación de al menos 5 clases.
- Cree un mecanismo personalizado para la lectura del dataset y su adecuación a un modelo CNN en PyTorch.
- Construya un modelo (CNN) para procesar los datos preparados previamente, considerando varias alternativas en la configuración de la estructura de la CNN.
- Reporte cuál es el mejor modelo que construyó, explicando la arquitectura y los hiperparámetros asumidos.

### Se trabajó con un dataset de animales con 5 clases, creado por mí mismo
![title](https://www.diegocalvo.es/wp-content/uploads/2017/07/red-neuronal-convolucional-arquitectura.png)

In [1]:
# Imports
import torch
import torchvision # torch package for vision related things
import torch.nn.functional as F  # Parameterless functions, like (some) activation functions
import torchvision.datasets as datasets  # Standard datasets
import torchvision.transforms as transforms  # Transformations we can perform on our dataset for augmentation
from torch import optim  # For optimizers like SGD, Adam, etc.
from torch import nn  # All neural network modules
from torch.utils.data import DataLoader  # Gives easier dataset managment by creating mini batches etc.
from tqdm import tqdm  # For nice progress bar!
from torch.utils.data import (Dataset,DataLoader,) 
import pandas as pd
import os
from skimage import io

In [9]:
# Simple CNN
class CNN(nn.Module):
    """Small two-stage convolutional classifier.

    Architecture: conv(3x3, 6 channels) -> ReLU -> max-pool(2x2) ->
    conv(3x3, 12 channels) -> ReLU -> max-pool(2x2) -> flatten -> linear.

    Both convolutions use stride 1 and padding 1, so they keep the spatial
    size unchanged; each 2x2/stride-2 pooling step halves height and width
    (rounding down). The linear layer therefore sees
    ``12 * (height // 4) * (width // 4)`` features.

    Args:
        in_channels: Number of channels of the input images.
        num_classes: Number of output scores produced per image.
        input_size: Spatial size of the input images, either a single int
            for square images or a ``(height, width)`` pair. The default
            ``(300, 300)`` reproduces the previously hard-coded
            ``12 * 75 * 75`` classifier input.

    Raises:
        ValueError: If ``input_size`` is too small to survive the two
            pooling steps (either side smaller than 4 pixels).
    """

    def __init__(self, in_channels=1, num_classes=1, input_size=(300, 300)):
        super().__init__()

        if isinstance(input_size, int):
            input_size = (input_size, input_size)
        height, width = input_size

        # Two stride-2 poolings: each one floors the size to half.
        pooled_height = (height // 2) // 2
        pooled_width = (width // 2) // 2
        if pooled_height < 1 or pooled_width < 1:
            raise ValueError(
                f"input_size {input_size} is too small: both sides must be "
                "at least 4 pixels"
            )

        # First convolutional stage
        self.conv1 = nn.Conv2d(
            in_channels=in_channels,
            out_channels=6,
            kernel_size=(3, 3),
            stride=(1, 1),
            padding=(1, 1),
        )

        # The same parameterless pooling layer is reused after both stages.
        self.pool = nn.MaxPool2d(kernel_size=(2, 2), stride=(2, 2))

        # Second convolutional stage
        self.conv2 = nn.Conv2d(
            in_channels=6,
            out_channels=12,
            kernel_size=(3, 3),
            stride=(1, 1),
            padding=(1, 1),
        )

        # 12 is the channel count produced by conv2.
        self.fc1 = nn.Linear(12 * pooled_height * pooled_width, num_classes)

    def forward(self, x):
        """Return the raw class scores (logits) for a batch of images.

        ``x`` is indexed as (batch, channels, height, width) by the layers
        used here; its spatial size must match the ``input_size`` given at
        construction, otherwise the final linear layer rejects it.
        """
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        # Flatten everything except the batch dimension.
        x = x.reshape(x.shape[0], -1)
        return self.fc1(x)

# model = CNN()
# x = torch.rand(64, 1, 28, 28)
# print(x)
# print(model(x).shape)
# # Set device
class Dataset_treatment(Dataset):
    """Image dataset described by a CSV annotation file.

    Each CSV row describes one sample: column 0 holds the image file name
    (joined onto ``root_dir``) and column 1 holds a value convertible to an
    integer class label.

    Args:
        csv_file: Path (or anything ``pandas.read_csv`` accepts) of the
            annotation table.
        root_dir: Directory that contains the image files.
        transform: Optional callable applied to every loaded image.
    """

    def __init__(self, csv_file, root_dir, transform=None):
        self.root_dir = root_dir
        self.transform = transform
        self.annotations = pd.read_csv(csv_file)

    def __len__(self):
        """Return the number of annotated samples."""
        return len(self.annotations)

    def __getitem__(self, index):
        """Load sample ``index`` and return it as ``(image, label)``.

        The image is read from disk on every access; the label is returned
        as a 0-dimensional integer tensor.
        """
        file_name = self.annotations.iloc[index, 0]
        sample = io.imread(os.path.join(self.root_dir, file_name))
        target = torch.tensor(int(self.annotations.iloc[index, 1]))

        if not self.transform:
            return (sample, target)
        return (self.transform(sample), target)


# Run on the GPU when one is available, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Hyperparameters
in_channels = 3  # presumably RGB images -- confirm against the dataset files
num_classes = 5
learning_rate = 0.001
batch_size = 32
num_epochs = 500


# Load Data
dataset = Dataset_treatment(
    csv_file="animals.csv",
    root_dir="dataset",
    transform=transforms.ToTensor(),
)

# Split the samples into two halves (train / test). The sizes are derived
# from the dataset length instead of being hard-coded, because random_split
# raises when the requested lengths do not add up to len(dataset). For the
# 736 samples this script was originally written for, this still yields the
# same 368 / 368 split.
train_size = len(dataset) // 2
test_size = len(dataset) - train_size
train_set, test_set = torch.utils.data.random_split(dataset, [train_size, test_size])
train_loader = DataLoader(dataset=train_set, batch_size=batch_size, shuffle=True)
test_loader = DataLoader(dataset=test_set, batch_size=batch_size, shuffle=True)

# Initialize network
model = CNN(in_channels=in_channels, num_classes=num_classes).to(device)

# Loss and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

# Train Network
for epoch in range(num_epochs):
    for batch_idx, (data, targets) in enumerate(tqdm(train_loader)):
        # Get data to cuda if possible
        data = data.to(device=device)
        targets = targets.to(device=device)

        # forward
        scores = model(data)
        loss = criterion(scores, targets)

        # backward: clear gradients left over from the previous step first
        optimizer.zero_grad()
        loss.backward()

        # gradient descent or adam step
        optimizer.step()

# Check accuracy on a data loader to see how good our model is
def check_accuracy(loader, model):
    """Return the fraction of samples in ``loader`` that ``model`` classifies correctly.

    The model is switched to evaluation mode while scoring and gradients are
    disabled. Afterwards the model is put back into whichever mode
    (training or evaluation) it was in before the call, even if scoring
    raises.

    Args:
        loader: Iterable yielding ``(inputs, labels)`` batches.
        model: Module mapping a batch of inputs to per-class scores with
            the class dimension at index 1.

    Returns:
        A 0-dimensional tensor holding ``correct / total``.

    Raises:
        ValueError: If ``loader`` yields no samples, so no accuracy can be
            computed.
    """
    # Move batches to the device the model actually lives on rather than
    # relying on a module-level ``device`` variable; a parameterless model
    # is evaluated on the CPU.
    first_param = next(model.parameters(), None)
    eval_device = first_param.device if first_param is not None else torch.device("cpu")

    was_training = model.training
    num_correct = 0
    num_samples = 0
    model.eval()

    try:
        with torch.no_grad():
            for x, y in loader:
                x = x.to(device=eval_device)
                y = y.to(device=eval_device)

                scores = model(x)
                # max over dim 1 returns (values, indices); the indices are
                # the predicted class ids.
                _, predictions = scores.max(1)
                num_correct += (predictions == y).sum()
                num_samples += predictions.size(0)
    finally:
        # Restore the caller's mode instead of forcing training mode.
        model.train(was_training)

    if num_samples == 0:
        raise ValueError("check_accuracy received a loader that yielded no samples")
    return num_correct / num_samples


# Report the final accuracy (as a percentage) on each split, training first.
train_accuracy = check_accuracy(train_loader, model)
print(f"Accuracy on training set: {train_accuracy*100:.2f}")
test_accuracy = check_accuracy(test_loader, model)
print(f"Accuracy on test set: {test_accuracy*100:.2f}")

100%|██████████| 12/12 [00:03<00:00,  3.72it/s]
100%|██████████| 12/12 [00:03<00:00,  3.82it/s]
100%|██████████| 12/12 [00:02<00:00,  4.27it/s]
100%|██████████| 12/12 [00:02<00:00,  4.19it/s]
100%|██████████| 12/12 [00:02<00:00,  4.11it/s]
100%|██████████| 12/12 [00:02<00:00,  4.29it/s]
100%|██████████| 12/12 [00:02<00:00,  4.21it/s]
100%|██████████| 12/12 [00:02<00:00,  4.23it/s]
100%|██████████| 12/12 [00:02<00:00,  4.07it/s]
100%|██████████| 12/12 [00:02<00:00,  4.05it/s]
100%|██████████| 12/12 [00:02<00:00,  4.27it/s]
100%|██████████| 12/12 [00:02<00:00,  4.24it/s]
100%|██████████| 12/12 [00:02<00:00,  4.30it/s]
100%|██████████| 12/12 [00:02<00:00,  4.24it/s]
100%|██████████| 12/12 [00:02<00:00,  4.30it/s]
100%|██████████| 12/12 [00:02<00:00,  4.01it/s]
100%|██████████| 12/12 [00:02<00:00,  4.23it/s]
100%|██████████| 12/12 [00:02<00:00,  4.21it/s]
100%|██████████| 12/12 [00:02<00:00,  4.32it/s]
100%|██████████| 12/12 [00:02<00:00,  4.19it/s]
100%|██████████| 12/12 [00:02<00:00,  4.

100%|██████████| 12/12 [00:02<00:00,  4.33it/s]
100%|██████████| 12/12 [00:02<00:00,  4.37it/s]
100%|██████████| 12/12 [00:02<00:00,  4.37it/s]
100%|██████████| 12/12 [00:02<00:00,  4.28it/s]
100%|██████████| 12/12 [00:02<00:00,  4.28it/s]
100%|██████████| 12/12 [00:02<00:00,  4.40it/s]
100%|██████████| 12/12 [00:02<00:00,  4.24it/s]
100%|██████████| 12/12 [00:02<00:00,  4.49it/s]
100%|██████████| 12/12 [00:02<00:00,  4.38it/s]
100%|██████████| 12/12 [00:02<00:00,  4.14it/s]
100%|██████████| 12/12 [00:02<00:00,  4.36it/s]
100%|██████████| 12/12 [00:02<00:00,  4.31it/s]
100%|██████████| 12/12 [00:03<00:00,  3.90it/s]
100%|██████████| 12/12 [00:02<00:00,  4.28it/s]
100%|██████████| 12/12 [00:02<00:00,  4.40it/s]
100%|██████████| 12/12 [00:02<00:00,  4.15it/s]
100%|██████████| 12/12 [00:02<00:00,  4.40it/s]
100%|██████████| 12/12 [00:02<00:00,  4.39it/s]
100%|██████████| 12/12 [00:02<00:00,  4.44it/s]
100%|██████████| 12/12 [00:02<00:00,  4.31it/s]
100%|██████████| 12/12 [00:02<00:00,  4.

100%|██████████| 12/12 [00:02<00:00,  4.35it/s]
100%|██████████| 12/12 [00:03<00:00,  3.84it/s]
100%|██████████| 12/12 [00:03<00:00,  3.93it/s]
100%|██████████| 12/12 [03:30<00:00, 17.55s/it]
100%|██████████| 12/12 [00:03<00:00,  3.31it/s]
100%|██████████| 12/12 [00:02<00:00,  4.38it/s]
100%|██████████| 12/12 [00:03<00:00,  3.61it/s]
100%|██████████| 12/12 [00:02<00:00,  4.15it/s]
100%|██████████| 12/12 [00:02<00:00,  4.67it/s]
100%|██████████| 12/12 [00:02<00:00,  4.06it/s]
100%|██████████| 12/12 [00:03<00:00,  3.72it/s]
100%|██████████| 12/12 [00:03<00:00,  3.65it/s]
100%|██████████| 12/12 [00:03<00:00,  3.52it/s]
100%|██████████| 12/12 [00:03<00:00,  3.41it/s]
100%|██████████| 12/12 [00:03<00:00,  3.49it/s]
100%|██████████| 12/12 [00:02<00:00,  4.11it/s]
100%|██████████| 12/12 [00:03<00:00,  3.78it/s]
100%|██████████| 12/12 [00:03<00:00,  3.85it/s]
100%|██████████| 12/12 [00:02<00:00,  4.13it/s]
100%|██████████| 12/12 [00:03<00:00,  3.42it/s]
100%|██████████| 12/12 [00:03<00:00,  3.

Accuracy on training set: 100.00
Accuracy on test set: 53.26
