In [2]:
from __future__ import print_function, division

import torch
import torch.nn as nn
import torch.optim as optim
from torch.optim import lr_scheduler
import numpy as np
import torchvision
from torchvision import datasets, models, transforms
import matplotlib.pyplot as plt
import time
import os
import copy
from PIL import Image

plt.ion()

In [5]:
# Sanity check: preview one test image to confirm the dataset is readable.
# `Image` is already imported in the first cell, so it is not re-imported here.
# Ending the cell with the image object lets Jupyter render it inline; `im.show()`
# instead hands the picture to an external viewer, which typically shows nothing
# on a remote or headless kernel.
im = Image.open('data/test/glass/glass102.jpg')
im

In [4]:
# Print the kernel's working directory; the data/ paths used in this notebook are relative to it.
!pwd

/home/ubuntu/trash-recycling-classifier


In [6]:
# Per-channel normalisation shared by every split's pipeline.
# These values match the ImageNet statistics documented for torchvision's
# pretrained models (a pretrained ResNet-50 is loaded later in this notebook).
channel_mean = [0.485, 0.456, 0.406]
channel_std = [0.229, 0.224, 0.225]
std_norm = transforms.Normalize(mean=channel_mean, std=channel_std)

In [11]:
# Per-split preprocessing pipelines; each one ends with ToTensor followed by std_norm.

# Training: random resized crop to 64 px plus a random horizontal flip.
train_transform = transforms.Compose([
    transforms.RandomResizedCrop(64),
    transforms.RandomHorizontalFlip(),
    transforms.ToTensor(),
    std_norm,
])

# Validation: Resize(64) followed by a 64 px centre crop.
valid_transform = transforms.Compose([
    transforms.Resize(64),
    transforms.CenterCrop(64),
    transforms.ToTensor(),
    std_norm,
])

# Test: resize directly to (64, 64), with no crop step.
test_transform = transforms.Compose([
    transforms.Resize(size=(64, 64)),
    transforms.ToTensor(),
    std_norm,
])

img_transforms = {
    'train': train_transform,
    'valid': valid_transform,
    'test': test_transform,
}

In [8]:
# Training split: images are read from data/train/ and passed through the 'train' pipeline.
train_data_path = "data/train/"
train_data = datasets.ImageFolder(
    root=train_data_path,
    transform=img_transforms['train'],
)

In [16]:
# Validation split: images are read from data/valid/ and passed through the 'valid' pipeline.
# The path variable is `valid_data_path`; the previous reference to `val_data_path`
# pointed at a name that is never defined and raised NameError on a fresh kernel.
valid_data_path = "data/valid/"
valid_data = torchvision.datasets.ImageFolder(root=valid_data_path, transform=img_transforms['valid'])

In [17]:
# Test split: images are read from data/test/ and passed through the 'test' pipeline.
test_data_path = "data/test/"
test_data = datasets.ImageFolder(
    root=test_data_path,
    transform=img_transforms['test'],
)

In [18]:
# DataLoader settings shared by all splits: samples per batch, and the number of
# loader worker processes (0 means batches are loaded in the main process).
batch_size, num_workers = 64, 0

In [19]:
# One DataLoader per split. All three share batch_size/num_workers; only the
# training loader shuffles its samples.
shared_loader_args = {'batch_size': batch_size, 'num_workers': num_workers}

train_loader = torch.utils.data.DataLoader(train_data, shuffle=True, **shared_loader_args)
valid_loader = torch.utils.data.DataLoader(valid_data, shuffle=False, **shared_loader_args)
test_loader = torch.utils.data.DataLoader(test_data, shuffle=False, **shared_loader_args)

In [20]:
# Look-up table from split name to its DataLoader.
loaders = dict(train=train_loader, valid=valid_loader, test=test_loader)

In [23]:
# Report how many images each split contains (size of the dataset behind each loader).
num_train_images = len(train_loader.dataset)
num_valid_images = len(valid_loader.dataset)
num_test_images = len(test_loader.dataset)

print(f'Num. of Images in Training Set: {num_train_images}')
print(f'Num. of Images in Validation Set: {num_valid_images}')
print(f'Num. of Images in Testing Set: {num_test_images}')

Num. of Images in Training Set: 1766
Num. of Images in Validation Set: 378
Num. of Images in Testing Set: 383


In [24]:
# Run on the GPU when CUDA is available, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

In [25]:
# Load ResNet-50 with pretrained weights; they are downloaded to the local torch
# cache on first use (see the download log in this cell's output).
# NOTE(review): newer torchvision releases replace `pretrained=` with `weights=`;
# confirm the installed version before changing this argument.
transfer_model = models.resnet50(pretrained=True)

Downloading: "https://download.pytorch.org/models/resnet50-19c8e357.pth" to /home/ubuntu/.cache/torch/checkpoints/resnet50-19c8e357.pth
100%|██████████| 97.8M/97.8M [00:00<00:00, 137MB/s]


In [35]:
# Echo the module tree to inspect layer names; the final `fc` layer is replaced further down.
transfer_model

ResNet(
  (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
  (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (relu): ReLU(inplace=True)
  (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
  (layer1): Sequential(
    (0): Bottleneck(
      (conv1): Conv2d(64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (bn3): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
      (downsample): Sequential(
        (0): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 

In [36]:
# Freeze every parameter whose name does not contain "bn"; parameters whose name
# does contain it are left trainable.
# NOTE(review): the match is purely name-based, so any normalisation layer that is
# not named bn* (e.g. one nested inside a `downsample` Sequential) is frozen too --
# confirm this is intended.
for name, param in transfer_model.named_parameters():
    if "bn" in name:
        continue
    param.requires_grad = False

In [38]:
# Replace the classification head with a fresh linear layer producing 6 outputs.
# The input width is read from the existing head instead of hard-coding 2048, so
# the cell keeps working if a backbone with a different feature size is loaded.
# The new layer is created after the freezing loop, so its parameters keep
# requires_grad=True.
# Alternative head left unused:
#   Linear(in_features, 500) -> ReLU -> Dropout -> Linear(500, 6)
transfer_model.fc = nn.Linear(transfer_model.fc.in_features, 6, bias=True)

In [None]:
# Unused alternative (kept for reference): optimise only the new classifier head with SGD.
# criterion_transfer = nn.CrossEntropyLoss()
# optimizer_transfer = optim.SGD(transfer_model.fc.parameters(), lr=0.001)

In [42]:
def train(model, optimizer, loss_fn, train_loader, valid_loader, epochs=20, device="cpu"):
    """Train `model` and print loss/accuracy on the validation data after every epoch.

    Args:
        model: module to optimise. It is NOT moved to `device` here; the caller
            must already have placed it on the device the batches are sent to.
        optimizer: optimizer whose `zero_grad()` and `step()` are called once per
            training batch.
        loss_fn: callable `loss_fn(output, targets)` returning a scalar tensor.
            The value is multiplied by the batch size before averaging, i.e. it is
            assumed to be a per-batch mean.
        train_loader: iterable of `(inputs, targets)` batches used for training.
        valid_loader: iterable of `(inputs, targets)` batches used for evaluation.
        epochs: number of passes over `train_loader`.
        device: device the batches are moved to before the forward pass.

    Returns:
        None. One summary line per epoch is printed.
    """
    for epoch in range(epochs):
        # ---- training pass ----
        model.train()
        training_loss = 0.0
        num_train = 0
        for inputs, targets in train_loader:
            inputs = inputs.to(device)
            targets = targets.to(device)
            optimizer.zero_grad()
            output = model(inputs)
            loss = loss_fn(output, targets)
            loss.backward()
            optimizer.step()
            batch_len = inputs.size(0)
            training_loss += loss.item() * batch_len
            num_train += batch_len
        # Average over the samples actually seen, so the figure stays correct even
        # when the loader drops or subsamples part of its dataset.
        training_loss /= max(num_train, 1)

        # ---- validation pass ----
        model.eval()
        valid_loss = 0.0
        num_correct = 0
        num_examples = 0
        # No gradients are needed for evaluation; disabling autograd avoids building
        # a graph for every validation batch.
        with torch.no_grad():
            for inputs, targets in valid_loader:
                inputs = inputs.to(device)
                targets = targets.to(device)
                output = model(inputs)
                loss = loss_fn(output, targets)
                batch_len = inputs.size(0)
                valid_loss += loss.item() * batch_len
                # Softmax is monotonic, so the arg-max of the raw scores already
                # gives the predicted class.
                predictions = output.argmax(dim=1)
                num_correct += (predictions == targets).sum().item()
                num_examples += batch_len
        valid_loss /= max(num_examples, 1)
        # Guard against an empty validation loader instead of dividing by zero.
        accuracy = num_correct / num_examples if num_examples else 0.0

        print('Epoch: {}, Training Loss: {:.2f}, Validation Loss: {:.2f}, accuracy = {:.2f}'.format(
            epoch, training_loss, valid_loss, accuracy))

In [43]:
# Place the model on the selected device, then build the optimizer over its parameters.
# Every parameter is handed to Adam; frozen ones (requires_grad=False) never receive
# a gradient, so the optimizer leaves them unchanged.
transfer_model = transfer_model.to(device)
optimizer = optim.Adam(params=transfer_model.parameters(), lr=1e-3)

In [45]:
# Fine-tune for 15 epochs with cross-entropy loss; per-epoch metrics are printed below.
criterion = torch.nn.CrossEntropyLoss()
train(
    transfer_model,
    optimizer,
    criterion,
    train_loader,
    valid_loader,
    epochs=15,
    device=device,
)



Epoch: 0, Training Loss: 0.55, Validation Loss: 0.65, accuracy = 0.78
Epoch: 1, Training Loss: 0.49, Validation Loss: 0.59, accuracy = 0.81
Epoch: 2, Training Loss: 0.47, Validation Loss: 0.61, accuracy = 0.79
Epoch: 3, Training Loss: 0.46, Validation Loss: 0.65, accuracy = 0.79
Epoch: 4, Training Loss: 0.45, Validation Loss: 0.60, accuracy = 0.80
Epoch: 5, Training Loss: 0.41, Validation Loss: 0.57, accuracy = 0.82
Epoch: 6, Training Loss: 0.40, Validation Loss: 0.56, accuracy = 0.84
Epoch: 7, Training Loss: 0.41, Validation Loss: 0.52, accuracy = 0.85
Epoch: 8, Training Loss: 0.37, Validation Loss: 0.51, accuracy = 0.84
Epoch: 9, Training Loss: 0.34, Validation Loss: 0.53, accuracy = 0.84
Epoch: 10, Training Loss: 0.33, Validation Loss: 0.55, accuracy = 0.83
Epoch: 11, Training Loss: 0.37, Validation Loss: 0.52, accuracy = 0.85
Epoch: 12, Training Loss: 0.33, Validation Loss: 0.54, accuracy = 0.83
Epoch: 13, Training Loss: 0.34, Validation Loss: 0.54, accuracy = 0.84
Epoch: 14, Train