In [1]:
from __future__ import print_function, division

import torch
import torch.nn as nn
import torch.optim as optim
from torch.optim import lr_scheduler
import numpy as np
import torchvision
from torchvision import datasets, models, transforms
import matplotlib.pyplot as plt
import time
import os
import copy
import cv2

In [2]:
def show(image):
    cv2.imshow("title",image)
    cv2.waitKey(0)
    cv2.destroyAllWindows()

In [3]:
normalize = transforms.Normalize(
   mean=[0.485, 0.456, 0.406],
   std=[0.229, 0.224, 0.225]
)
preprocess = transforms.Compose([
   transforms.Resize((224,224)),
   transforms.ToTensor(),
   normalize
])

In [6]:
DATA_DIR = 'data/sample_dir'
img_dataset = datasets.ImageFolder(root = DATA_DIR , transform = preprocess)

In [7]:
img_dataset

Dataset ImageFolder
    Number of datapoints: 514
    Root location: data/sample_dir

In [15]:
DATA_DIR = 'data/sample_dir'
img_dataset = datasets.ImageFolder(root = DATA_DIR , transform = preprocess)
train_data, val_data = torch.utils.data.random_split(img_dataset,[360,154])

dataloaders = {'train': torch.utils.data.DataLoader(train_data, batch_size=4, shuffle=True, num_workers=4),
               'val' : torch.utils.data.DataLoader(val_data, batch_size=4, shuffle=True, num_workers=4)}

dataset_sizes = {'train' : len(train_data), 'val' : len(val_data)}
class_names = img_dataset.classes

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

In [16]:
# show first image
inp = img_dataset[0][0].numpy().transpose((1, 2, 0))
mean = np.array([0.485, 0.456, 0.406])
std = np.array([0.229, 0.224, 0.225])
inp = std * inp + mean
inp_copy = np.uint8(inp*255)
inp_copy = cv2.cvtColor(inp_copy,cv2.COLOR_BGR2RGB)

show(inp_copy)

In [17]:
def train_model(model, criterion, optimizer, scheduler, num_epochs=25):
    since = time.time()

    best_model_wts = copy.deepcopy(model.state_dict())
    best_acc = 0.0

    for epoch in range(num_epochs):
        print('Epoch {}/{}'.format(epoch, num_epochs - 1))
        print('-' * 10)

        # Each epoch has a training and validation phase
        for phase in ['train', 'val']:
            if phase == 'train':
                scheduler.step()
                model.train()  # Set model to training mode
            else:
                model.eval()   # Set model to evaluate mode

            running_loss = 0.0
            running_corrects = 0

            # Iterate over data.
            for inputs, labels in dataloaders[phase]:
                inputs = inputs.to(device)
                labels = labels.to(device)

                # zero the parameter gradients
                optimizer.zero_grad()

                # forward
                # track history if only in train
                with torch.set_grad_enabled(phase == 'train'):
                    outputs = model(inputs)
                    _, preds = torch.max(outputs, 1)
                    loss = criterion(outputs, labels)

                    # backward + optimize only if in training phase
                    if phase == 'train':
                        loss.backward()
                        optimizer.step()

                # statistics
                running_loss += loss.item() * inputs.size(0)
                running_corrects += torch.sum(preds == labels.data)

            epoch_loss = running_loss / dataset_sizes[phase]
            epoch_acc = running_corrects.double() / dataset_sizes[phase]

            print('{} Loss: {:.4f} Acc: {:.4f}'.format(
                phase, epoch_loss, epoch_acc))

            # deep copy the model
            if phase == 'val' and epoch_acc > best_acc:
                best_acc = epoch_acc
                best_model_wts = copy.deepcopy(model.state_dict())

        print()

    time_elapsed = time.time() - since
    print('Training complete in {:.0f}m {:.0f}s'.format(
        time_elapsed // 60, time_elapsed % 60))
    print('Best val Acc: {:4f}'.format(best_acc))

    # load best model weights
    model.load_state_dict(best_model_wts)
    return model

In [18]:
model_ft = models.resnet18(pretrained=True)
num_ftrs = model_ft.fc.in_features
model_ft.fc = nn.Linear(num_ftrs, 257)

model_ft = model_ft.to(device)

criterion = nn.CrossEntropyLoss()

# Observe that all parameters are being optimized
optimizer_ft = optim.SGD(model_ft.parameters(), lr=0.001, momentum=0.9)

# Decay LR by a factor of 0.1 every 7 epochs
exp_lr_scheduler = lr_scheduler.StepLR(optimizer_ft, step_size=7, gamma=0.1)

In [None]:
model_ft = train_model(model_ft, criterion, optimizer_ft, exp_lr_scheduler,
                       num_epochs=25)

Epoch 0/24
----------
train Loss: 5.9067 Acc: 0.0000
val Loss: 6.1062 Acc: 0.0000

Epoch 1/24
----------
train Loss: 5.0108 Acc: 0.0556
val Loss: 6.2048 Acc: 0.0000

Epoch 2/24
----------
train Loss: 4.2073 Acc: 0.2750
val Loss: 6.1418 Acc: 0.0065

Epoch 3/24
----------
train Loss: 3.4258 Acc: 0.5694
val Loss: 6.1064 Acc: 0.0130

Epoch 4/24
----------
train Loss: 2.8197 Acc: 0.7389
val Loss: 6.0895 Acc: 0.0195

Epoch 5/24
----------
train Loss: 2.2322 Acc: 0.8722
val Loss: 6.0049 Acc: 0.0260

Epoch 6/24
----------
train Loss: 1.4890 Acc: 0.9889
val Loss: 5.9779 Acc: 0.0390

Epoch 7/24
----------
train Loss: 1.4344 Acc: 0.9917
val Loss: 5.9729 Acc: 0.0260

Epoch 8/24
----------
train Loss: 1.3681 Acc: 0.9917
val Loss: 5.9562 Acc: 0.0390

Epoch 9/24
----------
train Loss: 1.3260 Acc: 0.9972
val Loss: 5.8993 Acc: 0.0390

Epoch 10/24
----------
train Loss: 1.3049 Acc: 0.9944
val Loss: 5.9288 Acc: 0.0455

Epoch 11/24
----------


In [None]:
savePath = "./output/test_model.pth"
torch.save(model.state_dict(), savePath)