In [1]:
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [3]:
!unzip -qq '/content/drive/MyDrive/Colab Notebooks/Deep Learning 프로젝트/dataset.zip' -d './dataset'

In [4]:
import os

original_dataset_dir = './dataset'
classes_list = os.listdir(original_dataset_dir)

base_dir = './splitted'
os.mkdir(base_dir)

In [5]:
import shutil

train_dir = os.path.join(base_dir,'train')
os.mkdir(train_dir)
validation_dir = os.path.join(base_dir,'val')
os.mkdir(validation_dir)
test_dir = os.path.join(base_dir,'test')
os.mkdir(test_dir)

for cls in classes_list:
    os.mkdir(os.path.join(train_dir,cls))
    os.mkdir(os.path.join(validation_dir,cls))
    os.mkdir(os.path.join(test_dir,cls))

In [6]:
import math

for cls in classes_list:
    path = os.path.join(original_dataset_dir, cls)
    fnames = os.listdir(path)
    
    train_size = math.floor(len(fnames) * 0.6)
    validation_size = math.floor(len(fnames) * 0.2)
    test_size = math.floor(len(fnames) * 0.2)
    
    train_fnames = fnames[:train_size]
    print("Train size(",cls,"): ", len(train_fnames))
    for fname in train_fnames:
        src = os.path.join(path, fname)
        dst = os.path.join(os.path.join(train_dir,cls), fname)
        shutil.copyfile(src, dst)
        
    validation_fnames = fnames[train_size:(validation_size + train_size)]
    print("Validation size(",cls,"): ", len(validation_fnames))
    for fname in validation_fnames:
        src = os.path.join(path, fname)
        dst = os.path.join(os.path.join(validation_dir,cls), fname)
        shutil.copyfile(src, dst)
        
    test_fnames = fnames[(train_size+validation_size): (validation_size+train_size+test_size)]
    print("Test size(",cls,"): ", len(test_fnames))
    for fname in test_fnames:
        src = os.path.join(path, fname)
        dst = os.path.join(os.path.join(test_dir,cls), fname)
        shutil.copyfile(src, dst)

Train size( Corn___Cercospora_leaf_spot Gray_leaf_spot ):  307
Validation size( Corn___Cercospora_leaf_spot Gray_leaf_spot ):  102
Test size( Corn___Cercospora_leaf_spot Gray_leaf_spot ):  102
Train size( Tomato___Septoria_leaf_spot ):  1062
Validation size( Tomato___Septoria_leaf_spot ):  354
Test size( Tomato___Septoria_leaf_spot ):  354
Train size( Peach___healthy ):  216
Validation size( Peach___healthy ):  72
Test size( Peach___healthy ):  72
Train size( Tomato___Leaf_Mold ):  571
Validation size( Tomato___Leaf_Mold ):  190
Test size( Tomato___Leaf_Mold ):  190
Train size( Potato___Early_blight ):  600
Validation size( Potato___Early_blight ):  200
Test size( Potato___Early_blight ):  200
Train size( Tomato___Bacterial_spot ):  1276
Validation size( Tomato___Bacterial_spot ):  425
Test size( Tomato___Bacterial_spot ):  425
Train size( Peach___Bacterial_spot ):  1378
Validation size( Peach___Bacterial_spot ):  459
Test size( Peach___Bacterial_spot ):  459
Train size( Tomato___Tomat

In [7]:
import torch
import os

USE_CUDA = torch.cuda.is_available()
DEVICE = torch.device('cuda' if USE_CUDA else 'cpu')
BATCH_SIZE = 256
EPOCH = 30

In [8]:
import torchvision.transforms as transforms
from torchvision.datasets import ImageFolder

transform_base = transforms.Compose([transforms.Resize((64,64)), transforms.ToTensor()])
train_dataset = ImageFolder(root = './splitted/train', transform=transform_base)
val_dataset = ImageFolder(root = './splitted/val', transform=transform_base)

In [9]:
from torch.utils.data import DataLoader

train_loader = torch.utils.data.DataLoader(train_dataset,
                                          batch_size = BATCH_SIZE,
                                          shuffle = True,
                                          num_workers=4)
val_loader = torch.utils.data.DataLoader(val_dataset,
                                          batch_size = BATCH_SIZE,
                                          shuffle = True,
                                          num_workers=4)



In [10]:
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

class Net(nn.Module):
    
    def __init__(self):
        
        super(Net, self).__init__()
        
        self.conv1 = nn.Conv2d(3, 32, 3, padding=1)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(32, 64, 3, padding=1)
        self.conv3 = nn.Conv2d(64, 64, 3, padding=1)
        
        self.fc1 = nn.Linear(4096, 512)
        self.fc2 = nn.Linear(512, 33)
        
    def forward(self, x):
        
        x = self.conv1(x)
        x = F.relu(x)
        x = self.pool(x)
        x = F.dropout(x, p=0.25, training=self.training)
        
        x = self.conv2(x)
        x = F.relu(x)
        x = self.pool(x)
        x = F.dropout(x, p=0.25, training=self.training)
        
        x = self.conv3(x)
        x = F.relu(x)
        x = self.pool(x)
        x = F.dropout(x, p=0.25, training=self.training)
        
        x = x.view(-1, 4096)
        x = self.fc1(x)
        x = F.relu(x)
        x = F.dropout(x, p=0.25, training=self.training)
        x = self.fc2(x)
        
        return F.log_softmax(x, dim=1)

In [11]:
model_base = Net().to(DEVICE)
optimizer = optim.Adam(model_base.parameters(), lr=0.001)

In [12]:
def train(model, train_loader, optimizer):
  model.train()
  for batch_idx, (data, target) in enumerate(train_loader):
    data, target = data.to(DEVICE), target.to(DEVICE)
    optimizer.zero_grad()
    output = model(data)
    loss = F.cross_entropy(output, target)
    loss.backward()
    optimizer.step()

In [16]:
def evaluate(model, test_loader):
  model.eval()
  test_loss = 0
  correct = 0

  with torch.no_grad():
    for data, target in test_loader:
      data, target = data.to(DEVICE), target.to(DEVICE)
      output = model(data)

      test_loss += F.cross_entropy(output, target, reduction='sum').item()

      pred = output.max(1, keepdim=True)[1]
      correct += pred.eq(target.view_as(pred)).sum().item()

  test_loss /= len(test_loader.dataset)
  test_accuracy = 100. * correct / len(test_loader.dataset)
  return test_loss, test_accuracy

In [19]:
import time
import copy

def train_baseline(model, train_loader, val_loader, optimizer, num_epochs = 30):
  bast_acc =0.0
  best_model_wts = copy.deepcopy(model.state_dict())

  for epoch in range(1, num_epochs + 1):
    since = time.time()
    train(model, train_loader, optimizer)
    train_loss, train_acc = evaluate(model, train_loader)
    val_loss, val_acc = evaluate(model, val_loader)

    if val_acc > bast_acc:
      best_acc = val_acc
      best_model_wts = copy.deepcopy(model.state_dict())

    time_elapsed = time.time() - since
    print('---------------epoch {} -------------------'.format(epoch))
    print('train Loss: {:.4f}, Accuracy: {:.2f}%'.format(train_loss, train_acc))
    print('val Loss: {:.4f}, Accuracy: {:.2f}%'.format(val_loss, val_acc))
    print('Completed in {:.0f}m {:.0f}s'.format(time_elapsed // 60, time_elapsed % 60))
  model.load_state_dict(best_model_wts)
  return model

base = train_baseline(model_base, train_loader, val_loader, optimizer, EPOCH)
torch.save(base,'baseline.pt')

---------------epoch 1 -------------------
train Loss: 0.1549, Accuracy: 95.21%
val Loss: 0.2884, Accuracy: 90.64%
Completed in 1m 40s
---------------epoch 2 -------------------
train Loss: 0.1205, Accuracy: 96.67%
val Loss: 0.2473, Accuracy: 92.08%
Completed in 1m 37s
---------------epoch 3 -------------------
train Loss: 0.1114, Accuracy: 96.88%
val Loss: 0.2327, Accuracy: 92.23%
Completed in 1m 40s
---------------epoch 4 -------------------
train Loss: 0.0924, Accuracy: 97.58%
val Loss: 0.2302, Accuracy: 92.58%
Completed in 1m 38s
---------------epoch 5 -------------------
train Loss: 0.1050, Accuracy: 96.86%
val Loss: 0.2584, Accuracy: 91.60%
Completed in 1m 39s
---------------epoch 6 -------------------
train Loss: 0.0833, Accuracy: 97.62%
val Loss: 0.2269, Accuracy: 92.04%
Completed in 1m 37s
---------------epoch 7 -------------------
train Loss: 0.0667, Accuracy: 98.21%
val Loss: 0.2082, Accuracy: 93.19%
Completed in 1m 39s
---------------epoch 8 -------------------
train Loss: 

In [20]:
data_transforms = {
    'train' : transforms.Compose([transforms.Resize([64, 64]),
          transforms.RandomHorizontalFlip(), transforms.RandomVerticalFlip(),
          transforms.RandomCrop(52), transforms.ToTensor(),
          transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]) ]),
    
    'val' : transforms.Compose([transforms.Resize([64, 64]),
          transforms.RandomCrop(52), transforms.ToTensor(),
          transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]) ])
}

In [23]:
data_dir = './splitted'
image_datasets = {x: ImageFolder(root = os.path.join(data_dir,x),
                                 transform = data_transforms[x]) for x in ['train', 'val']}
dataloaders = {x: torch.utils.data.DataLoader(image_datasets[x],
                                              batch_size = BATCH_SIZE,
                                              shuffle = True,
                                              num_workers = 4) for x in ['train', 'val']}
dataset_sizes = {x: len(image_datasets[x]) for x in ['train', 'val']}

class_names = image_datasets['train'].classes



In [26]:
from torchvision import models

resnet = models.resnet50(pretrained=True)
num_ftrs = resnet.fc.in_features
resnet.fc = nn.Linear(num_ftrs, 33)
resnet = resnet.to(DEVICE)

criterion = nn.CrossEntropyLoss()
optimizer_ft = optim.Adam(filter(lambda p: p.requires_grad, resnet.parameters()),lr=0.001)

from torch.optim import lr_scheduler
exp_lr_scheduler = lr_scheduler.StepLR(optimizer_ft, step_size=7, gamma=0.1)

In [27]:
ct = 0
for child in resnet.children():
  ct += 1
  if ct < 6:
    for param in child.parameters():
      param.requires_grad = False

In [30]:
def train_resnet(model,criterion, optimizer, scheduler, num_epochs=25):

  best_model_wts = copy.deepcopy(model.state_dict())
  best_acc = 0.0

  for epoch in range(num_epochs):
    print('---------------- epoch {} -----------------'.format(epoch+1))
    since = time.time()
    for phase in ['train','val']:
      if phase == 'train':
        model.train()
      else:
        model.eval()

      running_loss = 0.0
      running_corrects = 0

      for inputs, labels in dataloaders[phase]:
        inputs = inputs.to(DEVICE)
        labels = labels.to(DEVICE)

        optimizer.zero_grad()

        with torch.set_grad_enabled(phase == 'train'):
          outputs = model(inputs)
          _, preds = torch.max(outputs, 1)
          loss = criterion(outputs, labels)

          if phase == 'train':
            loss.backward()
            optimizer.step()

        running_loss += loss.item() * inputs.size(0)
        running_corrects += torch.sum(preds == labels.data)
      if phase == 'train':
        scheduler.step()

      epoch_loss = running_loss / dataset_sizes[phase]
      epoch_acc = running_corrects.double() / dataset_sizes[phase]

      print('{} Loss: {:.4f} Acc: {:.4f}'.format(phase, epoch_loss, epoch_acc))

      if phase == 'val' and epoch_acc > best_acc:
        best_acc = epoch_acc
        best_model_wts = copy.deepcopy(model.state_dict())
    
    time_elapsed = time.time() - since
    print('Completed in {:.0f}m {:.0f}s'.format(time_elapsed // 60, time_elapsed % 60))
  print('Best val Acc: {:.4f}'.format(best_acc))

  model.load_state_dict(best_model_wts)

  return model

In [31]:
model_resnet50 = train_resnet(resnet, criterion, optimizer_ft,
                              exp_lr_scheduler, num_epochs=EPOCH)

torch.save(model_resnet50, 'resnet50.pt')

---------------- epoch 1 -----------------




train Loss: 0.2247 Acc: 0.9277
val Loss: 0.2141 Acc: 0.9278
Completed in 1m 19s
---------------- epoch 2 -----------------
train Loss: 0.1611 Acc: 0.9479
val Loss: 0.2317 Acc: 0.9308
Completed in 1m 8s
---------------- epoch 3 -----------------
train Loss: 0.1239 Acc: 0.9576
val Loss: 0.1073 Acc: 0.9650
Completed in 1m 11s
---------------- epoch 4 -----------------
train Loss: 0.1089 Acc: 0.9635
val Loss: 0.1397 Acc: 0.9521
Completed in 1m 9s
---------------- epoch 5 -----------------
train Loss: 0.1154 Acc: 0.9615
val Loss: 0.1513 Acc: 0.9578
Completed in 1m 7s
---------------- epoch 6 -----------------
train Loss: 0.0918 Acc: 0.9711
val Loss: 0.1115 Acc: 0.9638
Completed in 1m 10s
---------------- epoch 7 -----------------
train Loss: 0.0438 Acc: 0.9856
val Loss: 0.0530 Acc: 0.9840
Completed in 1m 8s
---------------- epoch 8 -----------------
train Loss: 0.0287 Acc: 0.9907
val Loss: 0.0429 Acc: 0.9877
Completed in 1m 11s
---------------- epoch 9 -----------------
train Loss: 0.0238 A

In [33]:
transform_resNet = transforms.Compose([
    transforms.Resize([64, 64]),
    transforms.RandomCrop(52),
    transforms.ToTensor(),
    transforms.Normalize([0.485, 0.456, 0.406] , [0.229, 0.224, 0.225])
])

test_resNet = ImageFolder(root = './splitted/test', transform = transform_resNet)
test_loader_resNet = torch.utils.data.DataLoader(test_resNet,
                                                 batch_size = BATCH_SIZE,
                                                 shuffle = True,
                                                 num_workers=4)




In [34]:
resnet50 = torch.load('resnet50.pt')
resnet50.eval()
test_loss, test_accuracy = evaluate(resnet50, test_loader_resNet)

print('ResNet test acc: ', test_accuracy)

ResNet test acc:  98.99862310677182
