In [4]:
# [데이터 분할을 위한 폴더 생성]

import os
import shutil

original_dataset_dir = '/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/data/mvtec88'
classes_list = os.listdir(original_dataset_dir)

base_dir = '/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/data/splitted'
os.mkdir(base_dir)

train_dir = os.path.join(base_dir, 'train')
os.mkdir(train_dir)
validation_dir = os.path.join(base_dir, 'val')
os.mkdir(validation_dir)
test_dir = os.path.join(base_dir, 'test')
os.mkdir(test_dir)

# train,validation,test 폴더 하위에 각각 클래스 목록 폴더 생성
for clss in classes_list:
    os.mkdir(os.path.join(train_dir,clss))
    os.mkdir(os.path.join(validation_dir,clss))
    os.mkdir(os.path.join(test_dir,clss))

In [5]:
# [데이터 분할과 클래스별 데이터 수 확인]

import math

for clss in classes_list:
    path = os.path.join(original_dataset_dir,clss)
    fnames = os.listdir(path)
    
    train_size = math.floor(len(fnames)*0.6)
    validation_size = math.floor(len(fnames)*0.2)
    test_size = math.floor(len(fnames)*0.2)
    
    train_fnames = fnames[:train_size]
    print('Train size(',clss,'): ', len(train_fnames))
    for fname in train_fnames:
        src = os.path.join(path, fname)
        dst = os.path.join(os.path.join(train_dir, clss), fname)
        shutil.copyfile(src,dst)
        
    validation_fnames = fnames[train_size:(validation_size + train_size)]
    print('Validation size(',clss,'): ', len(validation_fnames))
    for fname in validation_fnames:
        src = os.path.join(path, fname)
        dst = os.path.join(os.path.join(validation_dir,clss),fname)
        shutil.copyfile(src,dst)
        
    test_fnames = fnames[(train_size+validation_size):(validation_size+train_size+test_size)]
    print('Test size(',clss,'): ', len(test_fnames))
    for fname in test_fnames:
        src = os.path.join(path, fname)
        dst = os.path.join(os.path.join(test_dir, clss),fname)
        shutil.copyfile(src,dst)

Train size( transistor_damaged_case ):  6
Validation size( transistor_damaged_case ):  2
Test size( transistor_damaged_case ):  2
Train size( leather_good ):  166
Validation size( leather_good ):  55
Test size( leather_good ):  55
Train size( tile_gray_stroke ):  9
Validation size( tile_gray_stroke ):  3
Test size( tile_gray_stroke ):  3
Train size( capsule_crack ):  13
Validation size( capsule_crack ):  4
Test size( capsule_crack ):  4
Train size( cable_missing_wire ):  6
Validation size( cable_missing_wire ):  2
Test size( cable_missing_wire ):  2
Train size( grid_bent ):  7
Validation size( grid_bent ):  2
Test size( grid_bent ):  2
Train size( hazelnut_good ):  258
Validation size( hazelnut_good ):  86
Test size( hazelnut_good ):  86
Train size( carpet_thread ):  11
Validation size( carpet_thread ):  3
Test size( carpet_thread ):  3
Train size( transistor_cut_lead ):  6
Validation size( transistor_cut_lead ):  2
Test size( transistor_cut_lead ):  2
Train size( wood_hole ):  6
Valid

In [6]:
# [베이스라인 모델 학습을 위한 준비]

import torch

USE_CUDA = torch.cuda.is_available()
DEVICE = torch.device('cuda' if USE_CUDA else 'cpu')

BATCH_SIZE = 256
EPOCH = 10

import torchvision.transforms as transforms
from torchvision.datasets import ImageFolder

transform_base = transforms.Compose([transforms.Resize((64,64)),transforms.ToTensor()])

train_dataset = ImageFolder(root='/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/data/splitted/train', transform = transform_base)
val_dataset = ImageFolder(root='/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/data/splitted/val', transform = transform_base)


# Dataloader는 이미지 데이터를 미니 배치 단위로 분리하는 역할
from torch.utils.data import DataLoader

train_loader = torch.utils.data.DataLoader(train_dataset, batch_size = BATCH_SIZE, shuffle = True, num_workers = 4)
val_loader = torch.utils.data.DataLoader(val_dataset, batch_size = BATCH_SIZE, shuffle = True, num_workers = 4)

In [7]:
import torchvision.transforms as transforms
from torchvision.datasets import ImageFolder

data_transforms = {
    'train':transforms.Compose([
        transforms.Resize([64,64]),
        transforms.ToTensor(),
        transforms.Normalize([0.485,0.456,0.406],
                             [0.229,0.224,0.225])
    ]),
    'val':transforms.Compose([
        transforms.Resize([64,64]),
        transforms.RandomCrop(52),
        transforms.ToTensor(),
        transforms.Normalize([0.485,0.456,0.406],
                             [0.229,0.224,0.225])
    ])
}

data_dir = '/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/data/splitted'

image_datasets = {x: ImageFolder(root=os.path.join(data_dir,x),
                                 transform=data_transforms[x]) for x in ['train','val']}
dataloaders = {x: torch.utils.data.DataLoader(image_datasets[x], batch_size = BATCH_SIZE, shuffle=True, num_workers = 4) for x in ['train','val']}
dataset_sizes = {x: len(image_datasets[x]) for x in ['train', 'val']}
class_names = image_datasets['train'].classes

In [8]:
# [Pre-Trained Model 불러오기]

from torchvision import models
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim
from torch.optim import lr_scheduler

resnet = models.resnet50(pretrained=True)
# 이 프로젝트에선 33개로 분류해야함. 마지막 Layer 출력 채널 수는 33개여야함.
# 하지만 ResNet의 마지막 Layer 출력 채널 수가 33개가 아님. 이 프로젝트의 주제에 맞추고자 모델의 마지막 Fully Connected Layer 대신 출력 채널의 수가 33개인 새로운 Layer를 추가할 예정
# in_features : 해당 Layer의 입력 채널 수
num_ftrs = resnet.fc.in_features
# 불러온 모델의 마지막 Fully Connected Layer를 새로운 Layer로 교체. 입력 채널의 수는 기존 Layer와 동일하고, 출력 채널 수는 33개로 수정
resnet.fc = nn.Linear(num_ftrs, 88)
resnet = resnet.to(DEVICE)

criterion = nn.CrossEntropyLoss()

# Transfer Learning에선 일부 Layer의 Parameter만을 업데이트 해야하기 때문에 requires_grad = True로 설정된 Layer의 Parameter에만 적용
optimizer_ft = optim.Adam(filter(lambda p:p.requires_grad, resnet.parameters()), lr = 0.001)

# StepLR() 메서드는 Epoch에 따라 Learning Rate를 변경하는 역할
exp_lr_scheduler = lr_scheduler.StepLR(optimizer_ft, step_size=7, gamma=0.1)

In [9]:
# [Pre-Trained Model 일부 Layer Freeze 하기]

ct = 0 # 해당 Layer가 몇 번째인지
for child in resnet.children(): # resnet.children()은 생성한 resnet모델의 모든 Layer 정보를 담고 있음
    ct += 1 # 다음 Layer를 지칭하도록 ct변수를 1씩 증가
    if ct < 6: # 1~5번 Layer는 업데이트 되지 않도록 고정. 6~10번 Layer는 업데이트
        for param in child.parameters():
            param.requires_grad = False

In [10]:
# [Transfer Learning 모델 학습과 검증을 위한 함수]

import time
import copy

def train_resnet(model, criterion, optimizer, scheduler, num_epochs=25):

    best_model_wts = copy.deepcopy(model.state_dict())  
    best_acc = 0.0  
    
    for epoch in range(num_epochs):
        print('-------------- epoch {} ----------------'.format(epoch+1)) 
        since = time.time()                                     
        for phase in ['train', 'val']: 
            if phase == 'train': 
                model.train()  # 학습 모드
            else:
                model.eval() # 검증 모드
 
            running_loss = 0.0  
            running_corrects = 0  
 
            
            for inputs, labels in dataloaders[phase]: 
                inputs = inputs.to(DEVICE)  
                labels = labels.to(DEVICE)  
                
                optimizer.zero_grad() 
                
                with torch.set_grad_enabled(phase == 'train'): # 학습 단계에서만 모델 Gradient 업데이트, 검증 단계에서는 X
                    outputs = model(inputs)  
                    _, preds = torch.max(outputs, 1) 
                    loss = criterion(outputs, labels)  
    
                    if phase == 'train':   
                        loss.backward()
                        optimizer.step()
 
                running_loss += loss.item() * inputs.size(0)  
                running_corrects += torch.sum(preds == labels.data)  
            if phase == 'train':  
                scheduler.step()
 
            epoch_loss = running_loss/dataset_sizes[phase]  
            epoch_acc = running_corrects.double()/dataset_sizes[phase]  
 
            print('{} Loss: {:.4f} Acc: {:.4f}'.format(phase, epoch_loss, epoch_acc)) 
 
          
            if phase == 'val' and epoch_acc > best_acc: 
                best_acc = epoch_acc
                best_model_wts = copy.deepcopy(model.state_dict())
 
        time_elapsed = time.time() - since  
        print('Completed in {:.0f}m {:.0f}s'.format(time_elapsed // 60, time_elapsed % 60))
    print('Best val Acc: {:4f}'.format(best_acc))
 
    model.load_state_dict(best_model_wts) 

    return model

In [11]:
model_resnet50 = train_resnet(resnet, criterion, optimizer_ft, exp_lr_scheduler, num_epochs=EPOCH) 

torch.save(model_resnet50, 'resnet50.pt')

-------------- epoch 1 ----------------
train Loss: 1.8674 Acc: 0.6787
val Loss: 11.2719 Acc: 0.3057
Completed in 0m 19s
-------------- epoch 2 ----------------
train Loss: 0.8994 Acc: 0.7778
val Loss: 1.3693 Acc: 0.7068
Completed in 0m 19s
-------------- epoch 3 ----------------
train Loss: 0.7688 Acc: 0.7829
val Loss: 1.7216 Acc: 0.5959
Completed in 0m 19s
-------------- epoch 4 ----------------
train Loss: 0.7185 Acc: 0.7923
val Loss: 1.6992 Acc: 0.5815
Completed in 0m 19s
-------------- epoch 5 ----------------
train Loss: 0.6275 Acc: 0.8062
val Loss: 2.0445 Acc: 0.4793
Completed in 0m 20s
-------------- epoch 6 ----------------
train Loss: 0.6472 Acc: 0.8014
val Loss: 1.7346 Acc: 0.5362
Completed in 0m 19s
-------------- epoch 7 ----------------
train Loss: 0.5779 Acc: 0.8153
val Loss: 1.5689 Acc: 0.4995
Completed in 0m 20s
-------------- epoch 8 ----------------
train Loss: 0.4959 Acc: 0.8361
val Loss: 1.5753 Acc: 0.4879
Completed in 0m 19s
-------------- epoch 9 ----------------

In [16]:
# [Transfer Learning모델 평가를 위한 전처리]

transform_resNet = transforms.Compose([
        transforms.Resize([224,224]),    
        transforms.ToTensor(),
        transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]) 
    ])
    
test_resNet = ImageFolder(root='/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/data/splitted/test', transform=transform_resNet) 
test_loader_resNet = torch.utils.data.DataLoader(test_resNet, batch_size=BATCH_SIZE, shuffle=True, num_workers=4)

In [17]:
# [모델 평가를 위한 함수]

def evaluate(model, test_loader):
    model.eval()
    test_loss = 0
    correct = 0
    
    with torch.no_grad(): # torch.no_grad() : Parameter 업데이트 중단
        for data, target in test_loader:
            data, target = data.to(DEVICE), target.to(DEVICE)
            output = model(data)
            
            test_loss += F.cross_entropy(output, target, reduction = 'sum').item()
            
            pred = output.max(1, keepdim=True)[1] # Test 데이터가 33개의 클래스에 속할 각각의 확률값이 output으로 출력. 가장 높은 가진 인덱스를 예측값으로 저장
            correct += pred.eq(target.view_as(pred)).sum().item() # pred와 target.view_as(pred)가 일치하면 1, 일치하지 않으면 0 반환
            
    test_loss /= len(test_loader.dataset)
    test_accuracy = 100. * correct / len(test_loader.dataset)
    return test_loss, test_accuracy

In [18]:
# [Transfer Learning 모델 성능 평가하기]

resnet50=torch.load('/home/iai/Desktop/Jeewon/Study/Conference/Active_Learning/resnet50.pt') 
resnet50.eval()  
test_loss, test_accuracy = evaluate(resnet50, test_loader_resNet)

print('ResNet test acc:  ', test_accuracy)

ResNet test acc:   15.911282545805207
