In [1]:
import torch
from torch import nn
from torch import optim
import torch.nn.functional as F
from torchvision import datasets, transforms

In [4]:
train_dir = '../data/train'
test_dir = '../data/test_local'

In [5]:
train_transforms = transforms.Compose([transforms.Resize(32),
                                      transforms.RandomHorizontalFlip(),
                                      transforms.RandomVerticalFlip(),
                                      transforms.RandomRotation(30),
                                      transforms.RandomRotation(60),
                                      transforms.ToTensor(),
                                      transforms.Normalize([0.485, 0.456, 0.406], 
                                                           [0.229, 0.224, 0.225])])
data = datasets.ImageFolder(train_dir, transform=train_transforms)
train_data, val_data = torch.utils.data.random_split(data, [4000, 537])
train_loader = torch.utils.data.DataLoader(train_data, batch_size=64, shuffle=True)
val_loader = torch.utils.data.DataLoader(val_data, batch_size=64, shuffle=True)

test_transforms = transforms.Compose([transforms.Resize(32),
                                     transforms.ToTensor(),
                                     transforms.Normalize([0.485, 0.456, 0.406], 
                                                          [0.229, 0.224, 0.225])])
test_data = datasets.ImageFolder(test_dir, transform=test_transforms)
test_loader = torch.utils.data.DataLoader(test_data, batch_size=64, shuffle=True)

In [4]:
class Net1(nn.Module):
    def __init__(self):
        super(Net1, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 3, 1)
        self.conv2 = nn.Conv2d(32, 64, 2, 1)
        self.conv3 = nn.Conv2d(64, 128, 2, 1)
        self.fc1 = nn.Linear(128*3*3, 1024)
        self.fc2 = nn.Linear(1024, 512)
        self.fc3 = nn.Linear(512, 10)

    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv3(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 128*3*3)
        x = self.fc1(x)
        x = self.fc2(x)
        x = self.fc3(x)
        return F.log_softmax(x, dim=1)

In [5]:
class Net2(nn.Module):
    def __init__(self):
        super(Net2, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 3, 1)
        self.conv2 = nn.Conv2d(32, 64, 2, 1)
        self.conv3 = nn.Conv2d(64, 128, 2, 1)
        self.fc1 = nn.Linear(128*3*3, 1024)
        self.fc2 = nn.Linear(1024, 512)
        self.fc3 = nn.Linear(512, 10)

    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv3(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 128*3*3)
        x = self.fc1(x)
        x - F.dropout(x)
        x = self.fc2(x)
        x - F.dropout(x)
        x = self.fc3(x)
        return F.log_softmax(x, dim=1)

In [6]:
class Net3(nn.Module):
    def __init__(self):
        super(Net3, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 3, 1, 1)
        self.conv2 = nn.Conv2d(32, 64, 3, 1, 1)
        self.conv3 = nn.Conv2d(64, 128, 3, 1, 1)
        
        self.fc1 = nn.Linear(128*4*4, 120)
        self.fc2 = nn.Linear(120, 10)
        
    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv3(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 128*4*4)
        x = self.fc1(x)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)

In [7]:
class Net4(nn.Module):
    def __init__(self):
        super(Net4, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 5, 1)
        self.conv2 = nn.Conv2d(32, 64, 5, 1)
        self.fc1 = nn.Linear(64*5*5, 256)
        self.fc2 = nn.Linear(256, 128)
        self.fc3 = nn.Linear(128, 10)  
        
    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 64*5*5)
        x = self.fc1(x)
        x = self.fc2(x)
        x = self.fc3(x)
        return F.log_softmax(x, dim=1)

In [8]:
class Net5(nn.Module):
    def __init__(self):
        super(Net2, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 3, 1)
        self.conv2 = nn.Conv2d(32, 64, 3, 1)
        self.fc1 = nn.Linear(64*6*6, 128)
        self.fc2 = nn.Linear(128, 10)

    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 64*6*6)
        x = self.fc1(x)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)

In [9]:
class Net6(nn.Module):
    def __init__(self):
        super(Net6, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 5, 1)
        self.conv2 = nn.Conv2d(32, 64, 5, 1)
        self.fc1 = nn.Linear(64*5*5, 120)
        self.fc2 = nn.Linear(120, 10)

    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 64*5*5)
        x = self.fc1(x)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)

In [10]:
class Net7(nn.Module):
    def __init__(self):
        super(Net7, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 5, 1)
        self.conv2 = nn.Conv2d(32, 64, 5, 1)
        self.fc1 = nn.Linear(64*5*5, 120)
        self.fc2 = nn.Linear(120, 10)

    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.avg_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.avg_pool2d(x, 2, 2)
        x = x.view(-1, 64*5*5)
        x = self.fc1(x)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)

In [11]:
class Net8(nn.Module):
    def __init__(self):
        super(Net8, self).__init__()
        # Layers
        self.conv1 = nn.Conv2d(3, 32, 3, 1, 1)
        self.conv2 = nn.Conv2d(32, 64, 3, 1, 1)
        self.conv3 = nn.Conv2d(64, 128, 3, 1, 1)
        
        self.fc1 = nn.Linear(128*4*4, 512)
        self.fc2 = nn.Linear(512, 128)
        self.fc3 = nn.Linear(128, 10)
        
        
    def forward(self, x):
        # define forward propagation here
        x = self.conv1(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv2(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = self.conv3(x)
        x = F.relu(x)
        x = F.max_pool2d(x, 2, 2)
        x = x.view(-1, 128*4*4)
        x = self.fc1(x)
        x = self.fc2(x)
        x = self.fc3(x)
        return F.log_softmax(x, dim=1)

In [12]:
def train(model, device, train_loader, optimizer, epoch):
    model.train()
    for batch_idx, (data, target) in enumerate(train_loader):
        data, target = data.to(device), target.to(device)
        optimizer.zero_grad()
        output = model(data)
        loss = F.nll_loss(output, target)
        loss.backward()
        optimizer.step()
        if batch_idx % 10 == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch+1, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader), loss.item()))

In [13]:
def test(model, device, test_loader):
    model.eval()
    test_loss = 0
    correct = 0
    with torch.no_grad():
        for data, target in test_loader:
            data, target = data.to(device), target.to(device)
            output = model(data)
            test_loss += F.nll_loss(output, target, reduction='sum').item() # sum up batch loss
            pred = output.argmax(dim=1, keepdim=True) # get the index of the max log-probability
            correct += pred.eq(target.view_as(pred)).sum().item()

    test_loss /= len(test_loader.dataset)

    print('\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.0f}%)\n'.format(
        test_loss, correct, len(test_loader.dataset),
        100. * correct / len(test_loader.dataset)))

In [14]:
use_cuda = torch.cuda.is_available()
device = torch.device("cuda" if use_cuda else "cpu")

In [15]:
model = Net6().to(device)
optimizer = optim.Adam(model.parameters(), lr=0.001)
# optimizer = optim.SGD(model.parameters(), lr=0.001, momentum=0.5)
epochs = 30

for epoch in range(epochs-20):
    train(model, device, train_loader, optimizer, epoch)
    test(model, device, val_loader)
optimizer = optim.Adam(model.parameters(), lr=0.0005)
for epoch in range(epochs-20, epochs-10):
    train(model, device, train_loader, optimizer, epoch)
    test(model, device, val_loader)    
optimizer = optim.Adam(model.parameters(), lr=0.0001)
for epoch in range(epochs-10, epochs):
    train(model, device, train_loader, optimizer, epoch)
    test(model, device, val_loader)
torch.save(model.state_dict(),"hw2_v16.pth")


Test set: Average loss: 0.7978, Accuracy: 365/537 (68%)


Test set: Average loss: 0.7120, Accuracy: 389/537 (72%)


Test set: Average loss: 0.6968, Accuracy: 381/537 (71%)


Test set: Average loss: 0.7052, Accuracy: 390/537 (73%)


Test set: Average loss: 0.6918, Accuracy: 392/537 (73%)


Test set: Average loss: 0.6634, Accuracy: 411/537 (77%)


Test set: Average loss: 0.6812, Accuracy: 395/537 (74%)


Test set: Average loss: 0.6449, Accuracy: 397/537 (74%)


Test set: Average loss: 0.6363, Accuracy: 408/537 (76%)


Test set: Average loss: 0.6091, Accuracy: 418/537 (78%)


Test set: Average loss: 0.5940, Accuracy: 411/537 (77%)


Test set: Average loss: 0.6023, Accuracy: 419/537 (78%)


Test set: Average loss: 0.6105, Accuracy: 421/537 (78%)


Test set: Average loss: 0.6309, Accuracy: 405/537 (75%)


Test set: Average loss: 0.6044, Accuracy: 417/537 (78%)


Test set: Average loss: 0.6006, Accuracy: 421/537 (78%)


Test set: Average loss: 0.5785, Accuracy: 424/537 (79%)


Test set: Ave


Test set: Average loss: 0.5665, Accuracy: 422/537 (79%)


Test set: Average loss: 0.5770, Accuracy: 432/537 (80%)


Test set: Average loss: 0.5896, Accuracy: 422/537 (79%)


Test set: Average loss: 0.5701, Accuracy: 427/537 (80%)


Test set: Average loss: 0.5877, Accuracy: 420/537 (78%)


Test set: Average loss: 0.5468, Accuracy: 428/537 (80%)


Test set: Average loss: 0.5320, Accuracy: 434/537 (81%)


Test set: Average loss: 0.5682, Accuracy: 430/537 (80%)


Test set: Average loss: 0.5650, Accuracy: 428/537 (80%)


Test set: Average loss: 0.5610, Accuracy: 432/537 (80%)



In [17]:
test(model, device, test_loader)


Test set: Average loss: 0.4882, Accuracy: 232/272 (85%)

