<a href="https://colab.research.google.com/github/Aleesia/2020-knu-df/blob/master/Untitled0.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [0]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision
import torchvision.transforms as transforms
import time

rgb_mean = (0.4914, 0.4822, 0.4465)
rgb_std = (0.2023, 0.1994, 0.2010)
transform = transforms.Compose([transforms.ToTensor(), transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])
transform_train = transforms.Compose([
    transforms.RandomCrop(32, padding=4),
    transforms.RandomHorizontalFlip(),
    transforms.ToTensor(),
    transforms.Normalize(rgb_mean, rgb_std),
])

trainset = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform_train)
train_loader = torch.utils.data.DataLoader(trainset, batch_size=128, shuffle=True, num_workers=0)
testset = torchvision.datasets.CIFAR10(root='./data', train=False, download=True, transform=transform)
test_loader = torch.utils.data.DataLoader(testset, batch_size=1000, shuffle=False, num_workers=0)

classes = ('plane', 'car', 'bird', 'cat', 'deer', 'dog', 'frog', 'horse', 'ship', 'truck')

class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv1 = nn.Conv2d(3, 36, 3, padding=1)
        self.bnm1 = nn.BatchNorm2d(36)
        self.conv2 = nn.Conv2d(36, 180, 3, padding=1)
        self.bnm2 = nn.BatchNorm2d(180)
        self.conv3 = nn.Conv2d(180, 720, 3, padding=1)
        self.bnm3 = nn.BatchNorm2d(720)
        self.conv4 = nn.Conv2d(720, 3600, 3)
        self.bnm4 = nn.BatchNorm2d(3600)
        self.fc1 = nn.Linear(9*3600, 6000)
        self.fc2 = nn.Linear(6000, 620)
        self.fc3 = nn.Linear(620, 84)
        self.fc4 = nn.Linear(84, 10)

    def forward(self, x):
        x = F.relu(self.conv1(x))
        x = F.max_pool2d(x, 2, 2)
        x = self.bnm1(x)
        x = F.relu(self.conv2(x))
        #x = F.max_pool2d(x, 2, 2)
        x = self.bnm2(x)
        x = F.relu(self.conv3(x))
        x = F.max_pool2d(x, 2, 2)
        x = self.bnm3(x)
        x = F.relu(self.conv4(x))
        x = F.max_pool2d(x, 2, 2)
        x = self.bnm4(x)
        x = x.view(-1, 9*3600)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        x = F.relu(self.fc3(x))
        x = self.fc4(x)
        return F.log_softmax(x, dim=1)


import torch.optim as optim

lr=0.04
momentum = 0.5
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

model = Net().to(device)
print(model)

def train(model, device, train_loader, optimizer, epoch,log_interval):
    model.train()
    avg_loss = 0
    for batch_idx, (data, target) in enumerate(train_loader):
        data, target = data.to(device), target.to(device)
        optimizer.zero_grad() # zero the gradient buffers
        output = model(data)
        loss = F.nll_loss(output, target)
        loss.backward()
        optimizer.step() # Does the update
        avg_loss+=F.nll_loss(output, target, reduction='sum').item()
        
        if batch_idx % log_interval == 0:
          print('Train Epoch: {} [{:5.0f}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
              epoch, batch_idx * len(data), len(train_loader.dataset),
              100. * batch_idx / len(train_loader), loss.item()))
    avg_loss/=len(train_loader.dataset)
    return avg_loss

def test(model, device, test_loader):
    model.eval()
    test_loss = 0
    correct = 0
    with torch.no_grad():
        for data, target in test_loader:
            data, target = data.to(device), target.to(device)
            output = model(data)
            test_loss += F.nll_loss(output, target, reduction='sum').item() # sum up batch loss
            pred = output.argmax(dim=1, keepdim=True) # get the index of the max log-probability
            correct += pred.eq(target.view_as(pred)).sum().item()

    test_loss /= len(test_loader.dataset)

    print('\nTest set: Average loss: {:.4f}, Accuracy: {}/{} ({:.1f}%)\n'.format(
        test_loss, correct, len(test_loader.dataset),
        100. * correct / len(test_loader.dataset)))
    accuracy = 100. * correct / len(test_loader.dataset)
    return test_loss,accuracy

epochs = 3
log_interval = 200
save_model = False

train_losses = []
test_losses = []
accuracy_list = []
optimizer = optim.SGD(model.parameters(), lr=lr, momentum=momentum)

#optimizer = optim.Adam(model.parameters(), 0.00001)
for epoch in range(1, epochs + 1):
    #optimizer = optim.Adam(model.parameters(), 0.001)
    trn_loss = train(model, device, train_loader, optimizer, epoch,log_interval)
    test_loss,accuracy = test(model, device, test_loader)
    train_losses.append(trn_loss)
    test_losses.append(test_loss)
    accuracy_list.append(accuracy)

if (save_model):
    torch.save(model.state_dict(),"CIFAR_cnn.pt")

Files already downloaded and verified
Files already downloaded and verified
Net(
  (conv1): Conv2d(3, 36, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (bnm1): BatchNorm2d(36, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (conv2): Conv2d(36, 180, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (bnm2): BatchNorm2d(180, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (conv3): Conv2d(180, 720, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (bnm3): BatchNorm2d(720, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (conv4): Conv2d(720, 3600, kernel_size=(3, 3), stride=(1, 1))
  (bnm4): BatchNorm2d(3600, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc1): Linear(in_features=32400, out_features=6000, bias=True)
  (fc2): Linear(in_features=6000, out_features=620, bias=True)
  (fc3): Linear(in_features=620, out_features=84, bias=True)
  (fc4): Linear(in_features=84, out_features=10, bias=True)
)


In [47]:
#lr=0.15
for epoch in range(4, 10):
    #lr=lr*0.9
    #optimizer = optim.SGD(model.parameters(), lr=lr, momentum=momentum)
    optimizer = optim.Adam(model.parameters(), 0.000001)
    trn_loss = train(model, device, train_loader, optimizer, epoch,log_interval)
    test_loss,accuracy = test(model, device, test_loader)
    train_losses.append(trn_loss)
    test_losses.append(test_loss)
    accuracy_list.append(accuracy)


Test set: Average loss: 2.2971, Accuracy: 3398/10000 (34.0%)


Test set: Average loss: 2.3111, Accuracy: 3284/10000 (32.8%)


Test set: Average loss: 2.2673, Accuracy: 3576/10000 (35.8%)


Test set: Average loss: 2.2580, Accuracy: 3421/10000 (34.2%)



KeyboardInterrupt: ignored

In [0]:
for epoch in range(10, 30):
    lr = lr*15/16
    optimizer = optim.SGD(model.parameters(), lr=lr, momentum=momentum)
    trn_loss = train(model, device, train_loader, optimizer, epoch,log_interval)
    test_loss,accuracy = test(model, device, test_loader)
    train_losses.append(trn_loss)
    test_losses.append(test_loss)
    accuracy_list.append(accuracy)

In [0]:
 """----------------Calculate accuracy, precision, recall, confusion matrix----------------------"""
class_correct = list(0. for i in range(10))
class_total = list(0. for i in range(10))
y_true = []
y_pred = []
with torch.no_grad():
    for data in test_loader:
        images, labels = data
        images = images.to(device)
        labels = labels.to(device)
        outputs = model(images)
        _, predicted = torch.max(outputs, 1)
        c = (predicted == labels).squeeze()
        for i in range(1000):
            label = labels[i]
            y_true.append(classes[labels[i]])
            y_pred.append(classes[predicted[i]])
            class_correct[label] += c[i].item()
            class_total[label] += 1


import sklearn.metrics as metr
mtrx = metr.confusion_matrix(y_true, y_pred, labels=classes)
print("Confusion matrix: \n", mtrx)

precisions = [0,0,0,0,0,0,0,0,0,0]
recalls = [0,0,0,0,0,0,0,0,0,0]
f1_scores = [0,0,0,0,0,0,0,0,0,0]
for i in range(10):
    suma_row=0
    suma_column=0
    for j in range(10):
        suma_row += mtrx[i][j]
        suma_column += mtrx[j][i]
    precisions[i] = mtrx[i][i]/(suma_row)*100
    recalls[i] = mtrx[i][i]/(suma_column)*100
    f1_scores[i] = 2 * (precisions[i] * recalls[i])/(precisions[i] + recalls[i])
    print('Accuracy of %5s : %2d %%  Precision: %4s %%  Recall: %4d %%  F1-score: %4s %%' % (classes[i], 100 * class_correct[i] / class_total[i], precisions[i], recalls[i], f1_scores[i]))
