# Linear Classification

In [57]:
import torch
from torch.autograd import Variable
import torch.nn.functional as F
import matplotlib.pyplot as plt
from data_utils import load_CIFAR10
import numpy as np
import torch.utils.data as utils
import time
%matplotlib inline

# Seed every random number generator this notebook draws from so that runs are
# repeatable.  NumPy is seeded as well because the dev split is sampled with
# np.random.choice; the torch call stays last so the cell still displays the
# torch Generator object.
np.random.seed(1)
torch.manual_seed(1)    # reproducible

<torch._C.Generator at 0x1118602d0>

In [58]:
def get_CIFAR10_data(num_training=49000, num_validation=1000, num_test=1000, num_dev=500):
    """
    Read CIFAR-10 from disk and preprocess it into flat feature rows.

    The first ``num_training`` training images become the training split, the
    following ``num_validation`` images the validation split, and the first
    ``num_test`` test images the test split.  ``num_dev`` examples are drawn
    without replacement from the training split to form a small development
    split.  Each image is flattened into a single row, the per-feature mean
    of the training split is subtracted from every split, and a column of
    ones is appended to every feature matrix.

    Returns:
        X_train, y_train, X_val, y_val, X_test, y_test, X_dev, y_dev
    """
    raw_train_X, raw_train_y, raw_test_X, raw_test_y = load_CIFAR10(
        '../datasets/cifar-10-batches-py')

    # Carve the splits out of the raw arrays with explicit index arrays.
    val_idx = np.arange(num_training, num_training + num_validation)
    train_idx = np.arange(num_training)
    test_idx = np.arange(num_test)
    X_val, y_val = raw_train_X[val_idx], raw_train_y[val_idx]
    X_train, y_train = raw_train_X[train_idx], raw_train_y[train_idx]
    X_test, y_test = raw_test_X[test_idx], raw_test_y[test_idx]

    # The dev split is a random subset of the (already trimmed) training split.
    dev_idx = np.random.choice(num_training, num_dev, replace=False)
    X_dev, y_dev = X_train[dev_idx], y_train[dev_idx]

    # Flatten every image into one row per example.
    X_train, X_val, X_test, X_dev = (
        np.reshape(images, (images.shape[0], -1))
        for images in (X_train, X_val, X_test, X_dev)
    )

    # Centre all splits on the training mean; the mean is computed once,
    # before the training split itself is modified in place.
    mean_image = np.mean(X_train, axis=0)
    for features in (X_train, X_val, X_test, X_dev):
        features -= mean_image

    def _with_bias(rows):
        # Append a constant-1 column to the feature matrix.
        return np.hstack([rows, np.ones((rows.shape[0], 1))])

    return (
        _with_bias(X_train), y_train,
        _with_bias(X_val), y_val,
        _with_bias(X_test), y_test,
        _with_bias(X_dev), y_dev,
    )


# Load the preprocessed splits, report the shape of each array, then convert
# the training split to torch tensors.
X_train, y_train, X_val, y_val, X_test, y_test, X_dev, y_dev = get_CIFAR10_data()
for _caption, _array in (
    ('Train data shape: ', X_train),
    ('Train labels shape: ', y_train),
    ('Validation data shape: ', X_val),
    ('Validation labels shape: ', y_val),
    ('Test data shape: ', X_test),
    ('Test labels shape: ', y_test),
    ('dev data shape: ', X_dev),
    ('dev labels shape: ', y_dev),
):
    print(_caption, _array.shape)

# Features become float32 tensors and labels int64 tensors.
X_train = torch.from_numpy(X_train).float()
y_train = torch.from_numpy(y_train).long()

def variable_collate(batch):
    """Collate a list of (input, label) pairs into two stacked Variables.

       Args:
         batch: (list) of 2-item (input, label) pairs; both items are passed
                to torch.stack, so they are expected to be Tensors already
       Output:
         minibatch: (Variable) inputs stacked along a new leading dimension
         targets: (Variable) labels stacked along a new leading dimension
    """
    # Transpose the list of pairs into one tuple of inputs and one of labels.
    inputs, labels = zip(*batch)
    stacked_inputs = torch.stack(inputs, dim=0)
    stacked_labels = torch.stack(labels, dim=0)
    return Variable(stacked_inputs), Variable(stacked_labels)

Train data shape:  (49000, 3073)
Train labels shape:  (49000,)
Validation data shape:  (1000, 3073)
Validation labels shape:  (1000,)
Test data shape:  (1000, 3073)
Test labels shape:  (1000,)
dev data shape:  (500, 3073)
dev labels shape:  (500,)


In [59]:
class Net(torch.nn.Module):
    """Fully connected network: one ReLU hidden layer followed by a linear output layer.

    Args:
        n_feature: size of each input row
        n_hidden: number of hidden units
        n_output: number of output scores per input row
    """

    def __init__(self, n_feature, n_hidden, n_output):
        super().__init__()
        # Attribute names double as parameter-name prefixes ("hidden.*", "out.*").
        self.hidden = torch.nn.Linear(n_feature, n_hidden)
        self.out = torch.nn.Linear(n_hidden, n_output)

    def forward(self, x):
        """Return the raw (un-normalised) output scores for input ``x``."""
        hidden_activation = F.relu(self.hidden(x))
        return self.out(hidden_activation)

In [60]:
# Build the classifier: 3073 input features per row, 1024 hidden units and
# 10 output scores.
net = Net(n_feature=3073, n_hidden=1024, n_output=10)
print(net)  # show the layer structure

# Loss: CrossEntropyLoss works on raw scores (softmax is computed internally)
# and takes integer class indices as targets, NOT one-hot vectors.
loss_func = torch.nn.CrossEntropyLoss()

# Optimizer: plain SGD over every parameter of the network.
# NOTE(review): the accuracies recorded in this notebook's output stay around
# 0.10; the inputs are mean-centred but not rescaled, so lr=0.02 may be too
# large for them -- confirm before relying on these settings.
optimizer = torch.optim.SGD(net.parameters(), lr=0.02)

Net(
  (hidden): Linear(in_features=3073, out_features=1024, bias=True)
  (out): Linear(in_features=1024, out_features=10, bias=True)
)


In [33]:
plt.ion()   # switch matplotlib to interactive mode

In [73]:
# Earlier full-batch training loop, disabled by wrapping it in a string
# literal; nothing inside the quotes is executed.
# NOTE(review): if this is ever revived, its accuracy divides by a hard-coded
# 200 rather than by the number of samples, and F.softmax is called without
# an explicit dim.
'''
for t in range(100):
    out = net(X_train)                 # input x and predict based on x
    loss = loss_func(out, y_train)     # must be (1. nn output, 2. target), the target label is NOT one-hotted

    optimizer.zero_grad()   # clear gradients for next train
    loss.backward()         # backpropagation, compute gradients
    optimizer.step()        # apply gradients
    
    if t % 10 == 0 or t in [3, 6]:
        # show learning process
        _, prediction = torch.max(F.softmax(out), 1)
        pred_y = prediction.data.numpy().squeeze()
        target_y = y_train.data.numpy()
        accuracy = sum(pred_y == target_y)/200.
        print('Accuracy=%.2f' % accuracy)
'''
# Mini-batch SGD training on the training split.
traindataset = utils.TensorDataset(X_train, y_train)
trainloader = utils.DataLoader(traindataset, batch_size=64, shuffle=True)

epochs = 10
steps = 0           # total number of optimizer updates performed so far
print_every = 20    # report accuracy once every this many updates
for e in range(epochs):
    start = time.time()
    for images, labels in trainloader:
        images, labels = Variable(images), Variable(labels)
        steps += 1

        # Call the module itself rather than .forward() so that any
        # registered hooks run as well.
        out = net(images)
        loss = loss_func(out, labels)
        optimizer.zero_grad()   # clear gradients left over from the previous step
        loss.backward()         # backpropagate to compute fresh gradients
        optimizer.step()        # apply the update

        if steps % print_every == 0:
            # start/stop bracket the interval since the previous report; the
            # elapsed time is recorded but not printed.
            stop = time.time()
            # Accuracy on the current *training* mini-batch.  The arg-max of
            # the raw scores equals the arg-max of their softmax, so no
            # softmax is needed here.
            _, prediction = torch.max(out, 1)
            pred_y = prediction.data.numpy()
            target_y = labels.data.numpy()
            # Average over the actual batch size: the final batch of an
            # epoch is smaller than 64 when the dataset size is not a
            # multiple of the batch size.
            accuracy = np.mean(pred_y == target_y)
            print('Accuracy=%.2f' % accuracy)

            start = time.time()
print(steps)



Accuracy=0.08
Accuracy=0.16
Accuracy=0.06
Accuracy=0.14
Accuracy=0.11
Accuracy=0.08
Accuracy=0.14
Accuracy=0.08
Accuracy=0.08
Accuracy=0.03
Accuracy=0.11
Accuracy=0.05
Accuracy=0.12
Accuracy=0.09
Accuracy=0.16
Accuracy=0.11
Accuracy=0.09
Accuracy=0.08
Accuracy=0.08
Accuracy=0.19
Accuracy=0.14
Accuracy=0.06
Accuracy=0.12
Accuracy=0.11
Accuracy=0.09
Accuracy=0.08
Accuracy=0.02
Accuracy=0.06
Accuracy=0.11
Accuracy=0.14
Accuracy=0.09
Accuracy=0.12
Accuracy=0.12
Accuracy=0.09
Accuracy=0.03
Accuracy=0.09
Accuracy=0.12
Accuracy=0.11
Accuracy=0.12
Accuracy=0.05
Accuracy=0.08
Accuracy=0.05
Accuracy=0.11
Accuracy=0.03
Accuracy=0.12
Accuracy=0.12
Accuracy=0.06
Accuracy=0.17
Accuracy=0.08
Accuracy=0.12
Accuracy=0.03
Accuracy=0.05
Accuracy=0.08
Accuracy=0.11
Accuracy=0.11
Accuracy=0.05
Accuracy=0.08
Accuracy=0.11
Accuracy=0.05
Accuracy=0.11
Accuracy=0.05
Accuracy=0.08
Accuracy=0.14
Accuracy=0.06
Accuracy=0.14
Accuracy=0.08
Accuracy=0.12
Accuracy=0.11
Accuracy=0.11
Accuracy=0.05
Accuracy=0.03
Accura