# Build a Traffic Sign Recognition Classifier

---
## Load The Data

In [None]:
# Load pickled data
import pickle

# Locations of the pickled training and testing splits.
training_file = "data/train.p"
testing_file = "data/test.p"

# Each pickle is read as a dict; only its 'features' and 'labels' entries are
# used below.
# NOTE(review): pickle.load can execute arbitrary code from the file, so only
# load pickles that come from a trusted source.
with open(training_file, 'rb') as f:
    train = pickle.load(f)
with open(testing_file, 'rb') as f:
    test = pickle.load(f)

X_train = train['features']
y_train = train['labels']
X_test = test['features']
y_test = test['labels']

---

## Dataset Summary & Exploration

The pickled data is a dictionary with 4 key/value pairs:

- `'features'` is a 4D array containing raw pixel data of the traffic sign images, (num examples, width, height, channels).
- `'labels'` is a 1D array containing the label/class id of the traffic sign. The file `signnames.csv` contains id -> name mappings for each id.
- `'sizes'` is a list containing tuples, (width, height) representing the original width and height of the image.
- `'coords'` is a list containing tuples, (x1, y1, x2, y2) representing coordinates of a bounding box around the sign in the image. **THESE COORDINATES ASSUME THE ORIGINAL IMAGE. THE PICKLED DATA CONTAINS RESIZED VERSIONS (32 by 32) OF THESE IMAGES**

In [None]:
# Dataset sizes: one entry along the first axis per example.
n_train = len(X_train)
n_test = len(X_test)

# Shape of a single traffic sign image with its last axis (channels) dropped.
image_shape = X_train[0].shape[:-1]

# Number of distinct label values that occur in the training labels.
n_classes = len(set(y_train))

# Report the summary, one "caption value" pair per line.
for caption, value in (
    ("Number of training examples =", n_train),
    ("Number of testing examples =", n_test),
    ("Image data shape =", image_shape),
    ("Number of classes =", n_classes),
):
    print(caption, value)

Visualize the German Traffic Signs Dataset using the pickled file(s).

In [None]:
### Data exploration visualization.
import matplotlib.pyplot as plt
import numpy as np
import random
%matplotlib inline

# Bar chart: number of training examples per class id.
fig, ax = plt.subplots()
ax.bar(range(n_classes), np.bincount(y_train), width=0.5, color='r')
ax.set(xlabel='Signs', ylabel='Count', title='The count of each sign')
plt.show()

# Image grid: one randomly chosen training example for every class id.
# The 8x8 layout has room for at most 64 classes.
plt.figure(figsize=(16, 16))
for c in range(n_classes):
    members = np.flatnonzero(y_train == c)  # indices of the examples labelled c
    i = random.choice(members)
    plt.subplot(8, 8, c + 1)
    plt.axis('off')
    plt.title('class: {}'.format(c))
    plt.imshow(X_train[i])

----

## Design and Test a Baseline Model Architecture

### Custom Dataset

In [None]:
import torch
from torch.utils.data.dataset import Dataset
import torchvision.transforms as transforms

class PickledDataset(Dataset):
    """Dataset backed by a pickled dict that has 'features' and 'labels' entries."""

    def __init__(self, file_path, transform=None):
        """Load the pickle at ``file_path``.

        ``transform``, when given, is called on each feature as it is fetched.
        """
        self.transform = transform
        with open(file_path, 'rb') as handle:
            payload = pickle.load(handle)
        self.features = payload['features']
        self.labels = payload['labels']
        # The number of labels defines the dataset length.
        self.count = len(self.labels)

    def __len__(self):
        """Return the number of labelled examples."""
        return self.count

    def __getitem__(self, index):
        """Return ``(feature, label)`` for ``index``, transforming the feature if configured."""
        sample = self.features[index]
        if self.transform is None:
            return (sample, self.labels[index])
        return (self.transform(sample), self.labels[index])

In [None]:
# Baseline preprocessing: the only step is the ToTensor conversion.
data_transforms = transforms.Compose([transforms.ToTensor()])

# Both splits go through the same preprocessing.
train_dataset = PickledDataset(training_file, transform=data_transforms)
test_dataset = PickledDataset(testing_file, transform=data_transforms)

# Training batches are shuffled; the test loader keeps the stored order.
train_loader = torch.utils.data.DataLoader(
    train_dataset,
    batch_size=64,
    shuffle=True,
    num_workers=1,
)
test_loader = torch.utils.data.DataLoader(
    test_dataset,
    batch_size=64,
    shuffle=False,
    num_workers=1,
)

### Baseline Model

In [None]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

class BaselineNet(nn.Module):
    """Small CNN (two conv layers, two linear layers) returning log-probabilities.

    Args:
        num_classes: Width of the output layer. Defaults to 43, the value that
            was previously hard-coded.
    """

    def __init__(self, num_classes: int = 43):
        super().__init__()
        self.conv1 = nn.Conv2d(3, 10, kernel_size=5)
        self.conv2 = nn.Conv2d(10, 20, kernel_size=5)
        self.conv2_drop = nn.Dropout2d()
        # 500 = 20 channels * 5 * 5: the size of the pooled conv2 output for a
        # 32x32 input (32 -> 28 -> 14 -> 10 -> 5).
        self.fc1 = nn.Linear(500, 50)
        self.fc2 = nn.Linear(50, num_classes)

    def forward(self, x):
        """Return per-class log-probabilities of shape (batch, num_classes).

        Raises:
            RuntimeError: if the spatial size of ``x`` does not yield 500
                features per sample.
        """
        x = F.relu(F.max_pool2d(self.conv1(x), 2))
        x = F.relu(F.max_pool2d(self.conv2_drop(self.conv2(x)), 2))
        # Flatten per sample rather than with view(-1, 500): the latter silently
        # re-batches inputs whose total element count happens to be a multiple
        # of 500 instead of reporting the shape mismatch.
        x = x.view(x.size(0), -1)
        x = F.relu(self.fc1(x))
        # Functional dropout must be told explicitly whether we are training.
        x = F.dropout(x, training=self.training)
        x = self.fc2(x)
        return F.log_softmax(x, dim=1)

### Training

In [None]:
# Use CUDA when PyTorch reports it as available, otherwise the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")

# Model, optimizer and loss shared by the train()/validation() helpers.
model = BaselineNet().to(device)
optimizer = optim.Adam(model.parameters(), lr=0.001)
# NLLLoss pairs with the log_softmax output of the model.
criterion = nn.NLLLoss()

# Number of passes over the training data per experiment.
n_epochs = 30

In [None]:
def train():
    """Run one optimisation pass over ``train_loader``.

    Uses the module-level ``model``, ``optimizer``, ``criterion``, ``device``
    and ``train_loader``.

    Returns:
        The summed batch losses (each weighted by its batch size) divided by
        ``len(train_loader.dataset)``.
    """
    model.train()
    running_loss = 0
    for inputs, targets in train_loader:
        inputs = inputs.to(device)
        targets = targets.to(device, dtype=torch.int64)
        optimizer.zero_grad()
        batch_loss = criterion(model(inputs), targets)
        batch_loss.backward()
        optimizer.step()
        # Weight the batch loss by the batch size so a smaller final batch
        # does not count as much as a full one.
        running_loss += batch_loss.item() * inputs.size(0)
    return running_loss / len(train_loader.dataset)

In [None]:
def validation():
    """Evaluate the model on ``test_loader``.

    Uses the module-level ``model``, ``criterion``, ``device`` and
    ``test_loader``. Note that, despite the name, the data evaluated here is
    whatever ``test_loader`` wraps.

    Returns:
        A ``(loss, accuracy)`` tuple: the size-weighted mean loss over
        ``len(test_loader.dataset)`` samples and the percentage of samples
        whose arg-max prediction equals the label.
    """
    model.eval()
    valid_loss = 0
    n_correct = 0
    # No gradients are needed for evaluation; disabling autograd avoids
    # building a graph for every batch.
    with torch.no_grad():
        for x, y in test_loader:
            x, y = x.to(device), y.to(device, dtype=torch.int64)
            output = model(x)
            loss = criterion(output, y)
            # Weight by batch size so a smaller last batch is not over-counted.
            valid_loss += loss.item() * x.size(0)
            pred = torch.argmax(output, dim=1)
            n_correct += (pred == y.view_as(pred)).sum().item()
    n_samples = len(test_loader.dataset)
    valid_loss = valid_loss / n_samples
    accuracy = n_correct / n_samples * 100
    return valid_loss, accuracy

In [None]:
# Baseline run: one train() pass and one validation() pass per epoch,
# printing the three metrics on a single tab-separated line.
for epoch in range(1, n_epochs + 1):
    train_loss = train()
    valid_loss, accuracy = validation()
    print(
        '[Epoch #{}] Training Loss: {:.6f}\tValidation Loss: {:.6f}\tValidation Accuracy: {:.3f}%'.format(
            epoch, train_loss, valid_loss, accuracy
        )
    )

## Experiment and fine tuning

### Image normalize

In [None]:
# Flatten each channel of the training images (last axis index 0, 1, 2) and
# divide by 255.
# NOTE(review): assumes 8-bit pixel values, so the result lies in [0, 1] - confirm.
red_chan = X_train[..., 0].reshape(-1) / 255
green_chan = X_train[..., 1].reshape(-1) / 255
blue_chan = X_train[..., 2].reshape(-1) / 255

# Per-channel mean and standard deviation, in R, G, B order.
means = [np.mean(chan) for chan in (red_chan, green_chan, blue_chan)]
stds = [np.std(chan) for chan in (red_chan, green_chan, blue_chan)]

print(means)
print(stds)

In [None]:
# Preprocessing with per-channel normalisation added after ToTensor.
# NOTE(review): the constants are presumably the rounded means/stds printed by
# the statistics cell - confirm they match the current data.
data_transforms = transforms.Compose(
    [
        transforms.ToTensor(),
        transforms.Normalize((0.3398, 0.3117, 0.3210), (0.2755, 0.2647, 0.2712)),
    ]
)

# Rebuild both datasets so they pick up the new transform.
train_dataset = PickledDataset(training_file, transform=data_transforms)
test_dataset = PickledDataset(testing_file, transform=data_transforms)

# Same loader settings as the baseline: shuffled training, ordered test.
train_loader = torch.utils.data.DataLoader(
    train_dataset,
    batch_size=64,
    shuffle=True,
    num_workers=1,
)
test_loader = torch.utils.data.DataLoader(
    test_dataset,
    batch_size=64,
    shuffle=False,
    num_workers=1,
)

In [None]:
# Start this experiment from freshly initialised weights and optimizer state.
# train() and validation() read the module-level `model` and `optimizer`, so
# without this reset the run would keep training the network left over from
# the previous experiment and the reported metrics would not be comparable.
model = BaselineNet().to(device)
optimizer = optim.Adam(model.parameters(), lr=0.001)

for epoch in range(1, n_epochs + 1):
    train_loss = train()
    valid_loss, accuracy = validation()
    print('[Epoch #{}] Training Loss: {:.6f}\tValidation Loss: {:.6f}\tValidation Accuracy: {:.3f}%'.format(epoch, train_loss, valid_loss, accuracy))

### Handling imbalanced dataset

In [None]:
# Weighted sampler: every training example gets weight 1 / (size of its class),
# so each class carries the same total weight.
class_sample_count = np.bincount(y_train)
# Indexing the count table with the label array looks up each example's class size.
weights = 1 / class_sample_count[y_train]
# Draw as many samples per pass as there are training examples.
sampler = torch.utils.data.sampler.WeightedRandomSampler(weights, len(weights))

In [None]:
import PIL

# Data augmentation
# torchvision replaced RandomRotation's `resample` argument with
# `interpolation`, and newer releases reject `resample`. Prefer the new
# spelling and fall back to the old one only on versions without
# InterpolationMode.
try:
    from torchvision.transforms import InterpolationMode
except ImportError:
    random_rotation = transforms.RandomRotation(20, resample=PIL.Image.BILINEAR)
else:
    random_rotation = transforms.RandomRotation(20, interpolation=InterpolationMode.BILINEAR)

# Training images are randomly rotated by up to 20 degrees before being
# converted and normalised; RandomRotation here operates on a PIL image, hence
# the ToPILImage step first.
train_data_transforms = transforms.Compose([
    transforms.ToPILImage(),
    random_rotation,
    transforms.ToTensor(),
    transforms.Normalize((0.3398, 0.3117, 0.3210), (0.2755, 0.2647, 0.2712))
])
# Test images are only converted and normalised (no augmentation).
test_data_transforms = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize((0.3398, 0.3117, 0.3210), (0.2755, 0.2647, 0.2712))
])

train_dataset = PickledDataset(training_file, transform=train_data_transforms)
test_dataset = PickledDataset(testing_file, transform=test_data_transforms)

# The weighted sampler decides which training examples are drawn, so `shuffle`
# is not passed for the training loader.
train_loader = torch.utils.data.DataLoader(train_dataset, batch_size=64, sampler=sampler, num_workers=1)
test_loader = torch.utils.data.DataLoader(test_dataset, batch_size=64, shuffle=False, num_workers=1)

In [None]:
# Draw one full pass from the sampler-driven loader and collect the labels it
# yields, to inspect the class distribution the model will actually see.
# Batches are gathered in a list and concatenated once; calling np.append in
# the loop would copy the whole array for every batch. The labels are only
# counted on the host, so they are not moved to `device`.
label_batches = [np.array([], dtype=np.int64)]  # seed keeps the dtype if the loader is empty
for _, y in train_loader:
    label_batches.append(y.numpy().astype(np.int64))
balacned_y_train = np.concatenate(label_batches)

fig, ax = plt.subplots()
# minlength keeps one bar per class even if the highest class ids were not
# drawn in this pass; otherwise the counts would be shorter than range(n_classes).
ax.bar(range(n_classes), np.bincount(balacned_y_train, minlength=n_classes), 0.5, color='r')
ax.set_xlabel('Signs')
ax.set_ylabel('Count')
ax.set_title('The count of each sign')
plt.show()

In [None]:
# Show the first batch produced by the training loader.
# The batch is only plotted, so it is converted straight to numpy without a
# round trip through `device`.
x, y = next(iter(train_loader))
x, y = x.numpy(), y.numpy()

# Statistics used by the Normalize transform; defined once, outside the loop,
# and applied in reverse to bring the images back to displayable values.
mean = np.array([0.3398, 0.3117, 0.3210])
std = np.array([0.2755, 0.2647, 0.2712])

plt.figure(figsize=(16, 16))
# The 8x8 grid holds at most 64 images, which matches the loader's batch size.
for i, label in enumerate(y):
    plt.subplot(8, 8, i + 1)
    plt.axis('off')
    plt.title('class: {}'.format(label))
    # Channels-first (C, H, W) -> channels-last (H, W, C) for imshow.
    image = np.transpose(x[i], (1, 2, 0))
    image = np.clip(std * image + mean, 0, 1)
    plt.imshow(image)

In [None]:
# Start this experiment from freshly initialised weights and optimizer state.
# train() and validation() read the module-level `model` and `optimizer`, so
# without this reset the run would keep training the network left over from
# the previous experiment and the reported metrics would not be comparable.
model = BaselineNet().to(device)
optimizer = optim.Adam(model.parameters(), lr=0.001)

for epoch in range(1, n_epochs + 1):
    train_loss = train()
    valid_loss, accuracy = validation()
    print('[Epoch #{}] Training Loss: {:.6f}\tValidation Loss: {:.6f}\tValidation Accuracy: {:.3f}%'.format(epoch, train_loss, valid_loss, accuracy))

### Contrast-limited adaptive histogram equalization

### Pretrained model VS Custom model

### Spatial transformer networks