In [18]:
import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import DataLoader
import torchvision.transforms as tfrms
from torchvision import datasets
import torch.nn.functional as F


class DCNN(nn.Module):
    def __init__(self, num_classes=43):
        super(DCNN, self).__init__()

        # First Convolutional Block
        self.conv1 = nn.Conv2d(3, 32, kernel_size=3, stride=1, padding=1)
        self.bn1 = nn.BatchNorm2d(32)  # Batch normalization layer
        self.pool1 = nn.MaxPool2d(kernel_size=2, stride=2)

        # Second Convolutional Block
        self.conv2 = nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=1)
        self.bn2 = nn.BatchNorm2d(64)
        self.pool2 = nn.MaxPool2d(kernel_size=2, stride=2)

        # Third Convolutional Block
        self.conv3 = nn.Conv2d(64, 128, kernel_size=3, stride=1, padding=1)
        self.bn3 = nn.BatchNorm2d(128)
        self.pool3 = nn.MaxPool2d(kernel_size=2, stride=2)

        # Fourth Convolutional Block (Additional layer for more capacity)
        self.conv4 = nn.Conv2d(128, 256, kernel_size=3, stride=1, padding=1)
        self.bn4 = nn.BatchNorm2d(256)
        self.pool4 = nn.MaxPool2d(kernel_size=2, stride=2)

        # Fully Connected Layers
        # Adjust input size based on the output of the last pooling layer
        self.fc1 = nn.Linear(256 * 4 * 4, 512)  # Adjusted for new conv layers
        self.dropout = nn.Dropout(0.5)  # Dropout layer
        self.fc2 = nn.Linear(512, num_classes)

    def forward(self, x):
        # Convolutional layers with ReLU activation and BatchNorm
        x = self.pool1(F.elu(self.bn1(self.conv1(x))))
        x = self.pool2(F.elu(self.bn2(self.conv2(x))))
        x = self.pool3(F.elu(self.bn3(self.conv3(x))))
        x = self.pool4(F.elu(self.bn4(self.conv4(x))))

        # Flatten the tensor
        x = x.view(x.size(0), -1)  # Flatten for fully connected layer

        # Fully connected layers with ReLU and Dropout
        x = F.elu(self.fc1(x))
        x = self.dropout(x)
        x = self.fc2(x)
        return x

# Step 2: Preprocess and load data
transform = tfrms.Compose([
    tfrms.Resize((64, 64)),
    tfrms.Grayscale(num_output_channels=3),
    tfrms.RandomHorizontalFlip(1),
    tfrms.RandomVerticalFlip(1),
    tfrms.ToTensor(),
    tfrms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])

# Example: If you had a directory for training images
train_data = datasets.ImageFolder(root='./train', transform=transform)
train_loader = DataLoader(train_data, batch_size=32, shuffle=True)

# Step 3: Initialize the model, loss function, and optimizer
model = DCNN()
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.0005, weight_decay=0.0001)  # Reduced learning rate
scheduler = torch.optim.lr_scheduler.StepLR(optimizer, step_size=3, gamma=0.5)

# Step 4: Train the model
num_epochs = 50
for epoch in range(num_epochs):
    model.train()
    running_loss = 0.0
    for images, labels in train_loader:
        optimizer.zero_grad()
        
        # Forward pass
        outputs = model(images)
        loss = criterion(outputs, labels)
        
        # Backward pass and optimize
        loss.backward()
        optimizer.step()
        
        running_loss += loss.item()
    
    print(f"Epoch [{epoch+1}/{num_epochs}], Loss: {running_loss/len(train_loader)}")

# Step 5: Save the model (optional)
torch.save(model.state_dict(), 'road_sign_model.pth')

Epoch [1/50], Loss: 3.3727795680363974
Epoch [2/50], Loss: 2.690106153488159
Epoch [3/50], Loss: 2.2916078567504883
Epoch [4/50], Loss: 2.1802320778369904
Epoch [5/50], Loss: 1.929874489704768
Epoch [6/50], Loss: 1.8027413388093312
Epoch [7/50], Loss: 1.545435627301534
Epoch [8/50], Loss: 1.384815772374471
Epoch [9/50], Loss: 1.2304238726695378
Epoch [10/50], Loss: 0.931684136390686
Epoch [11/50], Loss: 0.8003261884053549
Epoch [12/50], Loss: 0.614353155096372
Epoch [13/50], Loss: 0.5038059130311012
Epoch [14/50], Loss: 0.38790182769298553
Epoch [15/50], Loss: 0.3457387648522854
Epoch [16/50], Loss: 0.23239701303342977
Epoch [17/50], Loss: 0.2783064004033804
Epoch [18/50], Loss: 0.20279688419153294
Epoch [19/50], Loss: 0.15538586614032587
Epoch [20/50], Loss: 0.10159642171735565
Epoch [21/50], Loss: 0.0996670729170243
Epoch [22/50], Loss: 0.0903124666462342
Epoch [23/50], Loss: 0.10131176793947816
Epoch [24/50], Loss: 0.05739230460797747
Epoch [25/50], Loss: 0.06129545524405936
Epoch [

Test The Model

In [19]:
# Load the model
model = DCNN()
model.load_state_dict(torch.load('road_sign_model.pth'))
model.eval()  # Set the model to evaluation mode

test_data = datasets.ImageFolder(root='./test', transform=transform)
test_loader = DataLoader(test_data, batch_size=32, shuffle=False)

correct = 0
total = 0

with torch.no_grad():  # Disable gradient calculation for evaluation
    for images, labels in test_loader:
        outputs = model(images)
        _, predicted = torch.max(outputs, 1)  # Get the class with the highest score
        total += labels.size(0)  # Total number of labels
        correct += (predicted == labels).sum().item()  # Count correct predictions

accuracy = 100 * correct / total
print(f'Accuracy on test dataset: {accuracy:.2f}%')

Accuracy on test dataset: 27.27%


In [20]:
# Load the model
model = DCNN()
model.load_state_dict(torch.load('road_sign_model.pth'))
model.eval()  # Set the model to evaluation mode

test_data = datasets.ImageFolder(root='./testCorrected', transform=transform)
test_loader = DataLoader(test_data, batch_size=32, shuffle=False)

correct = 0
total = 0

with torch.no_grad():  # Disable gradient calculation for evaluation
    for images, labels in test_loader:
        outputs = model(images)
        _, predicted = torch.max(outputs, 1)  # Get the class with the highest score
        total += labels.size(0)  # Total number of labels
        correct += (predicted == labels).sum().item()  # Count correct predictions

accuracy = 100 * correct / total
print(f'Accuracy on test dataset: {accuracy:.2f}%')

Accuracy on test dataset: 14.94%


In [23]:
from PIL import Image

# Load and preprocess a single image
image_path = './test/0/00000_00000_00003.jpg'
image = Image.open(image_path)
image = transform(image).unsqueeze(0)  # Add batch dimension

# Get the model's prediction
model.eval()
with torch.no_grad():
    output = model(image)
    _, predicted = torch.max(output, 1)
    class_idx = predicted.item()

# Get the class name from your dataset
class_name = test_data.classes[class_idx]
print(f'Predicted class: {class_name}')

Predicted class: 12


In [None]:
import matplotlib.pyplot as plt

def imshow(img, label, prediction):
    img = img.permute(1, 2, 0)  # Change shape for display
    img = img * torch.tensor([0.229, 0.224, 0.225]) + torch.tensor([0.485, 0.456, 0.406])  # Denormalize
    plt.imshow(img.numpy())
    plt.title(f'True: {label}, Pred: {prediction}')
    plt.show()

# Display some test images with predictions
for images, labels in test_loader:
    outputs = model(images)
    _, predictions = torch.max(outputs, 1)
    for i in range(4):  # Show first 4 images in the batch
        imshow(images[i], test_data.classes[labels[i]], test_data.classes[predictions[i]])
    break