Using PyTorch to first train on the CIFAR-10 dataset (blind experimentation)

In [None]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
import numpy as np

# Device configuration: use CUDA when PyTorch reports it as available, else the CPU
device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')

# Hyperparameters (Blind Experimentation)
num_epochs, batch_size = 10, 100
learning_rate = 1e-4
hidden_sizes = [32, 64]  # Output channels of the first and second convolutional stage
dropout_prob = 0.5

# CIFAR-10 dataset
# Every image is converted to a tensor, then each of the three channels is
# normalised with mean 0.5 and standard deviation 0.5.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.5, 0.5, 0.5), std=(0.5, 0.5, 0.5)),
])

# Only the training split requests a download; the test split reads the same root.
train_dataset = torchvision.datasets.CIFAR10(
    root='./data', train=True, download=True, transform=transform)
test_dataset = torchvision.datasets.CIFAR10(
    root='./data', train=False, transform=transform)

# Training batches are reshuffled each epoch; test batches keep dataset order.
train_loader = torch.utils.data.DataLoader(
    dataset=train_dataset, batch_size=batch_size, shuffle=True)
test_loader = torch.utils.data.DataLoader(
    dataset=test_dataset, batch_size=batch_size, shuffle=False)

# Convolutional neural network (CNN)
class CNN(nn.Module):
    """Two-stage convolutional classifier for 3-channel 32x32 images.

    Each stage is a 5x5 convolution (stride 1, padding 2), a ReLU and a 2x2
    max-pool. The pooled feature maps are flattened, passed through dropout
    and mapped to class scores by a single linear layer.

    Args:
        num_classes: Number of output scores produced per image.
        channel_sizes: Output channels of the two convolutional stages.
            When None, the module-level ``hidden_sizes`` is used.
        drop_prob: Dropout probability. When None, the module-level
            ``dropout_prob`` is used.
    """

    def __init__(self, num_classes=10, channel_sizes=None, drop_prob=None):
        super(CNN, self).__init__()
        # Fall back to the notebook-level hyperparameters unless overridden.
        if channel_sizes is None:
            channel_sizes = hidden_sizes
        if drop_prob is None:
            drop_prob = dropout_prob
        first_width, second_width = channel_sizes[0], channel_sizes[1]

        self.layer1 = nn.Sequential(
            nn.Conv2d(3, first_width, kernel_size=5, stride=1, padding=2),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2))
        self.layer2 = nn.Sequential(
            nn.Conv2d(first_width, second_width, kernel_size=5, stride=1, padding=2),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2))
        # Two 2x2 poolings shrink a 32x32 input to 8x8, hence the 8 * 8 factor.
        self.fc = nn.Linear(second_width * 8 * 8, num_classes)
        self.dropout = nn.Dropout(drop_prob)

    def forward(self, x):
        """Return one row of ``num_classes`` raw scores per input image."""
        out = self.layer1(x)
        out = self.layer2(out)
        out = out.reshape(out.size(0), -1)
        # Dropout must act on the features, not on the class scores: dropping
        # logits after `fc` randomly zeroes class outputs during training and
        # distorts the loss.
        out = self.dropout(out)
        out = self.fc(out)
        return out

# Instantiate the network and place it on the selected device
model = CNN()
model = model.to(device)

# Loss and optimizer
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(params=model.parameters(), lr=learning_rate)

# Train the model
total_step = len(train_loader)
for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        images, labels = images.to(device), labels.to(device)

        # Clear the gradients of the previous step before the new pass
        optimizer.zero_grad()

        # Forward pass
        outputs = model(images)
        loss = criterion(outputs, labels)

        # Backward pass and parameter update
        loss.backward()
        optimizer.step()

        # Report the current batch loss once every 100 steps
        if (i + 1) % 100 != 0:
            continue
        print ('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}'
               .format(epoch+1, num_epochs, i+1, total_step, loss.item()))

# Test the model
model.eval()
correct = 0
total = 0
with torch.no_grad():
    for images, labels in test_loader:
        images, labels = images.to(device), labels.to(device)
        outputs = model(images)
        # The predicted class is the index of the largest score in each row
        predicted = outputs.data.max(dim=1)[1]
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print('Accuracy of the network on the 10000 test images: {} %'.format(100 * correct / total))


Downloading https://www.cs.toronto.edu/~kriz/cifar-10-python.tar.gz to ./data/cifar-10-python.tar.gz


100%|██████████| 170498071/170498071 [00:12<00:00, 13133623.22it/s]


Extracting ./data/cifar-10-python.tar.gz to ./data
Epoch [1/10], Step [100/500], Loss: 2.0631
Epoch [1/10], Step [200/500], Loss: 2.0667
Epoch [1/10], Step [300/500], Loss: 1.9574
Epoch [1/10], Step [400/500], Loss: 1.8549
Epoch [1/10], Step [500/500], Loss: 1.8308
Epoch [2/10], Step [100/500], Loss: 1.8947
Epoch [2/10], Step [200/500], Loss: 1.6624
Epoch [2/10], Step [300/500], Loss: 1.7838
Epoch [2/10], Step [400/500], Loss: 1.7976
Epoch [2/10], Step [500/500], Loss: 1.8401
Epoch [3/10], Step [100/500], Loss: 1.7977
Epoch [3/10], Step [200/500], Loss: 1.8099
Epoch [3/10], Step [300/500], Loss: 1.8168
Epoch [3/10], Step [400/500], Loss: 1.8218
Epoch [3/10], Step [500/500], Loss: 1.6896
Epoch [4/10], Step [100/500], Loss: 1.6834
Epoch [4/10], Step [200/500], Loss: 1.8669
Epoch [4/10], Step [300/500], Loss: 1.8942
Epoch [4/10], Step [400/500], Loss: 1.7599
Epoch [4/10], Step [500/500], Loss: 1.9970
Epoch [5/10], Step [100/500], Loss: 1.7636
Epoch [5/10], Step [200/500], Loss: 1.8005
Epo

Reducing the hyperparameter search space

In [None]:
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms
import numpy as np

# Device configuration: use CUDA when PyTorch reports it as available, else the CPU
device = torch.device('cuda') if torch.cuda.is_available() else torch.device('cpu')

# Hyperparameters (Blind Experimentation)
num_epochs, batch_size = 10, 100
learning_rate = 1e-4
hidden_sizes = [32, 64]  # Output channels of the first and second convolutional stage
dropout_prob = 0.5

# CIFAR-10 dataset
# Every image is converted to a tensor, then each of the three channels is
# normalised with mean 0.5 and standard deviation 0.5.
transform = transforms.Compose([
    transforms.ToTensor(),
    transforms.Normalize(mean=(0.5, 0.5, 0.5), std=(0.5, 0.5, 0.5)),
])

# Only the training split requests a download; the test split reads the same root.
train_dataset = torchvision.datasets.CIFAR10(
    root='./data', train=True, download=True, transform=transform)
test_dataset = torchvision.datasets.CIFAR10(
    root='./data', train=False, transform=transform)

# Training batches are reshuffled each epoch; test batches keep dataset order.
train_loader = torch.utils.data.DataLoader(
    dataset=train_dataset, batch_size=batch_size, shuffle=True)
test_loader = torch.utils.data.DataLoader(
    dataset=test_dataset, batch_size=batch_size, shuffle=False)

# Convolutional neural network (CNN)
class CNN(nn.Module):
    """Two-stage convolutional classifier for 3-channel 32x32 images.

    Each stage is a 5x5 convolution (stride 1, padding 2), a ReLU and a 2x2
    max-pool. The pooled feature maps are flattened, passed through dropout
    and mapped to class scores by a single linear layer.

    Args:
        num_classes: Number of output scores produced per image.
        channel_sizes: Output channels of the two convolutional stages.
            When None, the module-level ``hidden_sizes`` is used.
        drop_prob: Dropout probability. When None, the module-level
            ``dropout_prob`` is used.
    """

    def __init__(self, num_classes=10, channel_sizes=None, drop_prob=None):
        super(CNN, self).__init__()
        # Fall back to the notebook-level hyperparameters unless overridden.
        if channel_sizes is None:
            channel_sizes = hidden_sizes
        if drop_prob is None:
            drop_prob = dropout_prob
        first_width, second_width = channel_sizes[0], channel_sizes[1]

        self.layer1 = nn.Sequential(
            nn.Conv2d(3, first_width, kernel_size=5, stride=1, padding=2),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2))
        self.layer2 = nn.Sequential(
            nn.Conv2d(first_width, second_width, kernel_size=5, stride=1, padding=2),
            nn.ReLU(),
            nn.MaxPool2d(kernel_size=2, stride=2))
        # Two 2x2 poolings shrink a 32x32 input to 8x8, hence the 8 * 8 factor.
        self.fc = nn.Linear(second_width * 8 * 8, num_classes)
        self.dropout = nn.Dropout(drop_prob)

    def forward(self, x):
        """Return one row of ``num_classes`` raw scores per input image."""
        out = self.layer1(x)
        out = self.layer2(out)
        out = out.reshape(out.size(0), -1)
        # Dropout must act on the features, not on the class scores: dropping
        # logits after `fc` randomly zeroes class outputs during training and
        # distorts the loss.
        out = self.dropout(out)
        out = self.fc(out)
        return out

# Calculate Compression Ratio
def calculate_compression_ratio(input_shape, output_shape, kernel_size, stride):
    """Return the element-count ratio of a layer scaled by kernel and stride.

    The result is ``prod(input_shape) / prod(output_shape)`` multiplied by
    ``kernel_size ** 2`` and divided by ``stride ** 2``.

    Args:
        input_shape: Dimensions of the layer input, e.g. ``(3, 32, 32)``.
        output_shape: Dimensions of the layer output.
        kernel_size: Side length of the square kernel.
        stride: Stride of the layer.
    """
    n_in = np.prod(input_shape)
    n_out = np.prod(output_shape)
    element_ratio = n_in / n_out
    return element_ratio * kernel_size ** 2 / stride ** 2

# Loss function only; the optimizer is created further down, together with the model
criterion = nn.CrossEntropyLoss()

# Train and evaluate the model
def train_and_evaluate(model, optimizer, criterion, train_loader, test_loader,
                       epochs=None, run_device=None):
    """Train ``model`` and return its accuracy on ``test_loader`` in percent.

    The model is switched to training mode before the first batch, so the
    function can be called repeatedly on the same model even though every
    call leaves it in evaluation mode.

    Args:
        model: Network to optimise; called as ``model(images)``.
        optimizer: Optimizer that updates the model's parameters.
        criterion: Loss called as ``criterion(outputs, labels)``.
        train_loader: Sized iterable of ``(images, labels)`` training batches.
        test_loader: Iterable of ``(images, labels)`` evaluation batches.
        epochs: Number of passes over ``train_loader``. When None, the
            module-level ``num_epochs`` is used.
        run_device: Device the batches are moved to. When None, the
            module-level ``device`` is used.

    Returns:
        Percentage of test samples whose highest-scoring class equals the label.

    Raises:
        ZeroDivisionError: If ``test_loader`` yields no samples.
    """
    # Fall back to the notebook-level settings unless overridden.
    if epochs is None:
        epochs = num_epochs
    if run_device is None:
        run_device = device

    # Train the model
    # A previous call ends with model.eval(); without this, a repeated call
    # would train with dropout (and any other train-only layers) disabled.
    model.train()
    total_step = len(train_loader)
    for epoch in range(epochs):
        for i, (images, labels) in enumerate(train_loader):
            images = images.to(run_device)
            labels = labels.to(run_device)

            # Forward pass
            outputs = model(images)
            loss = criterion(outputs, labels)

            # Backward and optimize
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()

            # Report the current batch loss once every 100 steps
            if (i+1) % 100 == 0:
                print('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}'
                      .format(epoch+1, epochs, i+1, total_step, loss.item()))

    # Test the model
    model.eval()
    correct = 0
    total = 0
    with torch.no_grad():
        for images, labels in test_loader:
            images = images.to(run_device)
            labels = labels.to(run_device)
            outputs = model(images)
            # Gradients are already disabled here, so `.data` is not needed.
            _, predicted = torch.max(outputs, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()

    accuracy = 100 * correct / total
    print('Accuracy of the network on the 10000 test images: {} %'.format(accuracy))

    return accuracy

# Initialize model and optimizer
model = CNN().to(device)
optimizer = optim.Adam(model.parameters(), lr=learning_rate)

# Initial blind experiment
accuracy = train_and_evaluate(model, optimizer, criterion, train_loader, test_loader)

# Calculate compression ratio for each convolutional layer.
# The tuple (3, 32, 32) represents the shape of the input tensor to the first convolutional layer:
# in the CIFAR-10 dataset, each image has three color channels (RGB), and each channel has a
# resolution of 32x32 pixels. The other tuples are the shapes after each conv + pool stage.
compression_ratio1 = calculate_compression_ratio((3, 32, 32), (32, 16, 16), 5, 1)
compression_ratio2 = calculate_compression_ratio((32, 16, 16), (64, 8, 8), 5, 1)

# NOTE(review): the intent stated here was to update the hyperparameters based on the
# compression ratios and then train and evaluate again. As written, the ratios above are
# never used and no hyperparameter changes, so the second run only continues training the
# same model with the same optimizer. The update rule still has to be supplied.
# train_and_evaluate() leaves the model in evaluation mode, so switch back to training
# mode explicitly; otherwise the second run would train with dropout disabled.
model.train()
accuracy_after_compression = train_and_evaluate(model, optimizer, criterion, train_loader, test_loader)

print("Accuracy before compression:", accuracy)
print("Accuracy after compression:", accuracy_after_compression)


Files already downloaded and verified
Epoch [1/10], Step [100/500], Loss: 2.0900
Epoch [1/10], Step [200/500], Loss: 2.0778
Epoch [1/10], Step [300/500], Loss: 2.0102
Epoch [1/10], Step [400/500], Loss: 1.8855
Epoch [1/10], Step [500/500], Loss: 2.0610
Epoch [2/10], Step [100/500], Loss: 2.0170
Epoch [2/10], Step [200/500], Loss: 1.9093
Epoch [2/10], Step [300/500], Loss: 1.8675
Epoch [2/10], Step [400/500], Loss: 1.9958
Epoch [2/10], Step [500/500], Loss: 1.9317
Epoch [3/10], Step [100/500], Loss: 1.6829
Epoch [3/10], Step [200/500], Loss: 1.7935
Epoch [3/10], Step [300/500], Loss: 1.7509
Epoch [3/10], Step [400/500], Loss: 1.7408
Epoch [3/10], Step [500/500], Loss: 1.9767
Epoch [4/10], Step [100/500], Loss: 1.7817
Epoch [4/10], Step [200/500], Loss: 1.8162
Epoch [4/10], Step [300/500], Loss: 1.7876
Epoch [4/10], Step [400/500], Loss: 1.7283
Epoch [4/10], Step [500/500], Loss: 1.7603
Epoch [5/10], Step [100/500], Loss: 1.8196
Epoch [5/10], Step [200/500], Loss: 1.9152
Epoch [5/10], St