In [2]:
import torch
import torch.nn as nn
import torch.optim as optim
from torchvision import datasets, transforms

import tensorflow as tf
from tensorflow import keras

# PyTorch input pipeline: convert each image to a tensor, then normalize it
# with mean 0.5 and standard deviation 0.5.
transform = transforms.Compose(
    [transforms.ToTensor(), transforms.Normalize((0.5,), (0.5,))]
)

# MNIST training split, served in shuffled mini-batches of 64.
train_dataset = datasets.MNIST(root='./data', train=True, download=True, transform=transform)
train_loader = torch.utils.data.DataLoader(dataset=train_dataset, batch_size=64, shuffle=True)

# MNIST test split with the same preprocessing, served in a fixed order.
test_dataset = datasets.MNIST(root='./data', train=False, download=True, transform=transform)
test_loader = torch.utils.data.DataLoader(dataset=test_dataset, batch_size=64, shuffle=False)

# Define a PyTorch Neural Network Class
class Net(nn.Module):
    """Fully connected classifier with a single hidden ReLU layer.

    Args:
        in_features: Number of values per flattened input sample
            (defaults to 28 * 28).
        hidden_features: Width of the hidden layer (defaults to 512).
        num_classes: Number of output logits (defaults to 10).
    """

    def __init__(self, in_features=28 * 28, hidden_features=512, num_classes=10):
        super().__init__()
        # First fully connected layer
        self.fc1 = nn.Linear(in_features, hidden_features)
        # Second fully connected layer that outputs one logit per class
        self.fc2 = nn.Linear(hidden_features, num_classes)

    def forward(self, x):
        """Return raw (un-normalized) class logits for a batch of inputs.

        Args:
            x: Tensor whose element count is a multiple of ``in_features``;
                it is flattened to ``(-1, in_features)`` before the first
                layer.

        Returns:
            Tensor of shape ``(batch, num_classes)``; no softmax is applied.
        """
        # reshape (rather than view) also accepts non-contiguous inputs such
        # as transposed or permuted image batches, copying only when needed.
        x = x.reshape(-1, self.fc1.in_features)
        x = torch.relu(self.fc1(x))  # Activation function after first layer
        return self.fc2(x)  # Output layer

# Build the network that will be trained
model_pytorch = Net()

# Cross-entropy objective, minimized by SGD with momentum
criterion = nn.CrossEntropyLoss()
optimizer = optim.SGD(
    params=model_pytorch.parameters(),
    lr=0.01,
    momentum=0.9,
)

# Train the PyTorch model: five passes over the training loader
for epoch in range(5):
    running_loss = 0.0  # Loss accumulated since the last report
    for i, (inputs, labels) in enumerate(train_loader):
        optimizer.zero_grad()  # Clear gradients left from the previous step
        loss = criterion(model_pytorch(inputs), labels)  # Forward pass + loss
        loss.backward()  # Backpropagate the error
        optimizer.step()  # Update the weights
        running_loss += loss.item()
        if (i + 1) % 100 != 0:
            continue
        # Report the mean loss over the last 100 mini-batches, then reset
        print(f"[{epoch + 1}, {i + 1}] loss: {running_loss / 100:.3f}")
        running_loss = 0.0

# Evaluation for PyTorch model
# Put the module in evaluation mode before measuring accuracy. The current
# network has no mode-dependent layers, but this keeps the measurement
# correct if dropout or batch normalization is added later.
model_pytorch.eval()
correct = 0
total = 0
with torch.no_grad():  # Gradients are not needed for inference
    for images, labels in test_loader:
        outputs = model_pytorch(images)
        # Index of the largest logit along dim 1 is the predicted class.
        # Under no_grad the outputs carry no graph, so the legacy `.data`
        # access is unnecessary.
        _, predicted = torch.max(outputs, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print(f'Accuracy of the PyTorch network on the 10000 test images: {100 * correct / total}%')

# TensorFlow and Keras
# Load MNIST dataset
(x_train, y_train), (x_test, y_test) = keras.datasets.mnist.load_data()
x_train = x_train / 255.0  # Scale the training pixels by 1/255
x_test = x_test / 255.0  # Scale the testing pixels by 1/255

# Define the Keras model.
# The input shape is declared with an explicit keras.Input object rather than
# an `input_shape=` argument on the first layer, which Keras discourages (and
# warns about) for Sequential models.
model_keras = keras.Sequential([
    keras.Input(shape=(28, 28)),  # One 28x28 image per sample
    keras.layers.Flatten(),  # Flatten the images
    keras.layers.Dense(512, activation='relu'),  # Dense layer with 512 neurons
    keras.layers.Dense(10, activation='softmax')  # Output layer with softmax for multi-class classification
])

# Compile the Keras model
model_keras.compile(optimizer='adam',  # Optimizer
              loss='sparse_categorical_crossentropy',  # Loss function
              metrics=['accuracy'])  # Metrics to monitor

# Training for Keras model.
# NOTE(review): the test split doubles as validation data here, so the
# val_* numbers are for monitoring only and must not drive model selection.
model_keras.fit(x_train, y_train, epochs=5, batch_size=64, validation_data=(x_test, y_test))

# Evaluation for Keras model
test_loss, test_acc = model_keras.evaluate(x_test, y_test)
print(f'Test accuracy of the Keras model: {test_acc}')


[1, 100] loss: 0.871
[1, 200] loss: 0.407
[1, 300] loss: 0.365
[1, 400] loss: 0.322
[1, 500] loss: 0.310
[1, 600] loss: 0.263
[1, 700] loss: 0.246
[1, 800] loss: 0.225
[1, 900] loss: 0.222
[2, 100] loss: 0.197
[2, 200] loss: 0.186
[2, 300] loss: 0.165
[2, 400] loss: 0.170
[2, 500] loss: 0.159
[2, 600] loss: 0.158
[2, 700] loss: 0.165
[2, 800] loss: 0.150
[2, 900] loss: 0.130
[3, 100] loss: 0.122
[3, 200] loss: 0.121
[3, 300] loss: 0.127
[3, 400] loss: 0.125
[3, 500] loss: 0.115
[3, 600] loss: 0.122
[3, 700] loss: 0.107
[3, 800] loss: 0.105
[3, 900] loss: 0.104
[4, 100] loss: 0.095
[4, 200] loss: 0.093
[4, 300] loss: 0.095
[4, 400] loss: 0.089
[4, 500] loss: 0.090
[4, 600] loss: 0.083
[4, 700] loss: 0.096
[4, 800] loss: 0.085
[4, 900] loss: 0.085
[5, 100] loss: 0.074
[5, 200] loss: 0.077
[5, 300] loss: 0.073
[5, 400] loss: 0.076
[5, 500] loss: 0.067
[5, 600] loss: 0.076
[5, 700] loss: 0.068
[5, 800] loss: 0.078
[5, 900] loss: 0.080
Accuracy of the PyTorch network on the 10000 test image

  super().__init__(**kwargs)


Epoch 1/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 4s 3ms/step - accuracy: 0.8904 - loss: 0.3796 - val_accuracy: 0.9662 - val_loss: 0.1135
Epoch 2/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 3s 3ms/step - accuracy: 0.9721 - loss: 0.0931 - val_accuracy: 0.9731 - val_loss: 0.0878
Epoch 3/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 3s 3ms/step - accuracy: 0.9832 - loss: 0.0567 - val_accuracy: 0.9782 - val_loss: 0.0674
Epoch 4/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 3s 3ms/step - accuracy: 0.9873 - loss: 0.0403 - val_accuracy: 0.9786 - val_loss: 0.0685
Epoch 5/5
938/938 ━━━━━━━━━━━━━━━━━━━━ 3s 3ms/step - accuracy: 0.9919 - loss: 0.0263 - val_accuracy: 0.9779 - val_loss: 0.0715
313/313 ━━━━━━━━━━━━━━━━━━━━ 0s 925us/step - accuracy: 0.9741 - loss: 0.0833
Test accuracy of the Keras model: 0.9779000282287598
