<a href="https://colab.research.google.com/github/DesTuu/LearningDeepLearning/blob/main/first.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
# Import necessary libraries
import torch  # PyTorch main library for deep learning
import torch.nn as nn  # Neural network module
import torch.optim as optim  # Optimization algorithms
import torch.nn.functional as F  # Functional operations (like activation functions)
from torchvision import datasets, transforms  # Utilities for loading datasets and applying transformations
from torch.utils.data import DataLoader  # Helps load data in batches efficiently

# Define a simple neural network
class SimpleNN(nn.Module):  # The neural network inherits from nn.Module (PyTorch's base class for models)
    def __init__(self):  # Constructor for initializing layers
        super(SimpleNN, self).__init__()  # Calls the parent class constructor
        self.fc1 = nn.Linear(28*28, 128)  # Fully connected layer: input 28*28 pixels, output 128 neurons
        self.fc2 = nn.Linear(128, 10)  # Fully connected layer: input 128 neurons, output 10 (for 10 digit classes)

    def forward(self, x):  # Defines how data flows through the network
        x = x.view(-1, 28*28)  # Reshapes 2D images (28x28) into a 1D vector (28*28 = 784)
        x = F.relu(self.fc1(x))  # First layer with ReLU activation
        x = self.fc2(x)  # Second layer (logits, no activation as CrossEntropyLoss handles it)
        return x  # Output is the raw scores (logits) for each class

# Load MNIST dataset (handwritten digits)
transform = transforms.Compose([
    transforms.ToTensor(),  # Convert images to tensors (PyTorch format)
    transforms.Normalize((0.5,), (0.5,))  # Normalize images (mean=0.5, std=0.5) to improve training
])

# Download and load the training data
train_data = datasets.MNIST(root='./data', train=True, transform=transform, download=True)
train_loader = DataLoader(train_data, batch_size=32, shuffle=True)  # Load data in batches of 32

# Initialize model, loss function, and optimizer
model = SimpleNN()  # Create an instance of our neural network
criterion = nn.CrossEntropyLoss()  # Loss function for classification (logits + softmax)
optimizer = optim.Adam(model.parameters(), lr=0.001)  # Adam optimizer with a learning rate of 0.001

# Training loop
num_epochs = 5  # Number of times the entire dataset will be passed through the model

for epoch in range(num_epochs):  # Loop through each epoch
    for images, labels in train_loader:  # Loop through mini-batches
        optimizer.zero_grad()  # Reset gradients to avoid accumulation
        outputs = model(images)  # Forward pass: get predictions
        loss = criterion(outputs, labels)  # Compute loss (how far predictions are from actual labels)
        loss.backward()  # Compute gradients using backpropagation
        optimizer.step()  # Update model parameters based on gradients

    print(f"Epoch [{epoch+1}/{num_epochs}], Loss: {loss.item():.4f}")  # Print loss for monitoring

print("Training complete!")  # Print message after training


Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz
Failed to download (trying next):
<urlopen error [Errno 111] Connection refused>

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-images-idx3-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-images-idx3-ubyte.gz to ./data/MNIST/raw/train-images-idx3-ubyte.gz


100%|██████████| 9.91M/9.91M [00:00<00:00, 52.1MB/s]


Extracting ./data/MNIST/raw/train-images-idx3-ubyte.gz to ./data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/train-labels-idx1-ubyte.gz
Failed to download (trying next):
<urlopen error [Errno 111] Connection refused>

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-labels-idx1-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-labels-idx1-ubyte.gz to ./data/MNIST/raw/train-labels-idx1-ubyte.gz


100%|██████████| 28.9k/28.9k [00:00<00:00, 1.92MB/s]


Extracting ./data/MNIST/raw/train-labels-idx1-ubyte.gz to ./data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-images-idx3-ubyte.gz
Failed to download (trying next):
<urlopen error [Errno 111] Connection refused>

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-images-idx3-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-images-idx3-ubyte.gz to ./data/MNIST/raw/t10k-images-idx3-ubyte.gz


100%|██████████| 1.65M/1.65M [00:00<00:00, 14.5MB/s]


Extracting ./data/MNIST/raw/t10k-images-idx3-ubyte.gz to ./data/MNIST/raw

Downloading http://yann.lecun.com/exdb/mnist/t10k-labels-idx1-ubyte.gz
Failed to download (trying next):
<urlopen error [Errno 111] Connection refused>

Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-labels-idx1-ubyte.gz
Downloading https://ossci-datasets.s3.amazonaws.com/mnist/t10k-labels-idx1-ubyte.gz to ./data/MNIST/raw/t10k-labels-idx1-ubyte.gz


100%|██████████| 4.54k/4.54k [00:00<00:00, 3.91MB/s]


Extracting ./data/MNIST/raw/t10k-labels-idx1-ubyte.gz to ./data/MNIST/raw

Epoch [1/5], Loss: 0.1393
Epoch [2/5], Loss: 0.1027
Epoch [3/5], Loss: 0.1386
Epoch [4/5], Loss: 0.0227
Epoch [5/5], Loss: 0.0139
Training complete!
