# Asynchronous learning materials for week_6_CNNs


In [None]:
# Import necessary modules from TensorFlow for building and training a neural network
import tensorflow as tf
from tensorflow.keras import layers, models

# Fetch MNIST: 60,000 training and 10,000 test images of handwritten digits,
# each a 28x28 grayscale array, together with their integer class labels.
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()

# Rescale pixel values into the [0, 1] range so every input feature shares
# the same scale.
x_train = x_train / 255.0
x_test = x_test / 255.0

# Assemble a fully connected classifier, one layer at a time.
model = models.Sequential()
# Unroll each 28x28 image into a flat vector that the dense layers can consume.
model.add(layers.Flatten(input_shape=(28, 28)))
# Hidden layer: 128 units with ReLU activation.
model.add(layers.Dense(128, activation='relu'))
# Dropout (rate 0.2) zeroes a random fraction of the previous layer's outputs
# during training, which discourages overfitting.
model.add(layers.Dropout(0.2))
# Output layer: 10 units (one per digit) with softmax, so the outputs form a
# probability distribution over the classes.
model.add(layers.Dense(10, activation='softmax'))

# Labels stay as plain integers here, hence the *sparse* categorical
# cross-entropy loss; Adam handles the optimization and accuracy is tracked.
model.compile(
    optimizer='adam',
    loss='sparse_categorical_crossentropy',
    metrics=['accuracy'],
)

# Fit for 5 epochs (one epoch = one full pass over the training set).
model.fit(x_train, y_train, epochs=5)

# Measure loss and accuracy on the held-out test set to gauge generalization.
model.evaluate(x_test, y_test)


In [None]:
import tensorflow as tf
from tensorflow.keras import layers, models
from tensorflow.keras.datasets import mnist
from tensorflow.keras.utils import to_categorical

# Load the MNIST dataset, which includes 60,000 images for training and 10,000 images for testing.
# Each image is a 28x28 grayscale image of a handwritten digit.
(train_images, train_labels), (test_images, test_labels) = mnist.load_data()

# Preprocess the images: append the channel dimension (1 for grayscale) that Conv2D expects,
# cast to float32, and normalize the pixel values to be between 0 and 1.
# The leading -1 lets reshape infer the number of samples, so this keeps working
# if the arrays are subsampled instead of relying on hard-coded dataset sizes.
train_images = train_images.reshape((-1, 28, 28, 1)).astype('float32') / 255
test_images = test_images.reshape((-1, 28, 28, 1)).astype('float32') / 255

# Convert the integer labels to one-hot vectors, as required by categorical cross-entropy loss.
# num_classes is pinned to 10 so the encoding width always matches the 10-unit output layer,
# rather than being inferred from the largest label that happens to be present.
train_labels = to_categorical(train_labels, num_classes=10)
test_labels = to_categorical(test_labels, num_classes=10)

# Build a convolutional neural network (CNN) model using the Sequential API.
model = models.Sequential()

# First convolutional layer: 32 filters of size 3x3 with ReLU activation.
# The input shape (28, 28, 1) matches the preprocessed images.
model.add(layers.Conv2D(32, (3, 3), activation='relu', input_shape=(28, 28, 1)))

# 2x2 max pooling to downsample the feature maps.
model.add(layers.MaxPooling2D((2, 2)))

# Second convolutional layer: 64 filters of size 3x3 with ReLU activation.
model.add(layers.Conv2D(64, (3, 3), activation='relu'))

# Another 2x2 max pooling to further downsample the feature maps.
model.add(layers.MaxPooling2D((2, 2)))

# Third convolutional layer: 64 filters of size 3x3 with ReLU activation.
model.add(layers.Conv2D(64, (3, 3), activation='relu'))

# Flatten the convolutional feature maps to prepare them for the dense layers.
model.add(layers.Flatten())

# Dense layer with 64 units and ReLU activation.
model.add(layers.Dense(64, activation='relu'))

# Final dense layer with 10 units (one for each digit class) and softmax activation for output.
model.add(layers.Dense(10, activation='softmax'))

# Compile the model with the Adam optimizer and categorical cross-entropy loss
# (the labels are one-hot encoded). Accuracy is tracked during training and testing.
model.compile(optimizer='adam',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

# Train the model on the training data for 5 epochs with a batch size of 64.
# 10% of the training data is held out for validation.
model.fit(train_images, train_labels, epochs=5, batch_size=64, validation_split=0.1)

# Evaluate the model on the test data.
test_loss, test_acc = model.evaluate(test_images, test_labels)

# Print the test accuracy.
print(f'Test accuracy: {test_acc}')
