This notebook is an example of a simple CNN that is built, trained, and then used for inference.

AI assistance was used to help generate this code.

Note: Make sure that the `tensorflow` package is installed on your device.

In [118]:
# Lib imports
import os
import tensorflow as tf
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras import layers, models
import numpy as np

In [None]:
# DATASET DIRECTORY CONFIGURATION
# Using muffin_vs_chihuahua dataset. Both split directories below contain one
# sub-folder per class: 'chihuahua' and 'muffin'.

# Images used for fitting (and for the held-back validation subset).
train_dir = "muffin_vs_chihuahua/train"

# Images used only for the final evaluation.
test_dir = "muffin_vs_chihuahua/test"

In [120]:
# IMAGE PARAMETERS

# Every image is resized to this size when it is loaded; the same two numbers
# also define the spatial dimensions of the model's input layer.
IMG_SIZE = (128, 128)

# Number of images the generators yield per batch.
BATCH_SIZE = 32

In [121]:
# DATA PREPROCESSING & AUGMENTATION
# Augmentation is optional but recommended for image processing tasks,
# especially with limited data. It is applied to the TRAINING subset only:
# validation and test images are just rescaled, so their metrics describe
# unmodified images rather than randomly rotated/shifted/flipped ones.

# Fraction of train_dir held back for validation. Both generators that read
# train_dir must use the same value so the two subsets stay complementary.
VALIDATION_SPLIT = 0.2

train_datagen = ImageDataGenerator(
    rescale=1./255,
    rotation_range=15,
    width_shift_range=0.1,
    height_shift_range=0.1,
    horizontal_flip=True,
    validation_split=VALIDATION_SPLIT
)
# Same rescaling and same split fraction as train_datagen, but no random
# transforms. The training/validation partition is selected by `subset` and the
# split fraction, not by the augmentation settings.
val_datagen = ImageDataGenerator(
    rescale=1./255,
    validation_split=VALIDATION_SPLIT
)
test_datagen = ImageDataGenerator(rescale=1./255)

train_generator = train_datagen.flow_from_directory(
    train_dir,
    target_size=IMG_SIZE,
    batch_size=BATCH_SIZE,
    class_mode='binary',
    subset='training'
)
val_generator = val_datagen.flow_from_directory(
    train_dir,
    target_size=IMG_SIZE,
    batch_size=BATCH_SIZE,
    class_mode='binary',
    subset='validation'
)
# shuffle=False keeps the test batches in directory order, so predictions can
# be lined up with the generator's file list if needed.
test_generator = test_datagen.flow_from_directory(
    test_dir,
    target_size=IMG_SIZE,
    batch_size=BATCH_SIZE,
    class_mode='binary',
    shuffle=False
)

Found 1532 images belonging to 2 classes.
Found 383 images belonging to 2 classes.
Found 1915 images belonging to 2 classes.


In [122]:
# IMPROVED CNN MODEL ARCHITECTURE WITH REGULARIZATION AND DROPOUT

# Some modifications are applied
initial_learning_rate = 0.001

# We are combining ExponentialDecay with Adam optimizer for better learning rate management.
# decay_steps is counted in optimizer steps (one per batch). With staircase=True
# the rate only changes after a full decay_steps interval, so the interval must
# be shorter than the training run or the schedule never takes effect. Tying it
# to the number of batches per epoch multiplies the rate by 0.9 once per epoch.
steps_per_epoch = len(train_generator)
lr_schedule = tf.keras.optimizers.schedules.ExponentialDecay(
    initial_learning_rate,
    decay_steps=steps_per_epoch,
    decay_rate=0.9,
    staircase=True
)

# Create the optimizer with the learning rate schedule
optimizer = tf.keras.optimizers.Adam(learning_rate=lr_schedule)

# Applied dropout layers and L2 regularization to reduce overfitting
# L2 regularization helps prevent overfitting by penalizing large weights
L2_LAMBDA = 0.001

model = models.Sequential([
    # RGB images at the size produced by the data generators.
    layers.Input(shape=(IMG_SIZE[0], IMG_SIZE[1], 3)),

    # Conv block 1
    layers.Conv2D(32, (3, 3), activation='relu', kernel_regularizer=tf.keras.regularizers.l2(L2_LAMBDA)),
    layers.MaxPooling2D(2, 2),
    layers.Dropout(0.25),

    # Conv block 2
    layers.Conv2D(64, (3, 3), activation='relu', kernel_regularizer=tf.keras.regularizers.l2(L2_LAMBDA)),
    layers.MaxPooling2D(2, 2),
    layers.Dropout(0.25),

    # Conv block 3 (no dropout here; the next dropout follows the dense layer)
    layers.Conv2D(128, (3, 3), activation='relu', kernel_regularizer=tf.keras.regularizers.l2(L2_LAMBDA)),
    layers.MaxPooling2D(2, 2),

    # Classifier head: one hidden dense layer, then a single sigmoid unit
    # whose output is the score for class index 1.
    layers.Flatten(),
    layers.Dense(128, activation='relu', kernel_regularizer=tf.keras.regularizers.l2(L2_LAMBDA)),
    layers.Dropout(0.5),
    layers.Dense(1, activation='sigmoid')
])

In [123]:
# Configure the model optimizers, loss function, and metrics.
# Binary cross-entropy matches the network's single sigmoid output unit; the
# optimizer is the Adam instance built together with the learning-rate schedule.
model.compile(
    loss='binary_crossentropy',
    optimizer=optimizer,
    metrics=['accuracy'],
)

In [None]:
# TRAINING THE CNN
# Ten passes over the training batches; the validation subset is scored at the
# end of every epoch and the per-epoch metrics are kept in `history`.
history = model.fit(train_generator, validation_data=val_generator, epochs=10)

Epoch 1/10
[1m48/48[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m34s[0m 560ms/step - accuracy: 0.5242 - loss: 1.2870 - val_accuracy: 0.5509 - val_loss: 0.8229
Epoch 2/10
[1m48/48[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m49s[0m 1s/step - accuracy: 0.6725 - loss: 0.7807 - val_accuracy: 0.7546 - val_loss: 0.6754
Epoch 3/10
[1m48/48[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m23s[0m 478ms/step - accuracy: 0.7523 - loss: 0.6394 - val_accuracy: 0.7154 - val_loss: 0.5881
Epoch 4/10


In [None]:
# EVALUATE THE MODEL
# evaluate() yields the loss first, followed by the compiled metric (accuracy).
test_metrics = model.evaluate(test_generator, verbose=1)
test_loss, test_acc = test_metrics

# Emit the whole report with one call; each argument lands on its own line.
print(
    f"\n{'='*50}",
    f"IMPROVED MODEL - Test Accuracy: {test_acc:.4f} ({test_acc*100:.2f}%)",
    f"Test Loss: {test_loss:.4f}",
    f"{'='*50}",
    sep="\n",
)

[1m60/60[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m10s[0m 173ms/step - accuracy: 0.9441 - loss: 0.2503

IMPROVED MODEL - Test Accuracy: 0.8449 (84.49%)
Test Loss: 0.3849


In [None]:
# SAVE THE MODEL (optional - for comparison)
# Written in the native .keras format; predict_image() loads this same file
# name by default.
saved_model_path = 'muffin_vs_chihuahua_cnn_improved.keras'
model.save(saved_model_path)
print("Model saved as 'muffin_vs_chihuahua_cnn_improved.keras'")

Improved model saved as 'muffin_vs_chihuahua_cnn_improved.keras'


In [None]:
# INFERENCE SCRIPT FOR IMPROVED MODEL
from tensorflow.keras.preprocessing import image

# Load model once for efficiency. The path it was loaded from is remembered so
# that asking for a different model_path reloads instead of silently reusing
# whichever model happened to be cached first.
_loaded_model = None
_loaded_model_path = None

def predict_image(img_path, model_path='muffin_vs_chihuahua_cnn_improved.keras', img_size=IMG_SIZE):
    """Classify a single image file as chihuahua or muffin and print a report.

    Args:
        img_path: Path of the image file to classify.
        model_path: Saved Keras model to use. It is loaded on first use and
            cached; passing a different path replaces the cached model.
        img_size: Size the image is resized to before prediction. It must
            match the input size the model was built with.

    Returns:
        A ``(label, pred, confidence)`` tuple where ``pred`` is the raw
        sigmoid output of the model and ``confidence`` is the score of the
        predicted class (``pred`` for class 1, ``1 - pred`` for class 0).
    """
    global _loaded_model, _loaded_model_path
    if _loaded_model is None or _loaded_model_path != model_path:
        _loaded_model = tf.keras.models.load_model(model_path)
        _loaded_model_path = model_path

    # Same preprocessing as the data generators: resize, scale to [0, 1],
    # then add a leading batch axis because predict() works on batches.
    img = image.load_img(img_path, target_size=img_size)
    img_array = image.img_to_array(img) / 255.0
    img_array = np.expand_dims(img_array, axis=0)
    pred = _loaded_model.predict(img_array, verbose=0)[0, 0]

    # flow_from_directory numbers the class folders alphabetically, so
    # 'chihuahua' is class 0 and 'muffin' is class 1. The sigmoid output is the
    # score for class 1, which means a value >= 0.5 is a muffin.
    is_muffin = pred >= 0.5
    label = "Muffin" if is_muffin else "Chihuahua"
    confidence = pred if is_muffin else (1 - pred)

    print(f"Image: {img_path}")
    print(f"Prediction: {label}")
    print(f"Confidence: {confidence:.4f} ({confidence*100:.2f}%)")
    print(f"Raw prediction value: {pred:.4f}")
    print("-" * 50)
    return label, pred, confidence


In [None]:
# Classify the two sample images. predict_image() prints its own report for
# each call; because the second call is the cell's last expression, its
# returned (label, pred, confidence) tuple is also echoed as the cell output.
predict_image("run_1/run_1.jpg")
predict_image("run_1/run_2.jpg")

Image: run_1/run_1.jpg
Prediction: Paper
Confidence: 0.6779 (67.79%)
Raw prediction value: 0.3221
--------------------------------------------------
Image: run_1/run_2.jpg
Prediction: Paper
Confidence: 0.6507 (65.07%)
Raw prediction value: 0.3493
--------------------------------------------------


('Paper', np.float32(0.34932846), np.float32(0.65067154))

In [None]:
# IMPROVED CNN MODEL WITH REGULARIZATION AND DROPOUT


# Learning rate schedule
initial_learning_rate = 0.001
# decay_steps is counted in optimizer steps (one per batch). With staircase=True
# the rate only drops after a full decay_steps interval, so an interval longer
# than the whole training run would leave the rate at its initial value. Using
# the number of batches per epoch multiplies the rate by 0.9 once per epoch.
steps_per_epoch = len(train_generator)
lr_schedule = tf.keras.optimizers.schedules.ExponentialDecay(
    initial_learning_rate,
    decay_steps=steps_per_epoch,
    decay_rate=0.9,
    staircase=True
)

# Create the optimizer with the learning rate schedule.
# A fresh optimizer is built here rather than reusing one from another model.
optimizer = tf.keras.optimizers.Adam(learning_rate=lr_schedule)

# Improved model with dropout and L2 regularization
# L2 regularization (lambda=0.001) penalizes large weights to prevent overfitting
# Dropout layers randomly deactivate neurons during training to improve generalization
model_improved = models.Sequential([
    layers.Input(shape=(IMG_SIZE[0], IMG_SIZE[1], 3)),

    # Conv block 1
    layers.Conv2D(32, (3, 3), activation='relu', kernel_regularizer=tf.keras.regularizers.l2(0.001)),
    layers.MaxPooling2D(2, 2),
    layers.Dropout(0.25),

    # Conv block 2
    layers.Conv2D(64, (3, 3), activation='relu', kernel_regularizer=tf.keras.regularizers.l2(0.001)),
    layers.MaxPooling2D(2, 2),
    layers.Dropout(0.25),

    # Conv block 3 (not followed by dropout)
    layers.Conv2D(128, (3, 3), activation='relu', kernel_regularizer=tf.keras.regularizers.l2(0.001)),
    layers.MaxPooling2D(2, 2),

    # Classifier head; the sigmoid output layer carries no regularizer.
    layers.Flatten(),
    layers.Dense(128, activation='relu', kernel_regularizer=tf.keras.regularizers.l2(0.001)),
    layers.Dropout(0.5),
    layers.Dense(1, activation='sigmoid')
])

# Compile the improved model
model_improved.compile(optimizer=optimizer, loss='binary_crossentropy', metrics=['accuracy'])

# The summary below is worded to match the layer list above: the output layer
# is unregularized and only the first two conv blocks are followed by dropout.
print("Improved model architecture created with:")
print("- L2 regularization (lambda=0.001) on all Conv2D layers and the hidden Dense layer")
print("- Dropout layers: 0.25 after the first two conv blocks, 0.5 after the hidden dense layer")


Improved model architecture created with:
- L2 regularization (lambda=0.001) on all Conv2D and Dense layers
- Dropout layers: 0.25 after conv layers, 0.5 after dense layer


In [None]:
# TRAINING THE IMPROVED CNN MODEL
print("Training improved model with regularization and dropout...")

# Ten epochs on the training batches with a progress bar per epoch; the
# validation subset is scored after each epoch.
history_improved = model_improved.fit(
    train_generator,
    validation_data=val_generator,
    epochs=10,
    verbose=1,
)


Training improved model with regularization and dropout...
Epoch 1/10
[1m43/48[0m [32m━━━━━━━━━━━━━━━━━[0m[37m━━━[0m [1m2s[0m 504ms/step - accuracy: 0.4978 - loss: 1.4044

KeyboardInterrupt: 

In [None]:
# EVALUATE THE IMPROVED MODEL
print("EVALUATING IMPROVED MODEL")

# evaluate() yields the loss first, followed by the compiled metric (accuracy).
improved_metrics = model_improved.evaluate(test_generator, verbose=1)
test_loss_improved, test_acc_improved = improved_metrics

print(
    f"IMPROVED MODEL RESULTS:",
    f"Test Accuracy: {test_acc_improved:.4f} ({test_acc_improved*100:.2f}%)",
    f"Test Loss: {test_loss_improved:.4f}",
    sep="\n",
)

#2a: Accuracy
print(
    "2a) ACCURACY: ",
    f"The improved model achieves a test accuracy of {test_acc_improved:.4f} ({test_acc_improved*100:.2f}%)",
    sep="\n",
)

EVALUATING IMPROVED MODEL


[1m60/60[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m9s[0m 153ms/step - accuracy: 0.9277 - loss: 0.2681
IMPROVED MODEL RESULTS:
Test Accuracy: 0.7864 (78.64%)
Test Loss: 0.5251
2a) ACCURACY: 
The improved model achieves a test accuracy of 0.7864 (78.64%)


In [None]:
# SAVE THE IMPROVED MODEL
# The file name is kept exactly as-is because predict_image_improved() loads it
# by default. NOTE(review): the .h5 suffix selects Keras' legacy HDF5 format,
# unlike the .keras file saved for the first model; consider aligning the two.
improved_model_path = 'exercise_6_trained_model_improved.h5'
model_improved.save(improved_model_path)
print("Improved model saved as 'exercise_6_trained_model_improved.h5'")




Improved model saved as 'exercise_6_custom_lastname.grecia.h5'


In [None]:
# PREDICTIONS ON RUN 1 AND RUN 2 USING IMPROVED MODEL
from tensorflow.keras.preprocessing import image

# Load the improved model lazily and cache it. The path it came from is
# remembered so that a different model_path triggers a reload instead of
# silently reusing the cached model.
_loaded_model_improved = None
_loaded_model_improved_path = None

def predict_image_improved(img_path, model_path='exercise_6_trained_model_improved.h5', img_size=IMG_SIZE):
    """Classify a single image file as chihuahua or muffin with the improved model.

    Unlike a reporting helper, this function prints nothing; callers format
    the returned values themselves.

    Args:
        img_path: Path of the image file to classify.
        model_path: Saved Keras model to use. It is loaded on first use and
            cached; passing a different path replaces the cached model.
        img_size: Size the image is resized to before prediction. It must
            match the input size the model was built with.

    Returns:
        A ``(label, pred, confidence)`` tuple where ``pred`` is the raw
        sigmoid output of the model and ``confidence`` is the score of the
        predicted class (``pred`` for class 1, ``1 - pred`` for class 0).
    """
    global _loaded_model_improved, _loaded_model_improved_path
    if _loaded_model_improved is None or _loaded_model_improved_path != model_path:
        _loaded_model_improved = tf.keras.models.load_model(model_path)
        _loaded_model_improved_path = model_path

    # Same preprocessing as the data generators: resize, scale to [0, 1],
    # then add a leading batch axis because predict() works on batches.
    img = image.load_img(img_path, target_size=img_size)
    img_array = image.img_to_array(img) / 255.0
    img_array = np.expand_dims(img_array, axis=0)
    pred = _loaded_model_improved.predict(img_array, verbose=0)[0, 0]

    # Class 0=Chihuahua, Class 1=Muffin (alphabetical order of the folders).
    # The sigmoid output is the score for class 1, so >= 0.5 means Muffin.
    is_muffin = pred >= 0.5
    label = "Muffin" if is_muffin else "Chihuahua"
    confidence = pred if is_muffin else (1 - pred)
    return label, pred, confidence

print("IMPROVED MODEL PREDICTIONS ON RUN 1 AND RUN 2")

# --- Run 1: classify the first sample image and show the details ---
print("\nRun 1:")
run_1_result = predict_image_improved("run_1/run_1.jpg")
label1, pred1, conf1 = run_1_result
print(
    f"  Image: run_1/run_1.jpg",
    f"  Prediction: {label1}",
    f"  Confidence: {conf1:.4f} ({conf1*100:.2f}%)",
    f"  Raw prediction value: {pred1:.4f}",
    sep="\n",
)

# --- Run 2: same report for the second sample image ---
print("\nRun 2:")
run_2_result = predict_image_improved("run_1/run_2.jpg")
label2, pred2, conf2 = run_2_result
print(
    f"  Image: run_1/run_2.jpg",
    f"  Prediction: {label2}",
    f"  Confidence: {conf2:.4f} ({conf2*100:.2f}%)",
    f"  Raw prediction value: {pred2:.4f}",
    sep="\n",
)

# Condensed answer block for item 2b, reusing the values obtained above.
print(
    "2b): RUN 1 AND 2 PREDICTIONS",
    f"Run 1 Prediction: {label1}",
    f"Run 1 Confidence: {conf1:.4f} ({conf1*100:.2f}%)",
    f"\nRun 2 Prediction: {label2}",
    f"Run 2 Confidence: {conf2:.4f} ({conf2*100:.2f}%)",
    sep="\n",
)


IMPROVED MODEL PREDICTIONS ON RUN 1 AND RUN 2

Run 1:




  Image: run_1/run_1.jpg
  Prediction: Plastic
  Confidence: 0.8273 (82.73%)
  Raw prediction value: 0.8273

Run 2:
  Image: run_1/run_2.jpg
  Prediction: Plastic
  Confidence: 0.5565 (55.65%)
  Raw prediction value: 0.5565
2b): RUN 1 AND 2 PREDICTIONS
Run 1 Prediction: Plastic
Run 1 Confidence: 0.8273 (82.73%)

Run 2 Prediction: Plastic
Run 2 Confidence: 0.5565 (55.65%)
