# CD2_P1_FT

### Variable Paths, Execution Environments

In [1]:
# Identifier of this fine-tuning run; later cells reuse it when naming
# checkpoint files and the saved training-history JSON.
modelname = "CD2_P1_FT"

I use three local machines and two cloud compute platforms (Google Colab and Kaggle). The paths appropriate to each execution platform are declared here.

In [2]:
# Execution-environment switches. Set the flag for the platform this notebook
# is running on to 1 and leave the others at 0; the path-selection cell reads
# them to pick the matching dataset / saved-model / history directories.
Kaggle = 0
Colab = 0
Local = 1
LocalRM = 0
LocalOldLaptop = 0

# Kaggle Notebooks
Kaggle_Dataset = '/kaggle/input/catsdogsconv/KaggleCatsDogsConv'
Kaggle_SavedModels = '/kaggle/working/SavedModels'
Kaggle_TrainingHistory = '/kaggle/working/TrainingHistory'

# Google Drive (paths live under the /content/drive mount point)
GD_Dataset = '/content/drive/MyDrive/Datasets/KaggleCatsDogs'
GD_SavedModels = '/content/drive/MyDrive/NotebookWorkspace/SavedModels'
GD_TrainingHistory = '/content/drive/MyDrive/NotebookWorkspace/TrainingHistory'
# Backward-compatible alias: this constant was originally spelled with a
# "CD_" prefix, unlike its GD_* siblings. Kept so existing references resolve.
CD_TrainingHistory = GD_TrainingHistory

# Local Directories (Windows machine selected by `Local`)
Lc_Dataset = 'C:\\Programming_Files\\JupyterVSCode\\Binary_Classification_Transfer_Learning\\CatsDogs\\DatasetConv'
Lc_SavedModels = 'C:\\Programming_Files\\JupyterVSCode\\Binary_Classification_Transfer_Learning\\CatsDogs\\SavedModels'
Lc_TrainingHistory = 'C:\\Programming_Files\\JupyterVSCode\\Binary_Classification_Transfer_Learning\\CatsDogs\\Docs_Reports\\RawTrainingData'

# Local Directories (Windows machine selected by `LocalRM`)
Lc_RM_Dataset = "C:\\Users\\arisi\\Documents\\VSCode\\CatsDogs\\Dataset\\KaggleCatsDogsConv"
Lc_RM_SavedModels = "C:\\Users\\arisi\\Documents\\VSCode\\CatsDogs\\SavedModels"
Lc_RM_TrainingHistory = "C:\\Users\\arisi\\Documents\\VSCode\\CatsDogs\\Docs_Reports\\RawTrainingData"

# NOTE(review): 'Test' looks like a placeholder rather than a real path;
# replace these before enabling `LocalOldLaptop`.
Lc_Old_Dataset = 'Test'
Lc_Old_SavedModels = 'Test'
Lc_Old_TrainingHistory = 'Test'

In [3]:
# Resolve data_dir / SavedModelsPath / TrainingHistoryPath for the active
# execution environment.
#
# Exactly one platform flag must be set: with none set the three path
# variables would never be defined (NameError much later in the notebook),
# and with several set the result would silently depend on branch order.
_platform_flags = {
    'Kaggle': Kaggle,
    'Colab': Colab,
    'Local': Local,
    'LocalRM': LocalRM,
    'LocalOldLaptop': LocalOldLaptop,
}
_enabled = [flag for flag, is_on in _platform_flags.items() if is_on]
if len(_enabled) != 1:
    raise ValueError(
        "Set exactly one execution-environment flag to 1; "
        f"currently enabled: {_enabled or 'none'}"
    )

if Kaggle:
    data_dir = Kaggle_Dataset
    SavedModelsPath = Kaggle_SavedModels
    TrainingHistoryPath = Kaggle_TrainingHistory
elif Colab:
    # Imported here because google.colab is only importable on Colab; the
    # Drive mount must happen before the /content/drive paths are used.
    from google.colab import drive
    drive.mount('/content/drive')
    data_dir = GD_Dataset
    SavedModelsPath = GD_SavedModels
    TrainingHistoryPath = CD_TrainingHistory
elif Local:
    data_dir = Lc_Dataset
    SavedModelsPath = Lc_SavedModels
    TrainingHistoryPath = Lc_TrainingHistory
elif LocalRM:
    data_dir = Lc_RM_Dataset
    SavedModelsPath = Lc_RM_SavedModels
    TrainingHistoryPath = Lc_RM_TrainingHistory
elif LocalOldLaptop:
    data_dir = Lc_Old_Dataset
    SavedModelsPath = Lc_Old_SavedModels
    TrainingHistoryPath = Lc_Old_TrainingHistory

### Import Packages

In [4]:
import os

import tensorflow as tf
from tensorflow.keras import layers, models
from tensorflow.keras.applications import VGG16

### Load the Dataset

In [5]:
from tensorflow.keras.utils import image_dataset_from_directory

In [6]:
# Load Datasets
# Both splits are read from the same directory and share every option except
# `subset`. Using the same validation_split and seed for the two calls is what
# keeps the training and validation subsets from overlapping.
_split_options = dict(
    image_size=(224, 224),
    batch_size=32,
    label_mode='binary',
    validation_split=0.2,  # hold out 20% of the files for validation
    seed=123,
)

train_dataset = image_dataset_from_directory(
    data_dir, subset='training', **_split_options
)

val_dataset = image_dataset_from_directory(
    data_dir, subset='validation', **_split_options
)

Found 24997 files belonging to 2 classes.
Using 19998 files for training.
Found 24997 files belonging to 2 classes.
Using 4999 files for validation.


### Preprocessing & Augmentation

In [7]:
from tensorflow.keras.applications.vgg16 import preprocess_input

In [8]:
# Augmentation pipeline: random, label-preserving distortions that are applied
# to the training split only.
data_augmentation = tf.keras.Sequential()
data_augmentation.add(layers.RandomFlip('horizontal'))
# Factor 0.1 is a fraction of a full turn, i.e. rotations within +/-36 degrees.
data_augmentation.add(layers.RandomRotation(0.1))
# Zoom in or out by up to 10%.
data_augmentation.add(layers.RandomZoom(0.1))
# Shift by up to 10% of the image height and width.
data_augmentation.add(layers.RandomTranslation(0.1, 0.1))
# Brightness change with factor drawn from [-0.2, 0.2].
data_augmentation.add(layers.RandomBrightness(0.2))


def augment_img(image, label):
    """Return the batch with `data_augmentation` applied; the label is unchanged."""
    return data_augmentation(image), label


# Augment the training data (the validation split is left as loaded).
train_dataset = train_dataset.map(augment_img)

In [9]:
def preprocess_img(image, label):
    """Run the VGG16 `preprocess_input` on the image; pass the label through."""
    return preprocess_input(image), label


# Both splits must receive the same VGG16 input preprocessing.
val_dataset = val_dataset.map(preprocess_img)
train_dataset = train_dataset.map(preprocess_img)

### Load Model with Trained Head

In [10]:
# Checkpoint produced by the head-training phase (epoch 3, val_loss 0.0486).
# os.path.join picks the separator of the current OS, so the same cell works
# with the Windows local paths and the POSIX Kaggle/Colab paths; a literal
# "\\" would become part of the file name on Linux.
filepath = os.path.join(SavedModelsPath, 'CD2', 'CD2_P1_003_val0.0486.keras')
model = tf.keras.models.load_model(filepath)

### Unfreeze Last VGG Block & Verify

In [11]:
# Mark the last four *top-level* layers of the model as trainable.
# Per the listing this cell prints, those are the classifier-head layers that
# follow the nested `vgg16` sub-model, not layers inside the VGG16 base.
for head_layer in model.layers[-4:]:
    head_layer.trainable = True

# Report the trainable flag of every top-level layer.
for position, top_layer in enumerate(model.layers):
    status = f"Layer {position}: {top_layer.name}, Trainable: {top_layer.trainable}"
    print(status)

Layer 0: vgg16, Trainable: True
Layer 1: global_average_pooling2d, Trainable: True
Layer 2: dense, Trainable: True
Layer 3: dropout, Trainable: True
Layer 4: dense_1, Trainable: True


In [12]:
# Inside the nested VGG16 base (first top-level layer), leave only the three
# block-5 convolutions trainable and freeze every other sub-layer.
finetune_layer_names = ('block5_conv1', 'block5_conv2', 'block5_conv3')
for vgg_layer in model.layers[0].layers:
    vgg_layer.trainable = vgg_layer.name in finetune_layer_names

In [13]:
def print_model_layers(model, indent=0):
    """Print every layer of `model` with its class name and trainable flag.

    Any layer that itself exposes a `layers` attribute (e.g. a nested
    Functional or Sequential model) is expanded recursively, with its
    children indented two extra spaces.

    Args:
        model: Object exposing a `layers` iterable; each entry needs `name`
            and `trainable` attributes.
        indent: Number of leading spaces for this nesting level.
    """
    pad = " " * indent
    for sub in model.layers:
        kind = type(sub).__name__
        print(f"{pad}- {sub.name} ({kind}), Trainable: {sub.trainable}")
        # Descend into containers so nested sub-layers are listed too.
        if hasattr(sub, 'layers'):
            print_model_layers(sub, indent + 2)

# Verify the freeze/unfreeze result across the whole (nested) layer tree.
print_model_layers(model, indent=0)

# Show the optimizer configuration the model currently carries.
print(model.optimizer.get_config())

- vgg16 (Functional), Trainable: True
  - input_layer_1 (InputLayer), Trainable: False
  - block1_conv1 (Conv2D), Trainable: False
  - block1_conv2 (Conv2D), Trainable: False
  - block1_pool (MaxPooling2D), Trainable: False
  - block2_conv1 (Conv2D), Trainable: False
  - block2_conv2 (Conv2D), Trainable: False
  - block2_pool (MaxPooling2D), Trainable: False
  - block3_conv1 (Conv2D), Trainable: False
  - block3_conv2 (Conv2D), Trainable: False
  - block3_conv3 (Conv2D), Trainable: False
  - block3_pool (MaxPooling2D), Trainable: False
  - block4_conv1 (Conv2D), Trainable: False
  - block4_conv2 (Conv2D), Trainable: False
  - block4_conv3 (Conv2D), Trainable: False
  - block4_pool (MaxPooling2D), Trainable: False
  - block5_conv1 (Conv2D), Trainable: True
  - block5_conv2 (Conv2D), Trainable: True
  - block5_conv3 (Conv2D), Trainable: True
  - block5_pool (MaxPooling2D), Trainable: False
- global_average_pooling2d (GlobalAveragePooling2D), Trainable: True
- dense (Dense), Trainable: Tr

### Compile

In [14]:
name = f'{modelname}'
# Checkpoint file-name template. os.path.join uses the separator of the
# current OS, so the template is valid both for the Windows local paths and
# the POSIX Kaggle/Colab paths. The doubled braces leave literal
# "{epoch:03d}" / "{val_loss:.4f}" placeholders in the string for
# ModelCheckpoint to fill in when it saves.
checkpoint_path = os.path.join(
    SavedModelsPath, 'CD2', f"{name}_{{epoch:03d}}_val{{val_loss:.4f}}.keras"
)

from tensorflow.keras.callbacks import ModelCheckpoint

# Create the ModelCheckpoint callback
checkpoint_callback = ModelCheckpoint(
    filepath=checkpoint_path,
    save_freq='epoch',              # Save every epoch
    save_weights_only=False,        # Save the full model, not just weights
    save_best_only=False,           # Save every time, not just best
    monitor='val_loss',
    verbose=1,
)

from tensorflow.keras.callbacks import ReduceLROnPlateau
# Halve the learning rate when val_loss has not improved for 2 epochs.
lr_scheduler = ReduceLROnPlateau(monitor='val_loss', factor=0.5, patience=2, verbose=1)

In [15]:
from tensorflow.keras.optimizers import Adam

# Recompile so the trainable-flag changes made above take effect, using a
# fresh Adam optimizer with the learning rate chosen for fine-tuning.
optimizer = Adam(learning_rate=5*1e-5)

model.compile(
    loss='binary_crossentropy',
    optimizer=optimizer,
    metrics=['accuracy'],
)

### Train & Save Results

In [16]:
# First fine-tuning run: 4 epochs, validating after each one. A checkpoint is
# written every epoch and the learning rate is reduced when val_loss plateaus.
history = model.fit(
    x=train_dataset,
    validation_data=val_dataset,
    epochs=4,
    callbacks=[checkpoint_callback, lr_scheduler],
)

Epoch 1/4
[1m625/625[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 5s/step - accuracy: 0.9613 - loss: 0.1092
Epoch 1: saving model to C:\Programming_Files\JupyterVSCode\Binary_Classification_Transfer_Learning\CatsDogs\SavedModels\CD2\CD2_P1_FT_001_val0.0394.keras
[1m625/625[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3698s[0m 6s/step - accuracy: 0.9613 - loss: 0.1092 - val_accuracy: 0.9882 - val_loss: 0.0394 - learning_rate: 5.0000e-05
Epoch 2/4
[1m625/625[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 4s/step - accuracy: 0.9793 - loss: 0.0556
Epoch 2: saving model to C:\Programming_Files\JupyterVSCode\Binary_Classification_Transfer_Learning\CatsDogs\SavedModels\CD2\CD2_P1_FT_002_val0.0683.keras
[1m625/625[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3410s[0m 5s/step - accuracy: 0.9793 - loss: 0.0556 - val_accuracy: 0.9790 - val_loss: 0.0683 - learning_rate: 5.0000e-05
Epoch 3/4
[1m625/625[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 5s/step - accura

In [17]:
import json

name = f'{modelname}'
# Make sure the target directory exists (e.g. /kaggle/working/TrainingHistory
# is not created automatically) so the metrics of a long training run are not
# lost to a FileNotFoundError at write time.
os.makedirs(TrainingHistoryPath, exist_ok=True)
# os.path.join keeps the path valid on both Windows and POSIX platforms.
filepath = os.path.join(TrainingHistoryPath, f"{name}.json")
with open(filepath, 'w') as f:
    # history.history maps each metric name to its list of per-epoch values.
    json.dump(history.history, f)

### Continue Training (2)

In [None]:
# Continue training for 5 more epochs. `initial_epoch` resumes the epoch
# counter where the first run stopped; without it Keras restarts at epoch 1
# and the checkpoint callback would emit "<name>_001_..." files again, which
# cannot be told apart from the checkpoints of the first run.
completed_epochs = len(history.epoch)
history2 = model.fit(
    train_dataset,
    initial_epoch=completed_epochs,
    epochs=completed_epochs + 5,    # `epochs` is the final epoch index, not a count
    validation_data=val_dataset,
    callbacks=[checkpoint_callback, lr_scheduler]
)

In [None]:
import json

name = f'{modelname}_continue'
# Make sure the target directory exists so the metrics of the continued run
# are not lost to a FileNotFoundError at write time.
os.makedirs(TrainingHistoryPath, exist_ok=True)
# os.path.join keeps the path valid on both Windows and POSIX platforms.
filepath = os.path.join(TrainingHistoryPath, f"{name}.json")
with open(filepath, 'w') as f:
    # history2.history maps each metric name to its list of per-epoch values.
    json.dump(history2.history, f)