In [1]:
import tensorflow as tf
for device in tf.config.list_physical_devices():
    print(": {}".format(device.name))

: /physical_device:CPU:0
: /physical_device:GPU:0


In [2]:
# Import all necessary libraries
import os
import logging
import warnings
import numpy as np
import matplotlib.pyplot as plt

# Suppress warnings and logs
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2'
tf.get_logger().setLevel(logging.ERROR)
warnings.filterwarnings('ignore', category=DeprecationWarning)
warnings.filterwarnings('ignore', category=UserWarning)

# Set seeds for reproducibility
SEED = 42
np.random.seed(SEED)
tf.random.set_seed(SEED)

# Define constants
IMAGE_SIZE = (224, 224)  # Directly using ResNet50 input size
BATCH_SIZE = 64
TRAINING_DATA_PATH = "Final_Arabic_Alpha_dataset/train"
TEST_DATA_PATH = "Final_Arabic_Alpha_dataset/test"

# Load datasets
print("Loading datasets...")
train_ds = tf.keras.utils.image_dataset_from_directory(
    TRAINING_DATA_PATH,
    validation_split=0.1,
    subset="training",
    seed=SEED,
    image_size=IMAGE_SIZE,
    batch_size=BATCH_SIZE,
    color_mode='rgb',
    label_mode='int'
)

val_ds = tf.keras.utils.image_dataset_from_directory(
    TRAINING_DATA_PATH,
    validation_split=0.1,
    subset="validation",
    seed=SEED,
    image_size=IMAGE_SIZE,
    batch_size=BATCH_SIZE,
    color_mode='rgb',
    label_mode='int'
)

test_ds = tf.keras.utils.image_dataset_from_directory(
    TEST_DATA_PATH,
    image_size=IMAGE_SIZE,
    batch_size=BATCH_SIZE,
    color_mode='rgb',
    label_mode=None,
    shuffle=False
)

# Get class names
class_names = train_ds.class_names
print(f"Class names: {class_names}")


AUTOTUNE = tf.data.AUTOTUNE

train_ds = train_ds.prefetch(buffer_size=AUTOTUNE)
val_ds = val_ds.prefetch(buffer_size=AUTOTUNE)
test_ds = test_ds.prefetch(buffer_size=AUTOTUNE)

Loading datasets...
Found 42559 files belonging to 65 classes.
Using 38304 files for training.
Found 42559 files belonging to 65 classes.
Using 4255 files for validation.
Found 10640 files belonging to 1 classes.
Class names: ['0', '1', '10', '11', '12', '13', '14', '15', '16', '17', '18', '19', '2', '20', '21', '22', '23', '24', '25', '26', '27', '28', '29', '3', '30', '31', '32', '33', '34', '35', '36', '37', '38', '39', '4', '40', '41', '42', '43', '44', '45', '46', '47', '48', '49', '5', '50', '51', '52', '53', '54', '55', '56', '57', '58', '59', '6', '60', '61', '62', '63', '64', '7', '8', '9']


In [3]:
# Data augmentation and preprocessing
print("Creating preprocessing pipeline...")
# data_augmentation = tf.keras.Sequential([
#     tf.keras.layers.RandomRotation(0.2, seed=SEED),
#     tf.keras.layers.RandomZoom(0.1, seed=SEED),
# ])

resnet_preprocess = tf.keras.applications.resnet50.preprocess_input

# Build model
print("Building model...")
base_model = tf.keras.applications.ResNet50(
    weights='imagenet',
    include_top=False,
    input_shape=(*IMAGE_SIZE, 3)
)

inputs = tf.keras.Input(shape=(*IMAGE_SIZE, 3))
# x = data_augmentation(inputs)
x = inputs
x = resnet_preprocess(x)
x = base_model(x)
x = tf.keras.layers.GlobalAveragePooling2D()(x)
x = tf.keras.layers.Dense(256, activation='relu')(x)
outputs = tf.keras.layers.Dense(len(class_names), activation='softmax')(x)

model = tf.keras.Model(inputs, outputs)

# Freeze base model initially
base_model.trainable = False

# Compile model
model.compile(
    optimizer=tf.keras.optimizers.Adam(learning_rate=1e-3),
    loss=tf.keras.losses.SparseCategoricalCrossentropy(),
    metrics=['accuracy']
)

model.summary()

Creating preprocessing pipeline...
Building model...
Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_2 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 tf.__operators__.getitem (S  (None, 224, 224, 3)      0         
 licingOpLambda)                                                 
                                                                 
 tf.nn.bias_add (TFOpLambda)  (None, 224, 224, 3)      0         
                                                                 
 resnet50 (Functional)       (None, 7, 7, 2048)        23587712  
                                                                 
 global_average_pooling2d (G  (None, 2048)             0         
 lobalAveragePooling2D)                                          
                                                                 
 dense (

In [4]:
# Callbacks
callbacks = [
    tf.keras.callbacks.ReduceLROnPlateau(
        monitor='val_loss',
        factor=0.2,
        patience=2,
        min_lr=1e-7
    )
]

EPOCHS = 5

# Train model
print("Training model...")
history = model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=EPOCHS,
    callbacks=callbacks
)

Training model...
Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


In [5]:
# # Unfreeze some layers of the base model
# fine_tune_at = 150  # Unfreeze from this layer onwards

# base_model.trainable = True
# for layer in base_model.layers[:fine_tune_at]:
#     layer.trainable = False

model.optimizer.learning_rate.assign(1e-5)

<tf.Variable 'UnreadVariable' shape=() dtype=float32, numpy=1e-05>

In [6]:
# Train the model again with fine-tuning
fine_tune_epochs = 10  # Fine-tune for 10 more epochs
total_epochs = EPOCHS + fine_tune_epochs  # Add to previous epochs

history_fine = model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=total_epochs,
    initial_epoch=history.epoch[-1],  # Resume from where we left off
    callbacks=callbacks
)

Epoch 5/15


Epoch 6/15
Epoch 7/15
Epoch 8/15
Epoch 9/15
Epoch 10/15
Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


In [3]:
# Load the model
loaded_model = tf.keras.models.load_model("arabic_letter_classifier_95_87")
loaded_model.summary()

Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_2 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 tf.__operators__.getitem (S  (None, 224, 224, 3)      0         
 licingOpLambda)                                                 
                                                                 
 tf.nn.bias_add (TFOpLambda)  (None, 224, 224, 3)      0         
                                                                 
 resnet50 (Functional)       (None, 7, 7, 2048)        23587712  
                                                                 
 global_average_pooling2d (G  (None, 2048)             0         
 lobalAveragePooling2D)                                          
                                                                 
 dense (Dense)               (None, 256)               524544

In [None]:
loss, accuracy = loaded_model.evaluate(train_ds)
val_loss, val_accuracy = loaded_model.evaluate(val_ds)

print(f"Training loss: {loss}, Training Accuracy: {accuracy}")
print(f"Val loss: {val_loss}, Val Accuracy: {val_accuracy}")

Training loss: 0.1766589730978012, Training Accuracy: 0.9521459937095642
Val loss: 0.40367570519447327, Val Accuracy: 0.87144535779953


In [5]:
base_model = loaded_model.get_layer("resnet50")

# Unfreeze some layers of the base model
fine_tune_at = 100  # Unfreeze from this layer onwards

base_model.trainable = True
for layer in base_model.layers[:fine_tune_at]:
    layer.trainable = False

loaded_model.compile(
    optimizer=tf.keras.optimizers.Adam(learning_rate=1e-6),
    loss=tf.keras.losses.SparseCategoricalCrossentropy(),
    metrics=['accuracy']
)

loaded_model.summary()

Model: "model"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 input_2 (InputLayer)        [(None, 224, 224, 3)]     0         
                                                                 
 tf.__operators__.getitem (S  (None, 224, 224, 3)      0         
 licingOpLambda)                                                 
                                                                 
 tf.nn.bias_add (TFOpLambda)  (None, 224, 224, 3)      0         
                                                                 
 resnet50 (Functional)       (None, 7, 7, 2048)        23587712  
                                                                 
 global_average_pooling2d (G  (None, 2048)             0         
 lobalAveragePooling2D)                                          
                                                                 
 dense (Dense)               (None, 256)               524544

In [6]:
# Callbacks
callbacks = [
    tf.keras.callbacks.ReduceLROnPlateau(
        monitor='val_loss',
        factor=0.2,
        patience=2,
        min_lr=1e-7
    )
]


# Train the model again with fine-tuning
fine_tune_epochs = 5  # Fine-tune for 10 more epochs
# total_epochs_final = EPOCHS + total_epochs  # Add to previous epochs

history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs,
    callbacks=callbacks
)

Epoch 1/5
Epoch 2/5
Epoch 3/5
Epoch 4/5
Epoch 5/5


In [7]:
history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs+5,
    initial_epoch=5,
    callbacks=callbacks
)

Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10


In [9]:
for layer in loaded_model.layers:
    if layer.name == "dense":
        layer.kernel_regularizer = tf.keras.regularizers.l2(1e-3)

history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs+5+5,
    initial_epoch=10,
    callbacks=callbacks
)

Epoch 11/15
Epoch 12/15
Epoch 13/15
Epoch 14/15
Epoch 15/15


In [10]:
for layer in loaded_model.layers:
    if layer.name == "dense":
        layer.kernel_regularizer = tf.keras.regularizers.l2(1e-1)

history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs+5+5+5,
    initial_epoch=15,
    callbacks=callbacks
)

Epoch 16/20
Epoch 17/20
Epoch 18/20
Epoch 19/20
Epoch 20/20


In [11]:
for layer in loaded_model.layers:
    if hasattr(layer, "kernel_regularizer"):
        layer.kernel_regularizer = tf.keras.regularizers.l2(1)

history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs+5+5+5+5,
    initial_epoch=20,
    callbacks=callbacks
)

Epoch 21/25
Epoch 22/25
Epoch 23/25
Epoch 24/25
Epoch 25/25


In [12]:
for layer in loaded_model.layers:
    if hasattr(layer, "kernel_regularizer"):
        layer.kernel_regularizer = tf.keras.regularizers.l2(2)

history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs+5+5+5+5+5,
    initial_epoch=25,
    callbacks=callbacks
)

Epoch 26/30
Epoch 27/30
Epoch 28/30
Epoch 29/30
Epoch 30/30


In [15]:
history_fine_final = loaded_model.fit(
    train_ds,
    validation_data=val_ds,
    epochs=fine_tune_epochs+5+5+5+5+5+5,
    initial_epoch=30,
    callbacks=callbacks
)

Epoch 31/35
Epoch 32/35
Epoch 33/35
Epoch 34/35
Epoch 35/35


In [16]:
loaded_model.save('arabic_letter_classifier_100_90')

