In [None]:
# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python
# For example, here are several helpful packages to load

import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

# Input data files are available in the read-only "../input/" directory
# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory

import os
# Walk the Kaggle input directory and print the full path of every file found.
for root, _, names in os.walk('/kaggle/input'):
    for path in (os.path.join(root, name) for name in names):
        print(path)

# You can write up to 20GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using "Save & Run All" 
# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session

In [1]:
import os
# Runtime configuration exported through environment variables. These are set
# in a cell that runs before the cell importing TensorFlow/Keras.
#   KERAS_BACKEND                  - backend name read by Keras ("jax" here)
#   XLA_PYTHON_CLIENT_MEM_FRACTION - JAX/XLA GPU memory fraction setting
#   TF_GPU_ALLOCATOR               - TensorFlow GPU allocator selection
os.environ.update({
    "KERAS_BACKEND": "jax",
    "XLA_PYTHON_CLIENT_MEM_FRACTION": "1.00",
    "TF_GPU_ALLOCATOR": "cuda_malloc_async",
})

In [2]:
import tensorflow as tf
def swish(x):
    """Return ``x * sigmoid(x)`` (the swish activation) computed with TensorFlow ops.

    Args:
        x: Any value accepted by ``tf.nn.sigmoid`` and multiplication
            (presumably a float tensor or array -- not established here).

    Returns:
        The product of ``x`` and ``tf.nn.sigmoid(x)``.

    NOTE(review): no cell visible here calls this helper; the model head uses
    the built-in ``'swish'`` activation string instead.
    """
    gate = tf.nn.sigmoid(x)
    return x * gate

In [3]:
from tensorflow.keras import layers,models
from tensorflow.keras.callbacks import EarlyStopping,CSVLogger,ModelCheckpoint
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.applications.convnext import ConvNeXtLarge

In [4]:
# Load CIFAR-100 (downloaded on first use) as separate train and test splits.
cifar100 = tf.keras.datasets.cifar100
(x_train, y_train), (x_test, y_test) = cifar100.load_data()

Downloading data from https://www.cs.toronto.edu/~kriz/cifar-100-python.tar.gz
[1m169001437/169001437[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m4s[0m 0us/step


In [5]:
# Resize both image sets to 64x64 (the input size the backbone is built with)
# and convert the resulting tensors back to NumPy arrays.
x_train = tf.image.resize(x_train, size=(64, 64)).numpy()
x_test = tf.image.resize(x_test, size=(64, 64)).numpy()

In [6]:
# Run both image sets through the ConvNeXt preprocessing hook.
# NOTE(review): the Keras docs describe this function as a pass-through for
# ConvNeXt (normalisation lives inside the model) -- confirm for the installed
# version before relying on it to change pixel values.
convnext_preprocess = tf.keras.applications.convnext.preprocess_input
x_train = convnext_preprocess(x_train)
x_test = convnext_preprocess(x_test)

In [7]:
from sklearn.model_selection import train_test_split
# Hold out 25% of the training data for validation, stratified on the labels,
# with a fixed seed. This rebinds x_train/y_train to the remaining 75%, so
# re-running the cell splits the already-reduced training set again.
x_train, x_val, y_train, y_val = train_test_split(
    x_train,
    y_train,
    test_size=0.25,
    stratify=y_train,
    random_state=42,
)

In [8]:
# Augmentation settings for the training generator: random rotation, shifts,
# shear, zoom and horizontal flips; out-of-frame pixels use 'nearest' fill.
augmentation_options = dict(
    rotation_range=20,
    width_shift_range=0.2,
    height_shift_range=0.2,
    shear_range=0.2,
    zoom_range=0.2,
    horizontal_flip=True,
    fill_mode='nearest',
)
datagen = ImageDataGenerator(**augmentation_options)

In [9]:
# ConvNeXt-Large backbone with ImageNet weights and no classification top,
# built for 64x64 RGB inputs (matching the resized images).
base_model_large = ConvNeXtLarge(
    weights='imagenet',
    include_top=False,
    input_shape=(64, 64, 3),
)

Downloading data from https://storage.googleapis.com/tensorflow/keras-applications/convnext/convnext_large_notop.h5
[1m785596384/785596384[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m3s[0m 0us/step


In [10]:
# Freeze the backbone so the first training stage only updates the new head.
base_model_large.trainable = False

In [11]:
# Classification head stacked on the backbone:
#   global average pooling
#   -> three (Dense/swish -> BatchNorm -> Dropout) stages of shrinking width
#   -> 100-way softmax output.
head_spec = ((1024, 0.5), (512, 0.4), (256, 0.3))  # (units, dropout rate)
hidden_stack = [
    layer
    for units, drop_rate in head_spec
    for layer in (
        layers.Dense(units, activation='swish'),
        layers.BatchNormalization(),
        layers.Dropout(drop_rate),
    )
]
model = models.Sequential([
    base_model_large,
    layers.GlobalAveragePooling2D(),
    *hidden_stack,
    layers.Dense(100, activation='softmax'),
])
model.summary()

In [12]:
# Compile for the head-training stage: Adam at 1e-4, sparse categorical
# cross-entropy (labels are passed as integer class ids), JIT compilation on.
head_optimizer = Adam(learning_rate=1e-4)
model.compile(
    optimizer=head_optimizer,
    loss='sparse_categorical_crossentropy',
    metrics=["accuracy"],
    jit_compile=True,
)

In [13]:
# Stop when val_loss has not improved for 5 epochs and roll the model back to
# the best weights seen.
early_stopper = EarlyStopping(
    monitor="val_loss",
    patience=5,
    restore_best_weights=True,
)

In [14]:
# Checkpoint callback that keeps only the best model by val_accuracy.
# NOTE(review): none of the fit() calls visible in this notebook pass this
# callback, so 'best_model.keras' is never written as the code stands.
checkpoint = ModelCheckpoint(
    'best_model.keras',
    monitor='val_accuracy',
    save_best_only=True,
)

In [15]:
# Per-epoch metrics log; append=True adds to an existing file instead of
# overwriting it.
csv_logger = CSVLogger(
    'training_log.csv',
    append=True,
)

In [16]:
import time
# Wall-clock timestamp taken right before head training starts.
start_time = time.time()

In [17]:
# Stage 1: train only the classification head (the backbone is frozen).
# - The batch size is set on the generator: Keras documents that `batch_size`
#   should not be passed to fit() when the input is a generator/PyDataset,
#   because the generator already yields batches.
# - `validation_data` is passed as the documented (x, y) tuple.
# - `csv_logger` (created with append=True) is attached so this stage is logged
#   to the same CSV that the fine-tuning stage writes to.
history = model.fit(
    datagen.flow(x_train, y_train, batch_size=32),
    validation_data=(x_val, y_val),
    epochs=20,
    callbacks=[early_stopper, csv_logger],
    verbose=1,
)

  self._warn_if_super_not_called()


Epoch 1/20
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m125s[0m 102ms/step - accuracy: 0.0987 - loss: 4.5359 - val_accuracy: 0.5809 - val_loss: 1.7647
Epoch 2/20
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m102s[0m 84ms/step - accuracy: 0.3475 - loss: 2.7602 - val_accuracy: 0.6433 - val_loss: 1.4109
Epoch 3/20
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m99s[0m 85ms/step - accuracy: 0.4217 - loss: 2.3104 - val_accuracy: 0.6708 - val_loss: 1.2586
Epoch 4/20
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m99s[0m 85ms/step - accuracy: 0.4690 - loss: 2.0678 - val_accuracy: 0.6890 - val_loss: 1.1628
Epoch 5/20
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m99s[0m 84ms/step - accuracy: 0.4969 - loss: 1.9211 - val_accuracy: 0.6998 - val_loss: 1.1057
Epoch 6/20
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m99s[0m 84ms/step - accuracy: 0.5178 - loss: 1.8208 - val_accuracy: 0.7122 - val_loss: 1.0574
E

In [18]:
# Seconds elapsed since start_time was recorded (duration of head training).
head_training_end = time.time()
head_training_time = head_training_end - start_time

In [19]:
# Unfreeze the backbone so the fine-tuning stage updates all of its weights.
base_model_large.trainable = True

In [20]:
# Recompile after changing `trainable`, using a 10x smaller learning rate
# (1e-5) than the head-training stage for fine-tuning.
fine_tune_optimizer = Adam(learning_rate=1e-5)
model.compile(
    optimizer=fine_tune_optimizer,
    loss='sparse_categorical_crossentropy',
    metrics=['accuracy'],
    jit_compile=True,
)

In [21]:
# Wall-clock timestamp taken right before fine-tuning starts.
start_fine_tune = time.time()

In [22]:
# Stage 2: fine-tune the whole network on augmented batches of 32 for up to
# 10 epochs, with early stopping and CSV logging.
augmented_batches = datagen.flow(x_train, y_train, batch_size=32)
fine_tune_callbacks = [early_stopper, csv_logger]
fine_tune_history = model.fit(
    augmented_batches,
    epochs=10,
    validation_data=(x_val, y_val),
    callbacks=fine_tune_callbacks,
    verbose=1,
)

  self._warn_if_super_not_called()


Epoch 1/10
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m287s[0m 225ms/step - accuracy: 0.7320 - loss: 0.9443 - val_accuracy: 0.8553 - val_loss: 0.5021
Epoch 2/10
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m226s[0m 181ms/step - accuracy: 0.8208 - loss: 0.6333 - val_accuracy: 0.8670 - val_loss: 0.4502
Epoch 3/10
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m211s[0m 180ms/step - accuracy: 0.8519 - loss: 0.5178 - val_accuracy: 0.8765 - val_loss: 0.4245
Epoch 4/10
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m212s[0m 181ms/step - accuracy: 0.8727 - loss: 0.4411 - val_accuracy: 0.8841 - val_loss: 0.4048
Epoch 5/10
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m211s[0m 180ms/step - accuracy: 0.8955 - loss: 0.3741 - val_accuracy: 0.8885 - val_loss: 0.3931
Epoch 6/10
[1m1172/1172[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m212s[0m 181ms/step - accuracy: 0.9071 - loss: 0.3255 - val_accuracy: 0.8904 - val_loss:

In [23]:
# Seconds elapsed since start_fine_tune was recorded (duration of fine-tuning).
fine_tune_end = time.time()
fine_tune_time = fine_tune_end - start_fine_tune

In [24]:
import numpy as np
# Predict on the test images and take the index of the highest score in each
# row as the predicted class.
# Presumably y_pred has one column per class (the final Dense has 100 units).
y_pred = model.predict(x_test)
y_pred_class = np.argmax(y_pred, axis=-1)

[1m313/313[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m17s[0m 47ms/step


In [25]:
# Evaluate on the held-out test set; evaluate() yields loss followed by the
# compiled accuracy metric. Then report accuracy and combined training time.
test_metrics = model.evaluate(x_test, y_test, verbose=1)
test_loss, test_accuracy = test_metrics
print(f"\nTest Accuracy: {test_accuracy * 100:.2f}%")
print(f"Total training time: {head_training_time + fine_tune_time:.2f} seconds")

[1m313/313[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m16s[0m 46ms/step - accuracy: 0.8903 - loss: 0.4019

Test Accuracy: 89.07%
Total training time: 4222.41 seconds


In [26]:
# Evaluate on the validation split and report its accuracy as a percentage.
val_metrics = model.evaluate(x_val, y_val)
val_loss, val_accuracy = val_metrics
print(f"Validation accuracy: {val_accuracy * 100:.4f}%")

[1m391/391[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m14s[0m 36ms/step - accuracy: 0.8932 - loss: 0.3800
Validation accuracy: 89.1120%


In [27]:
from sklearn.metrics import precision_score,recall_score,f1_score,accuracy_score,classification_report


# Test-set metrics from scikit-learn. Precision, recall and F1 all use
# 'weighted' averaging across classes.
accuracy = accuracy_score(y_test, y_pred_class)
precision, recall, f1 = (
    scorer(y_test, y_pred_class, average='weighted')
    for scorer in (precision_score, recall_score, f1_score)
)

# Report each metric to four decimal places.
print("\nPerformance Metrics Breakdown for ConvNext Large:")
print(f"Accuracy: {accuracy:.4f}")
print(f"Precision: {precision:.4f}")
print(f"Recall: {recall:.4f}")
print(f"F1-Score: {f1:.4f}")


Performance Metrics Breakdown for ConvNext Large:
Accuracy: 0.8907
Precision: 0.8929
Recall: 0.8907
F1-Score: 0.8908


In [28]:
import pandas as pd
# One-row summary table of this run: accuracies, test loss, stage timings and
# the model's total parameter count.
summary_columns = {
    "Model": ["ConvNext Large"],
    "Test Accuracy": [test_accuracy],
    "Validation Accuracy": [val_accuracy],
    "Test Loss": [test_loss],
    "Head Training Time (s)": [head_training_time],
    "Fine-tuning Time (s)": [fine_tune_time],
    "Total Params": [model.count_params()],
}
results = pd.DataFrame(summary_columns)

In [29]:
# Print the one-row summary table as plain text.
print(results)

            Model  Test Accuracy  Validation Accuracy  Test Loss  \
0  ConvNext Large         0.8907              0.89112   0.395179   

   Head Training Time (s)  Fine-tuning Time (s)  Total Params  
0             2014.234277           2208.179708     198493220  


In [30]:
# Write the summary table to CSV (without the index column) and confirm.
results.to_csv(path_or_buf="ConvNext Large.csv", index=False)
print("\nResults saved to ConvNext Large.csv")


Results saved to ConvNext Large.csv
