In [8]:
import numpy as np
import pandas as pd
import tensorflow as tf
from tensorflow.keras.preprocessing.image import ImageDataGenerator
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Flatten, Dense

**Read dataset**

In [9]:
filtered_clothing = pd.read_csv('filtered_clothing_dataset.csv')

**Split dataset in training and testing set**

In [10]:
eighty_pct = int(0.8*len(filtered_clothing))
  
train_set = filtered_clothing.iloc[:(eighty_pct-1), :] 
test_set = filtered_clothing.iloc[eighty_pct:, :] 
  
train_set.to_csv("train_data.csv")
test_set.to_csv("test_data.csv")

**Loading the dataset**

In [11]:
train_data = pd.read_csv('train_data.csv')
test_data = pd.read_csv('test_data.csv')

In [12]:
# image dimensions and batch size
img_width, img_height = 224, 224
batch_size = 32

# data generators for training and validation
train_datagen = ImageDataGenerator(rescale=1./255,
                                   shear_range=0.2,
                                   zoom_range=0.2,
                                   horizontal_flip=True)

test_datagen = ImageDataGenerator(rescale=1./255)

train_data['id'] = train_data['id'].astype(str) + '.jpg'
test_data['id'] = test_data['id'].astype(str) + '.jpg'

train_generator = train_datagen.flow_from_dataframe(
    dataframe=train_data,
    directory='filtered_images',
    x_col="id",
    y_col="subCategory",
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='categorical')

validation_generator = test_datagen.flow_from_dataframe(
    dataframe=test_data,
    directory='filtered_images',
    x_col="id",
    y_col="subCategory",
    target_size=(img_width, img_height),
    batch_size=batch_size,
    class_mode='categorical')

Found 22615 validated image filenames belonging to 7 classes.
Found 5655 validated image filenames belonging to 7 classes.


**Defining the CNN model**

In [13]:
model = Sequential([
    Conv2D(32, (3, 3), activation='relu', input_shape=(img_width, img_height, 3)),
    MaxPooling2D((2, 2)),
    Conv2D(64, (3, 3), activation='relu'),
    MaxPooling2D((2, 2)),
    Conv2D(128, (3, 3), activation='relu'),
    MaxPooling2D((2, 2)),
    Conv2D(128, (3, 3), activation='relu'),
    MaxPooling2D((2, 2)),
    Flatten(),
    Dense(512, activation='relu'),
    Dense(7, activation='softmax')  # 7 categories in the dataset
])

model.compile(optimizer='adam',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

model.summary()

  super().__init__(


**Model training**

In [15]:
# number of training and validation steps
train_steps = train_generator.samples // batch_size
validation_steps = validation_generator.samples // batch_size

# model training
history = model.fit(
    train_generator,
    steps_per_epoch=train_steps,
    epochs=10,  # adjust as needed
    validation_data=validation_generator,
    validation_steps=validation_steps)

Epoch 1/10


  self._warn_if_super_not_called()


[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1146s[0m 2s/step - accuracy: 0.8112 - loss: 0.5776 - val_accuracy: 0.9364 - val_loss: 0.1930
Epoch 2/10
[1m  1/706[0m [37m━━━━━━━━━━━━━━━━━━━━[0m [1m12:26[0m 1s/step - accuracy: 0.9375 - loss: 0.1215

  self.gen.throw(typ, value, traceback)


[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 403us/step - accuracy: 0.9375 - loss: 0.0608 - val_accuracy: 0.9565 - val_loss: 0.0591
Epoch 3/10
[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m885s[0m 1s/step - accuracy: 0.9382 - loss: 0.1917 - val_accuracy: 0.9547 - val_loss: 0.1604
Epoch 4/10
[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 298us/step - accuracy: 0.9688 - loss: 0.0257 - val_accuracy: 1.0000 - val_loss: 0.0172
Epoch 5/10
[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m888s[0m 1s/step - accuracy: 0.9510 - loss: 0.1439 - val_accuracy: 0.9627 - val_loss: 0.1326
Epoch 6/10
[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 299us/step - accuracy: 1.0000 - loss: 0.0090 - val_accuracy: 0.8696 - val_loss: 0.1008
Epoch 7/10
[1m706/706[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m888s[0m 1s/step - accuracy: 0.9618 - loss: 0.1138 - val_accuracy: 0.9513 - val_loss: 0.1622
Epoch 8/10
[1m706/706[0m [3

**Model evaluation**

In [16]:
test_loss, test_accuracy = model.evaluate(validation_generator, steps=validation_steps)
print("Test Loss:", test_loss)
print("Test Accuracy:", test_accuracy)

[1m176/176[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m63s[0m 357ms/step - accuracy: 0.9534 - loss: 0.1462
Test Loss: 0.14031553268432617
Test Accuracy: 0.955078125


**Save model**

In [17]:
model.save('CNN_model_11032024.keras')
print("Saving the model as CNN_model_11032024")

Saving the model as CNN_model_11032024
