In [1]:
import os
from PIL import Image
import numpy as np
from sklearn.preprocessing import LabelEncoder
from tensorflow.keras.utils import to_categorical

# Root folder of the image domain to load; each sub-folder is one class.
directory_path = r'F:\OfficeHomeDataset_10072016\OfficeHomeDataset_10072016\Real World'

# Accumulators for the image arrays and their integer class labels.
X = []
Y = []

# NOTE: this encoder is never fitted or used in this cell; it is kept only so
# the name stays defined for any other cell that might reference it.
label_encoder = LabelEncoder()

# Maps each class folder name to the integer label assigned to it.
folder_to_label = {}

# os.listdir() returns entries in arbitrary order, so the class folders are
# sorted to make the folder -> label mapping deterministic. Any other loader
# that enumerates the same folder names in sorted order gets the same indices.
# Entries that are not directories are skipped so a stray file neither crashes
# the inner os.listdir() call nor shifts the label indices.
class_folders = sorted(
    entry
    for entry in os.listdir(directory_path)
    if os.path.isdir(os.path.join(directory_path, entry))
)

for index, class_folder in enumerate(class_folders):
    class_path = os.path.join(directory_path, class_folder)
    folder_to_label[class_folder] = index

    # Sorted so the sample order (and therefore any seeded split of X/Y) is
    # reproducible across machines and file systems.
    for image_file in sorted(os.listdir(class_path)):
        if not image_file.endswith('.jpg'):
            continue

        image_path = os.path.join(class_path, image_file)
        try:
            # The context manager closes the underlying file handle once the
            # pixels have been copied into the NumPy array.
            with Image.open(image_path) as img:
                img_array = np.array(img.convert('RGB').resize((32, 32)))
        except Exception as e:
            # Best effort: report the unreadable file and move on.
            print(f"Error processing image file {image_file}: {e}")
            continue

        X.append(img_array)
        Y.append(index)

# Stack the per-image arrays into a single array.
X = np.array(X)

# One-hot encode the integer labels into 65 columns.
Y = to_categorical(Y, num_classes=65)  # 65 different folders

print(f'X shape: {X.shape}')
print(f'Y shape: {Y.shape}')


X shape: (4357, 32, 32, 3)
Y shape: (4357, 65)


In [2]:
from sklearn.model_selection import train_test_split

# Keep only 1% of the samples for training; the remaining 99% become the
# upper-case X_test / Y_test arrays that the evaluation cells predict on.
X_train, X_test, Y_train, Y_test = train_test_split(
    X,
    Y,
    test_size=0.99,
    random_state=42,
)

# Report the shape of each of the four arrays, one per line.
print(
    f'X_train shape: {X_train.shape}',
    f'Y_train shape: {Y_train.shape}',
    f'X_test shape: {X_test.shape}',
    f'Y_test shape: {Y_test.shape}',
    sep='\n',
)


X_train shape: (43, 32, 32, 3)
Y_train shape: (43, 65)
X_test shape: (4314, 32, 32, 3)
Y_test shape: (4314, 65)


In [24]:
import os
from PIL import Image
import numpy as np
from sklearn.preprocessing import LabelEncoder
from tensorflow.keras.utils import to_categorical

# Root folder of the image domain to load; each sub-folder is one class.
directory_path = r'F:\OfficeHomeDataset_10072016\OfficeHomeDataset_10072016\Product'

# Accumulators for the image arrays and their integer class labels.
# Rebinding X / Y here replaces whatever an earlier cell stored in them.
X = []
Y = []

# NOTE: this encoder is never fitted or used in this cell; it is kept only so
# the name stays defined for any other cell that might reference it.
label_encoder = LabelEncoder()

# Maps each class folder name to the integer label assigned to it.
folder_to_label = {}

# os.listdir() returns entries in arbitrary order, so the class folders are
# sorted to make the folder -> label mapping deterministic. Any other loader
# that enumerates the same folder names in sorted order gets the same indices.
# Entries that are not directories are skipped so a stray file neither crashes
# the inner os.listdir() call nor shifts the label indices.
class_folders = sorted(
    entry
    for entry in os.listdir(directory_path)
    if os.path.isdir(os.path.join(directory_path, entry))
)

for index, class_folder in enumerate(class_folders):
    class_path = os.path.join(directory_path, class_folder)
    folder_to_label[class_folder] = index

    # Sorted so the sample order (and therefore any seeded split of X/Y) is
    # reproducible across machines and file systems.
    for image_file in sorted(os.listdir(class_path)):
        if not image_file.endswith('.jpg'):
            continue

        image_path = os.path.join(class_path, image_file)
        try:
            # The context manager closes the underlying file handle once the
            # pixels have been copied into the NumPy array.
            with Image.open(image_path) as img:
                img_array = np.array(img.convert('RGB').resize((32, 32)))
        except Exception as e:
            # Best effort: report the unreadable file and move on.
            print(f"Error processing image file {image_file}: {e}")
            continue

        X.append(img_array)
        Y.append(index)

# Stack the per-image arrays into a single array.
X = np.array(X)

# One-hot encode the integer labels into 65 columns.
Y = to_categorical(Y, num_classes=65)  # 65 different folders

print(f'X shape: {X.shape}')
print(f'Y shape: {Y.shape}')


X shape: (4439, 32, 32, 3)
Y shape: (4439, 65)


In [25]:
from sklearn.model_selection import train_test_split

# Hold out 1% of the samples; the lower-case x_train / y_train arrays are the
# ones passed to the fit() calls. These names are distinct from the upper-case
# X_train / X_test / Y_train / Y_test produced by the test_size=0.99 split.
x_train, x_test, y_train, y_test = train_test_split(
    X,
    Y,
    test_size=0.01,
    random_state=42,
)

# Report the shape of each of the four arrays, one per line. The printed
# labels are capitalised even though the variables are lower-case.
print(
    f'X_train shape: {x_train.shape}',
    f'Y_train shape: {y_train.shape}',
    f'X_test shape: {x_test.shape}',
    f'Y_test shape: {y_test.shape}',
    sep='\n',
)


X_train shape: (4394, 32, 32, 3)
Y_train shape: (4394, 65)
X_test shape: (45, 32, 32, 3)
Y_test shape: (45, 65)


In [26]:
from tensorflow import keras
# Load the previously saved Keras model that serves as the starting point.
model = keras.models.load_model(r"C:\Users\shaif\Downloads\office_real_32_model.h5")

from tensorflow.keras.applications import ResNet50
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, GlobalAveragePooling2D

# Width of the new softmax layer; matches the 65 one-hot label columns.
num_classes = 65

# Build a replacement head: take the output of the fourth-from-last layer of
# the loaded model, pool it, and classify it with a fresh softmax layer.
# NOTE(review): GlobalAveragePooling2D presumably requires that layer's output
# to still be a 4-D feature map - confirm against the saved architecture.
x = GlobalAveragePooling2D()(model.layers[-4].output)
output = Dense(num_classes, activation='softmax')(x)

# Wire the loaded model's input to the new head and compile.
new_model = keras.models.Model(inputs=model.input, outputs=output)
new_model.compile(
    optimizer='Adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# Fit on x_train / y_train, holding out 20% of them for validation. No
# callbacks are passed, so there is no early stopping and all 50 epochs run.
new_model.fit(
    x_train,
    y_train,
    validation_split=0.2,
    batch_size=32,
    epochs=50,
)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


<keras.callbacks.History at 0x1fc3f40c250>

In [27]:
import numpy as np
from sklearn.metrics import accuracy_score, f1_score

# Score new_model on X_test / Y_test. These upper-case names are the arrays
# assigned by the test_size=0.99 split; they are not the lower-case
# x_test / y_test produced by the test_size=0.01 split.
# NOTE(review): confirm that evaluating on this set rather than x_test / y_test
# is intended.
y_pred_prob = new_model.predict(X_test)

# Collapse the per-class probabilities and the one-hot targets to integer
# class indices so the sklearn metrics can compare them.
y_pred = y_pred_prob.argmax(axis=1)
y_test_labels = Y_test.argmax(axis=1)

# Accuracy and micro-averaged F1 over the predicted vs. true class indices.
accuracy = accuracy_score(y_test_labels, y_pred)
f1_micro = f1_score(y_test_labels, y_pred, average='micro')

print("Accuracy:", accuracy)
print("F1 Score (Micro):", f1_micro)

Accuracy: 0.09457579972183588
F1 Score (Micro): 0.09457579972183588


In [34]:
from tensorflow.keras.applications import ResNet50
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, GlobalAveragePooling2D

# Create the ResNet model without the top (fully connected) layers
from tensorflow.keras.applications import ResNet50

# ResNet50 backbone without its classification top, built for 32x32 RGB
# inputs; weights=None means no pretrained weights are loaded.
base_model = ResNet50(weights=None, include_top=False, input_shape=(32, 32, 3))

# Stack the backbone, a global average pool and a 65-way softmax classifier.
# This rebinds the name `model` to the new network.
model = Sequential([
    base_model,
    GlobalAveragePooling2D(),
    Dense(65, activation='softmax'),
])

model.compile(
    optimizer='Adam',
    loss='categorical_crossentropy',
    metrics=['accuracy'],
)

# Fit on x_train / y_train for 50 epochs, holding out 20% for validation.
model.fit(
    x_train,
    y_train,
    batch_size=32,
    epochs=50,
    validation_split=.2,
)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


<keras.callbacks.History at 0x1fc3f2810d0>

In [35]:
import numpy as np
from sklearn.metrics import accuracy_score, f1_score

# Score `model` on X_test / Y_test. These upper-case names are the arrays
# assigned by the test_size=0.99 split; they are not the lower-case
# x_test / y_test produced by the test_size=0.01 split.
# NOTE(review): confirm that evaluating on this set rather than x_test / y_test
# is intended.
y_pred_prob = model.predict(X_test)

# Collapse the per-class probabilities and the one-hot targets to integer
# class indices so the sklearn metrics can compare them.
y_pred = y_pred_prob.argmax(axis=1)
y_test_labels = Y_test.argmax(axis=1)

# Accuracy and micro-averaged F1 over the predicted vs. true class indices.
accuracy = accuracy_score(y_test_labels, y_pred)
f1_micro = f1_score(y_test_labels, y_pred, average='micro')

print("Accuracy:", accuracy)
print("F1 Score (Micro):", f1_micro)

Accuracy: 0.09040333796940195
F1 Score (Micro): 0.09040333796940195
