In [1]:
import os
import numpy as np
import tensorflow as tf
from sklearn.model_selection import train_test_split
from tensorflow.keras.utils import to_categorical

# Function to load data
def load_data(data_dir, emotion_labels):
    """Load a directory-per-class image dataset into NumPy arrays.

    ``data_dir`` must contain one sub-directory per entry of
    ``emotion_labels``. Every regular file found in such a sub-directory is
    read as a 48x48 grayscale image and divided by 255.0.

    Args:
        data_dir: Root directory holding the per-label sub-directories.
        emotion_labels: List of sub-directory names. The position of a name
            in this list is the integer class id recorded for its images.

    Returns:
        A tuple ``(faces, emotions)`` of NumPy arrays: the stacked image
        arrays and the integer class id of each image, in matching order.
        Both arrays are empty when no image file is found.
    """
    faces = []
    emotions = []
    for label in emotion_labels:
        # The class id is the same for every file of this label, so look it
        # up once per directory rather than once per image.
        class_id = emotion_labels.index(label)
        emotion_dir = os.path.join(data_dir, label)
        # os.listdir() returns entries in arbitrary order; sorting makes the
        # sample order (and any seeded split done on it) reproducible.
        for img_name in sorted(os.listdir(emotion_dir)):
            img_path = os.path.join(emotion_dir, img_name)
            if not os.path.isfile(img_path):
                # Nested directories are not images; skip them instead of
                # handing them to the image loader.
                continue
            img = tf.keras.preprocessing.image.load_img(
                img_path, color_mode='grayscale', target_size=(48, 48)
            )
            img = tf.keras.preprocessing.image.img_to_array(img)
            faces.append(img / 255.0)
            emotions.append(class_id)
    return np.array(faces), np.array(emotions)

# Define base path
# The dataset location can be overridden through the FER2013_DIR environment
# variable so the notebook also runs on other machines; the original absolute
# path remains the fallback when the variable is not set.
base_dir = os.environ.get(
    "FER2013_DIR",
    r"C:\Users\sagar\OneDrive\Desktop\DS & ML Project\fer2013_dataset",
)

# Define emotion labels (also the names of the per-class sub-directories)
emotion_labels = ['angry', 'disgust', 'fear', 'happy', 'neutral', 'sad', 'surprise']

# Define train and test paths
train_dir = os.path.join(base_dir, 'train')
test_dir = os.path.join(base_dir, 'test')

# Load training and testing data.
# The integer class ids get their own names so they are not overwritten by
# the one-hot arrays below and can be used for the stratified split.
train_faces, train_label_ids = load_data(train_dir, emotion_labels)
test_faces, test_label_ids = load_data(test_dir, emotion_labels)

# One-hot encode the emotion labels
train_emotions = to_categorical(train_label_ids, num_classes=len(emotion_labels))
test_emotions = to_categorical(test_label_ids, num_classes=len(emotion_labels))

# Split training data into training and validation sets.
# stratify= keeps the per-class proportions the same in both parts, so the
# validation metrics are not skewed by a class being under-sampled by chance.
X_train, X_val, y_train, y_val = train_test_split(
    train_faces,
    train_emotions,
    test_size=0.2,
    random_state=42,
    stratify=train_label_ids,
)


In [2]:
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv2D, MaxPooling2D, Dropout, Flatten, Dense, BatchNormalization, Input


In [3]:
# Build the model
def build_model(input_shape=(48, 48, 1), num_classes=7):
    """Assemble the CNN classifier as a Keras ``Sequential`` model.

    The network is four convolutional stages, each made of
    Conv2D(ReLU, 'same' padding) -> BatchNormalization -> 2x2 MaxPooling ->
    Dropout(0.25), followed by Flatten, a 256-unit ReLU dense layer with
    BatchNormalization and Dropout(0.25), and a softmax output layer.

    Args:
        input_shape: Shape of one input sample, passed to ``Input``.
        num_classes: Number of units in the softmax output layer.

    Returns:
        The uncompiled ``Sequential`` model.
    """
    # (filters, kernel size) of the four convolutional stages, in order.
    conv_stages = (
        (64, (3, 3)),
        (128, (5, 5)),
        (512, (3, 3)),
        (512, (3, 3)),
    )

    net = Sequential()

    # Input layer
    net.add(Input(shape=input_shape))

    # Convolutional stages
    for filters, kernel_size in conv_stages:
        net.add(Conv2D(filters, kernel_size, padding='same', activation='relu'))
        net.add(BatchNormalization())
        net.add(MaxPooling2D(pool_size=(2, 2)))
        net.add(Dropout(0.25))

    # Flattening
    net.add(Flatten())

    # Fully connected layer
    net.add(Dense(256, activation='relu'))
    net.add(BatchNormalization())
    net.add(Dropout(0.25))

    # Output layer: one unit per class
    net.add(Dense(num_classes, activation='softmax'))
    return net


# Size the output layer from the label list instead of repeating the literal
# 7, so it stays in step with the one-hot encoding of the targets.
model = build_model(num_classes=len(emotion_labels))


In [4]:
# Inspect the model
# The network is defined once, in the cell above. Rebuilding the identical
# layer stack here would only create a second, equivalent model and throw the
# first one away, so this cell just prints the layer-by-layer summary
# (output shapes and parameter counts) to check before compiling.
model.summary()


In [5]:
# Configure training: Adam optimizer, categorical cross-entropy loss
# (targets are one-hot encoded) and accuracy as the reported metric.
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)


In [6]:
# Train the model
# Stop once the validation loss has not improved for `patience` consecutive
# epochs and roll the model back to the best weights seen, rather than always
# running every epoch and keeping whatever the last epoch produced.
early_stopping = tf.keras.callbacks.EarlyStopping(
    monitor='val_loss',
    patience=8,
    restore_best_weights=True,
)

history = model.fit(
    X_train,
    y_train,
    epochs=50,  # upper bound; early stopping may end training sooner
    validation_data=(X_val, y_val),
    callbacks=[early_stopping],
)


Epoch 1/50
718/718 ━━━━━━━━━━━━━━━━━━━━ 293s 397ms/step - accuracy: 0.2410 - loss: 2.1149 - val_accuracy: 0.3441 - val_loss: 1.6977
Epoch 2/50
718/718 ━━━━━━━━━━━━━━━━━━━━ 281s 391ms/step - accuracy: 0.4187 - loss: 1.5167 - val_accuracy: 0.3295 - val_loss: 1.6940
Epoch 3/50
718/718 ━━━━━━━━━━━━━━━━━━━━ 281s 392ms/step - accuracy: 0.5112 - loss: 1.2867 - val_accuracy: 0.4920 - val_loss: 1.3232
Epoch 4/50
718/718 ━━━━━━━━━━━━━━━━━━━━ 284s 395ms/step - accuracy: 0.5583 - loss: 1.1686 - val_accuracy: 0.5430 - val_loss: 1.1986
Epoch 5/50
718/718 ━━━━━━━━━━━━━━━━━━━━ 281s 392ms/step - accuracy: 0.5950 - loss: 1.0885 - val_accuracy: 0.5343 - val_loss: 1.2065
Epoch 6/50
718/718 ━━━━━━━━━━━━━━━━━━━━ 281s 392ms/step - accuracy: 0.6153 - loss: 1.0280 - val_accuracy: 0.5512 - val_loss: 1.2048
Epoc

In [7]:
from tensorflow.keras.models import load_model

# Write the trained model to disk, asking Keras to leave out the optimizer state
model.save('emotion_detection_model.keras', include_optimizer=False)

# Read the saved file back and rebind `model` to the reloaded copy
model = load_model('emotion_detection_model.keras')

# Re-compile the reloaded model so its loss and metrics are configured
model.compile(
    loss='categorical_crossentropy',
    optimizer='adam',
    metrics=['accuracy'],
)


In [None]:
import cv2

# Define emotion labels (display names, indexed by the model's output position)
emotion_labels = ['Angry', 'Disgust', 'Fear', 'Happy', 'Neutral', 'Sad', 'Surprise']

# Load the face detector once. It does not change between frames, so
# re-reading the cascade file inside the loop is wasted work.
face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_default.xml')

# Start webcam
cap = cv2.VideoCapture(0)

try:
    while True:
        ret, frame = cap.read()
        if not ret:
            # No frame could be read (camera missing or stream ended).
            break
        gray = cv2.cvtColor(frame, cv2.COLOR_BGR2GRAY)
        faces = face_cascade.detectMultiScale(gray, scaleFactor=1.3, minNeighbors=5)

        for (x, y, w, h) in faces:
            # Crop the detected face and bring it to the model's input
            # format: 48x48, divided by 255, with batch and channel axes.
            roi_gray = gray[y:y+h, x:x+w]
            roi_gray = cv2.resize(roi_gray, (48, 48))
            roi_gray = roi_gray.astype('float') / 255.0
            roi_gray = np.expand_dims(roi_gray, axis=0)
            roi_gray = np.expand_dims(roi_gray, axis=-1)
            # verbose=0 suppresses the progress bar predict() would
            # otherwise print for every face in every frame.
            prediction = model.predict(roi_gray, verbose=0)
            maxindex = int(np.argmax(prediction))
            # Keep the caption inside the frame when the face touches the
            # top edge (y - 10 would otherwise fall above the image).
            text_origin = (x, max(y - 10, 25))
            cv2.putText(frame, emotion_labels[maxindex], text_origin, cv2.FONT_HERSHEY_SIMPLEX, 1, (0, 255, 0), 2, cv2.LINE_AA)
            cv2.rectangle(frame, (x, y), (x+w, y+h), (0, 255, 0), 2)

        cv2.imshow('Emotion Detector', frame)

        # Exit the loop when 'q' key is pressed
        if cv2.waitKey(1) & 0xFF == ord('q'):
            break
finally:
    # Release the webcam and close all OpenCV windows even when the loop is
    # left through an exception or a kernel interrupt.
    cap.release()
    cv2.destroyAllWindows()
