# Emotion Recognition and Analysis using DeepFace and MongoDB
This notebook accesses your webcam through Google Colab, runs DeepFace emotion recognition on the captured frames, and stores the results in a MongoDB database.

In [None]:
! pip install deepface
! pip install pymongo

Collecting deepface
  Downloading deepface-0.0.79-py3-none-any.whl (49 kB)
[?25l     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m0.0/49.6 kB[0m [31m?[0m eta [36m-:--:--[0m[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m49.6/49.6 kB[0m [31m3.7 MB/s[0m eta [36m0:00:00[0m
Collecting mtcnn>=0.1.0 (from deepface)
  Downloading mtcnn-0.1.1-py3-none-any.whl (2.3 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m2.3/2.3 MB[0m [31m55.8 MB/s[0m eta [36m0:00:00[0m
[?25hCollecting retina-face>=0.0.1 (from deepface)
  Downloading retina_face-0.0.13-py3-none-any.whl (16 kB)
Collecting fire>=0.4.0 (from deepface)
  Downloading fire-0.5.0.tar.gz (88 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m88.3/88.3 kB[0m [31m10.8 MB/s[0m eta [36m0:00:00[0m
[?25h  Preparing metadata (setup.py) ... [?25l[?25hdone
Collecting gunicorn>=20.1.0 (from deepface)
  Downloading gunicorn-21.1.0-py3-none-any.whl (80 kB)
[2K     [9

In [None]:
# import dependencies
from IPython.display import display, Javascript, Image
from google.colab.output import eval_js
from base64 import b64decode, b64encode
import cv2
import numpy as np
import PIL
import io
import html
import time
from pymongo.mongo_client import MongoClient
from pymongo.server_api import ServerApi
from google.colab.patches import cv2_imshow
from deepface import DeepFace
import matplotlib.pyplot as plt
from PIL import Image
from bson.binary import Binary

Directory  /root /.deepface created
Directory  /root /.deepface/weights created


In [None]:
from pymongo.mongo_client import MongoClient
from pymongo.server_api import ServerApi

import os
from getpass import getpass

# The connection string embeds the database credentials, so it must never be
# pasted into the notebook. Read it from the MONGODB_URI environment variable,
# or prompt for it (without echoing) when the variable is not set.
uri = os.environ.get("MONGODB_URI") or getpass("MongoDB connection URI: ")

# Create a new client and connect to the server
client = MongoClient(uri, server_api=ServerApi('1'))

# Send a ping to confirm a successful connection
try:
    client.admin.command('ping')
    print("Pinged your deployment. You successfully connected to MongoDB!")
except Exception as e:
    # Best-effort connectivity check: report the failure but keep the notebook running.
    print(e)

Pinged your deployment. You successfully connected to MongoDB!


In [None]:
# select the database that holds the result collections
db = client['StudentRecord']

## Helper Functions
Below are a few helper functions that make it easier to convert between different image data types and formats.

In [None]:
from datetime import datetime

def get_datetime_info():
    """Return the current date and time split into its individual components.

    Returns:
        dict: integer ``month``, ``day``, ``year``, ``hour``, ``minute`` and
        ``second`` entries, plus ``iso_time`` holding the ISO-8601 string of
        the same instant.
    """
    # Take a single snapshot so that every field describes the same moment.
    snapshot = datetime.now()

    component_names = ("month", "day", "year", "hour", "minute", "second")
    info = {name: getattr(snapshot, name) for name in component_names}
    info["iso_time"] = snapshot.isoformat()

    return info


In [None]:
# function to convert the JavaScript object into an OpenCV image
# This function was taken from the notebook: 'Google Colab: Access Webcam for Images and Video'
# https://colab.research.google.com/drive/1QnC7lV7oVFk5OZCm75fqbLAfD9qBy9bw

def js_to_image(js_reply):
  """
  Decode a webcam frame sent by the browser into an OpenCV image.

  Params:
          js_reply: string of the form "<header>,<base64 data>" holding the captured image
  Returns:
          img: OpenCV BGR image
  """
  # the base64 payload is the piece that follows the first comma
  encoded_frame = js_reply.split(',')[1]
  # base64 text -> raw bytes -> flat uint8 buffer that OpenCV can decode
  raw_pixels = np.frombuffer(b64decode(encoded_frame), dtype=np.uint8)
  # IMREAD_COLOR (== 1) decodes to a 3-channel BGR image
  return cv2.imdecode(raw_pixels, flags=cv2.IMREAD_COLOR)

# function to convert an OpenCV rectangle bounding-box image into a base64 string to be overlaid on the video stream
def bbox_to_bytes(bbox_array):
  """
  Turn an RGBA overlay array into a PNG data string for the browser.

  Params:
          bbox_array: Numpy array (pixels) containing rectangle to overlay on video stream.
  Returns:
        str: 'data:image/png;base64,...' string containing the PNG-encoded overlay
  """
  png_buffer = io.BytesIO()
  # read the array as RGBA pixels and write it out as PNG into the in-memory buffer
  PIL.Image.fromarray(bbox_array, 'RGBA').save(png_buffer, format='png')
  # base64-encode the PNG bytes and prepend the data-URL header
  encoded_png = b64encode(png_buffer.getvalue()).decode('utf-8')

  return 'data:image/png;base64,' + encoded_png

## Haar Cascade Classifier
For this tutorial we will run a simple object detection algorithm called Haar Cascade on our images and video fetched from our webcam. OpenCV has a pre-trained Haar Cascade face detection model.

In [None]:
# load the pre-trained frontal-face Haar Cascade model that ships with OpenCV
face_cascade = cv2.CascadeClassifier(
    cv2.samples.findFile(
        cv2.data.haarcascades + 'haarcascade_frontalface_default.xml'
    )
)

## Data Collection



In [None]:
# JavaScript to properly create our live video stream using our webcam as input
# This function was taken from the notebook: 'Google Colab: Access Webcam for Images and Video'
# https://colab.research.google.com/drive/1QnC7lV7oVFk5OZCm75fqbLAfD9qBy9bw

def video_stream():
  """
  Inject the JavaScript that drives the live webcam preview into the cell output.

  The script defines `stream_frame(label, imgData)` in the browser, which
  `video_frame` invokes through `eval_js`. On its first call it builds the
  preview (status label, <video> element, overlay <img> and a "click to stop"
  instruction) and requests the camera via `getUserMedia`. Every call updates
  the label and overlay when they are non-empty, then resolves with a dict
  holding timing fields ('create', 'show', 'capture') and the current frame as
  a JPEG data URL under 'img'.

  Clicking the video, the overlay or the instruction text sets a shutdown flag;
  the next `stream_frame` call then removes the DOM elements, stops the camera
  track and returns ''.

  NOTE(review): if the click happens while a capture is pending, the pending
  promise is resolved with an empty 'img' string and no further animation
  frame is requested, so callers should treat an empty 'img' as end of stream.

  Returns:
          None. The Javascript object is shown with `display` as a side effect.
  """
  js = Javascript('''
    var video;
    var div = null;
    var stream;
    var captureCanvas;
    var imgElement;
    var labelElement;

    var pendingResolve = null;
    var shutdown = false;
  //This function closes everything when needed
    function removeDom() {
       stream.getVideoTracks()[0].stop();
       video.remove();
       div.remove();
       video = null;
       div = null;
       stream = null;
       imgElement = null;
       captureCanvas = null;
       labelElement = null;
    }

    function onAnimationFrame() {
      if (!shutdown) {
        window.requestAnimationFrame(onAnimationFrame);
      }
      if (pendingResolve) {
        var result = "";
        if (!shutdown) {
          captureCanvas.getContext('2d').drawImage(video, 0, 0, 640, 480);
          result = captureCanvas.toDataURL('image/jpeg', 0.8)
        }
        var lp = pendingResolve;
        pendingResolve = null;
        lp(result);
      }
    }

    async function createDom() {
      if (div !== null) {
        return stream;
      }

      div = document.createElement('div');
      div.style.border = '2px solid black';
      div.style.padding = '3px';
      div.style.width = '100%';
      div.style.maxWidth = '600px';
      document.body.appendChild(div);

      const modelOut = document.createElement('div');
      modelOut.innerHTML = "<span>Status:</span>";
      labelElement = document.createElement('span');
      labelElement.innerText = 'No data';
      labelElement.style.fontWeight = 'bold';
      modelOut.appendChild(labelElement);
      div.appendChild(modelOut);

      video = document.createElement('video');
      video.style.display = 'block';
      video.width = div.clientWidth - 6;
      video.setAttribute('playsinline', '');
      video.onclick = () => { shutdown = true; };
      stream = await navigator.mediaDevices.getUserMedia(
          {video: { facingMode: "environment"}});
      div.appendChild(video);

      imgElement = document.createElement('img');
      imgElement.style.position = 'absolute';
      imgElement.style.zIndex = 1;
      imgElement.onclick = () => { shutdown = true; };
      div.appendChild(imgElement);

      const instruction = document.createElement('div');
      instruction.innerHTML =
          '<span style="color: red; font-weight: bold;">' +
          'When finished, click here or on the video to stop this demo</span>';
      div.appendChild(instruction);
      instruction.onclick = () => { shutdown = true; };

      video.srcObject = stream;
      await video.play();

      captureCanvas = document.createElement('canvas');
      captureCanvas.width = 640; //video.videoWidth;
      captureCanvas.height = 480; //video.videoHeight;
      window.requestAnimationFrame(onAnimationFrame);

      return stream;
    }
    async function stream_frame(label, imgData) {
      if (shutdown) {
        removeDom();
        shutdown = false;
        return '';
      }

      var preCreate = Date.now();
      stream = await createDom();

      var preShow = Date.now();
      if (label != "") {
        labelElement.innerHTML = label;
      }

      if (imgData != "") {
        var videoRect = video.getClientRects()[0];
        imgElement.style.top = videoRect.top + "px";
        imgElement.style.left = videoRect.left + "px";
        imgElement.style.width = videoRect.width + "px";
        imgElement.style.height = videoRect.height + "px";
        imgElement.src = imgData;
      }

      var preCapture = Date.now();
      var result = await new Promise(function(resolve, reject) {
        pendingResolve = resolve;
      });
      shutdown = false;

      return {'create': preShow - preCreate,
              'show': preCapture - preShow,
              'capture': Date.now() - preCapture,
              'img': result};
    }
    ''')

  # render the script in the cell output so the browser executes it
  display(js)

def video_frame(label, bbox):
  """
  Push the status label and overlay to the browser and fetch the next webcam frame.

  Params:
          label: text/HTML shown next to "Status:"; an empty string leaves it unchanged
          bbox: overlay image as a data-URL string; an empty string leaves it unchanged
  Returns:
          data: the value the page's stream_frame() resolves to - a dict with
                timing fields and the captured frame under 'img', or '' once
                the stream has been shut down
  """
  import json  # local import: only needed to build the JavaScript call below

  # json.dumps produces a quoted, fully escaped string literal, so quotes,
  # backslashes or newlines inside `label` / `bbox` can no longer break (or
  # inject code into) the generated JavaScript. str() keeps the behaviour of
  # the previous "{}".format() for non-string arguments.
  call = 'stream_frame({}, {})'.format(json.dumps(str(label)), json.dumps(str(bbox)))
  data = eval_js(call)
  return data

# Demo

In [None]:
# Change the collection name every time the notebook is run
collection = db['entryDemo']


In [None]:
# start streaming video from webcam
video_stream()
# label for video
label_html = 'Capturing...'
# initialize bounding box to empty
bbox = ''
count = 0
# index of the captured frame, stored with every record
frame = 0

while True:
    js_reply = video_frame(label_html, bbox)
    # '' means the stream was shut down. An empty 'img' means the user clicked
    # "stop" while this frame was being captured; there is nothing to decode
    # and the browser will not deliver further frames.
    if not js_reply or not js_reply["img"]:
        break

    # convert JS response to OpenCV Image (BGR channel order)
    img = js_to_image(js_reply["img"])

    # create transparent overlay for bounding box
    bbox_array = np.zeros([480,640,4], dtype=np.uint8)

    # With enforce_detection=True DeepFace raises ValueError when it cannot
    # find a face. Treat that as "nothing to record for this frame" instead of
    # letting it terminate the capture loop.
    try:
        emotion_predictions = DeepFace.analyze(img, actions=['emotion'], enforce_detection=True)
    except ValueError:
        emotion_predictions = []

    if emotion_predictions:
        # NOTE: the emotion of the first face reported by DeepFace is attached
        # to every Haar Cascade box found below.
        emotions = emotion_predictions[0]['emotion']
        dom_em = max(emotions, key=emotions.get)
        # round every score to two significant digits before storing it
        emotion_distribution = {k: float(format(v, '.2g')) for k, v in emotions.items()}

        # grayscale image for face detection; the decoded frame is BGR, so the
        # conversion has to be BGR2GRAY (RGB2GRAY would swap the red/blue weights)
        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

        # get face region coordinates
        faces = face_cascade.detectMultiScale(gray)
        # get face bounding box for overlay
        for (x,y,w,h) in faces:
            bbox_array = cv2.rectangle(bbox_array,(x,y),(x+w,y+h),(255,0,0),2)
            bbox_array = cv2.putText(bbox_array, dom_em, (x,y), cv2.FONT_HERSHEY_PLAIN, 4, (0,180,0), 3, cv2.LINE_AA)

            # store the cropped face as JPEG bytes; skip the record if encoding fails
            encoded_ok, img_encoded = cv2.imencode('.jpg', img[y:y+h,x:x+w])
            if not encoded_ok:
                continue
            image_bytes = img_encoded.tobytes()

            result = {
                'emotion_distribution': emotion_distribution,
                'dominant_emotion': dom_em,
                'time': get_datetime_info(),
                'image': Binary(image_bytes),
                'frame_number': frame
            }
            collection.insert_one(result)

    # make every drawn pixel opaque and leave the rest of the overlay transparent
    bbox_array[:,:,3] = (bbox_array.max(axis = 2) > 0 ).astype(int) * 255
    # convert overlay of bbox into bytes
    bbox_bytes = bbox_to_bytes(bbox_array)
    # update bbox so next frame gets new overlay
    bbox = bbox_bytes
    frame += 1

<IPython.core.display.Javascript object>

facial_expression_model_weights.h5 will be downloaded...


Downloading...
From: https://github.com/serengil/deepface_models/releases/download/v1.0/facial_expression_model_weights.h5
To: /root/.deepface/weights/facial_expression_model_weights.h5
100%|██████████| 5.98M/5.98M [00:00<00:00, 68.9MB/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00,  2.02it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 13.45it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 13.99it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00,  8.41it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00,  8.13it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 14.94it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 14.39it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 13.35it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 14.32it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 14.38it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00,  8.58it/s]
Action: emotion: 100%|██████████| 1/1 [00:00<00:00, 10.36it/s]


In [None]:
# To review another run, point `collection` at it first, e.g.
#   collection = db.entryUD7
# To review only specific emotions, pass a filter to find(), e.g.
#   collection.find({'dominant_emotion': {'$in': ['sad', 'angry']}})
documents = collection.find()

# Display the stored face image of every record
for doc in documents:
    emotion = doc['dominant_emotion']

    # Load the image from the stored byte array. PIL.Image is spelled out
    # because the bare name `Image` is imported from both IPython.display and
    # PIL in this notebook.
    pil_image = PIL.Image.open(io.BytesIO(doc['image']))

    # Display the image using matplotlib
    fig, ax = plt.subplots()
    ax.imshow(pil_image)
    ax.set_title(f"Emotion: {emotion}")
    ax.axis('off')
    plt.show()
    # release the figure so that a long collection does not accumulate open figures
    plt.close(fig)