# 0. Install and Import Dependencies

In [30]:
!pip install mediapipe opencv-python pandas scikit-learn



In [14]:
import mediapipe as mp # Import mediapipe
import cv2 # Import opencv

In [15]:
mp_drawing = mp.solutions.drawing_utils # Drawing helpers
mp_holistic = mp.solutions.holistic # Mediapipe Solutions

# 1. Make Some Detections

In [16]:
import cv2
import mediapipe as mp

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Start capturing video from the webcam
cap = cv2.VideoCapture(0)

# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed to RGB for Mediapipe processing
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (no FACE_CONNECTIONS, just landmarks)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, 
                                      mp.solutions.holistic.FACEMESH_TESSELATION,  # Use FACEMESH_TESSELATION for face mesh connections
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))
        
        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))
        
        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Show the processed image
        cv2.imshow('Raw Webcam Feed', image)

        # Break the loop if 'q' is pressed
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

# Release the video capture object and close windows
cap.release()
cv2.destroyAllWindows()


In [5]:
import cv2
import mediapipe as mp
import os

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Path to input video
video_path = r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\Vid3.mp4'

# Specify output folder and file
output_folder = 'output_videos'
if not os.path.exists(output_folder):
    os.makedirs(output_folder)
output_video_path = os.path.join(output_folder, r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\Vid3Processed.mp4')

# Start capturing video from the file
cap = cv2.VideoCapture(video_path)

# Get frame width, height, and FPS for saving the output video
frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
fps = int(cap.get(cv2.CAP_PROP_FPS))

# Define the codec and create VideoWriter object to save the video
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter(output_video_path, fourcc, fps, (frame_width, frame_height))

# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    while cap.isOpened():
        ret, frame = cap.read()
        if not ret:
            break
        
        # Recolor Feed to RGB for Mediapipe processing
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, 
                                      mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))
        
        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))
        
        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Write the processed frame to the output video
        out.write(image)
        
        # Show the processed image (optional)
        cv2.imshow('Processed Video Feed', image)

        # Break the loop if 'q' is pressed
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

# Release the video capture and writer objects, and close windows
cap.release()
out.release()
cv2.destroyAllWindows()


In [17]:
results.pose_landmarks.landmark[0].visibility

0.9999231100082397

In [18]:
results.face_landmarks.landmark[0].visibility

0.0

In [19]:
print(results.face_landmarks.landmark[0])
results.face_landmarks.landmark[0].x

x: 0.7042917609214783
y: 0.7482007741928101
z: -0.01587127335369587



0.7042917609214783

# 2. Capture Landmarks & Export to CSV
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<!--<img src="https://i.imgur.com/AzKNp7A.png">-->
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<img src="https://i.imgur.com/AzKNp7A.png">

In [20]:
import csv
import os
import numpy as np

In [21]:
num_coords = len(results.pose_landmarks.landmark)+len(results.face_landmarks.landmark)
num_coords

501

In [22]:
landmarks = ['class']
for val in range(1, num_coords+1):
    landmarks += ['x{}'.format(val), 'y{}'.format(val), 'z{}'.format(val), 'v{}'.format(val)]

In [23]:
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [24]:
with open('coords2.csv', mode='w', newline='') as f:
    csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
    csv_writer.writerow(landmarks)

In [38]:
class_name = "sad"

In [39]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (use FACEMESH_TESSELATION)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concatenate rows
            row = pose_row + face_row
            
            # Append class name 
            row.insert(0, class_name)
            
            # Export to CSV
            with open('coords2.csv', mode='a', newline='') as f:
                csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
                csv_writer.writerow(row) 
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()


# 3. Train Custom Model Using Scikit Learn

## 3.1 Read in Collected Data and Process

In [40]:
import pandas as pd
from sklearn.model_selection import train_test_split

In [41]:
df = pd.read_csv('coords2.csv')

In [42]:
df.head()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,bored,0.695377,0.535628,-1.015433,0.999973,0.739084,0.465467,-0.921336,0.999923,0.75714,...,0.004293,0.0,0.81434,0.477923,0.044335,0.0,0.823962,0.473417,0.046238,0.0
1,bored,0.696018,0.535825,-1.210933,0.999968,0.739245,0.46677,-1.107235,0.999913,0.757203,...,0.003373,0.0,0.812043,0.474216,0.04303,0.0,0.82217,0.468346,0.044998,0.0
2,bored,0.697035,0.535323,-1.354688,0.999961,0.739779,0.466585,-1.245109,0.999897,0.757645,...,0.002928,0.0,0.814081,0.472327,0.043676,0.0,0.82375,0.467295,0.045598,0.0
3,bored,0.697878,0.534776,-1.267635,0.99996,0.739979,0.466329,-1.154958,0.999894,0.757724,...,0.001868,0.0,0.812105,0.469181,0.043169,0.0,0.821586,0.464528,0.044996,0.0
4,bored,0.698973,0.53473,-1.391941,0.999957,0.740502,0.466326,-1.283805,0.999886,0.758008,...,0.001249,0.0,0.811591,0.469647,0.042169,0.0,0.821337,0.464461,0.044102,0.0


In [43]:
df.tail()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
226,sad,0.52796,0.560921,-1.392597,0.997975,0.572186,0.459613,-1.348279,0.995907,0.60153,...,-0.021214,0.0,0.667019,0.428468,0.014353,0.0,0.676906,0.417453,0.014713,0.0
227,sad,0.527991,0.56191,-1.410983,0.998018,0.572239,0.460102,-1.366928,0.996014,0.601591,...,-0.020974,0.0,0.667029,0.429084,0.014848,0.0,0.676972,0.417895,0.015247,0.0
228,sad,0.529251,0.567729,-1.54834,0.997964,0.573125,0.463024,-1.511829,0.995934,0.602393,...,-0.022289,0.0,0.674415,0.436707,0.014311,0.0,0.684611,0.424908,0.014852,0.0
229,sad,0.533709,0.573654,-1.915413,0.997984,0.576964,0.466569,-1.884927,0.995959,0.605714,...,-0.020901,0.0,0.685373,0.433797,0.018741,0.0,0.695464,0.421258,0.019448,0.0
230,sad,0.5464,0.576593,-1.801864,0.997912,0.587288,0.469666,-1.766664,0.99583,0.615296,...,-0.019076,0.0,0.691751,0.422688,0.021977,0.0,0.701494,0.410474,0.022933,0.0


In [44]:
df[df['class']=='bored']

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,bored,0.695377,0.535628,-1.015433,0.999973,0.739084,0.465467,-0.921336,0.999923,0.757140,...,0.004293,0.0,0.814340,0.477923,0.044335,0.0,0.823962,0.473417,0.046238,0.0
1,bored,0.696018,0.535825,-1.210933,0.999968,0.739245,0.466770,-1.107235,0.999913,0.757203,...,0.003373,0.0,0.812043,0.474216,0.043030,0.0,0.822170,0.468346,0.044998,0.0
2,bored,0.697035,0.535323,-1.354688,0.999961,0.739779,0.466585,-1.245109,0.999897,0.757645,...,0.002928,0.0,0.814081,0.472327,0.043676,0.0,0.823750,0.467295,0.045598,0.0
3,bored,0.697878,0.534776,-1.267635,0.999960,0.739979,0.466329,-1.154958,0.999894,0.757724,...,0.001868,0.0,0.812105,0.469181,0.043169,0.0,0.821586,0.464528,0.044996,0.0
4,bored,0.698973,0.534730,-1.391941,0.999957,0.740502,0.466326,-1.283805,0.999886,0.758008,...,0.001249,0.0,0.811591,0.469647,0.042169,0.0,0.821337,0.464461,0.044102,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
71,bored,0.409780,0.531581,-1.419889,0.999613,0.439118,0.435768,-1.349440,0.999451,0.467345,...,-0.011788,0.0,0.509624,0.394690,0.002514,0.0,0.515444,0.383800,0.002183,0.0
72,bored,0.409122,0.531547,-1.422530,0.999616,0.438394,0.435698,-1.352234,0.999449,0.466412,...,-0.011487,0.0,0.509005,0.393612,0.002568,0.0,0.514838,0.382499,0.002219,0.0
73,bored,0.408724,0.531562,-1.424697,0.999611,0.438113,0.435716,-1.354076,0.999432,0.466073,...,-0.011562,0.0,0.508239,0.393012,0.002389,0.0,0.514102,0.382055,0.002014,0.0
74,bored,0.408333,0.531742,-1.429652,0.999611,0.437818,0.435860,-1.357315,0.999423,0.465717,...,-0.011319,0.0,0.508091,0.392806,0.002513,0.0,0.513956,0.381661,0.002143,0.0


In [45]:
X = df.drop('class', axis=1) # features
y = df['class'] # target value

In [46]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=1234)

In [47]:
X_test

Unnamed: 0,x1,y1,z1,v1,x2,y2,z2,v2,x3,y3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
6,0.700977,0.533620,-1.268037,0.999953,0.741430,0.466068,-1.168045,0.999876,0.758658,0.474870,...,0.003144,0.0,0.814448,0.474732,0.043715,0.0,0.824404,0.469240,0.045777,0.0
205,0.509921,0.566921,-1.607367,0.995780,0.557617,0.466634,-1.571785,0.991621,0.587935,0.468518,...,-0.016974,0.0,0.666700,0.417279,0.020052,0.0,0.676614,0.407001,0.020668,0.0
104,0.555704,0.532025,-1.189480,0.997947,0.602077,0.431797,-1.139944,0.995565,0.630576,0.431712,...,-0.022973,0.0,0.688522,0.412085,0.012512,0.0,0.698962,0.399233,0.013379,0.0
31,0.725932,0.541631,-1.201730,0.999951,0.763936,0.469126,-1.091796,0.999876,0.779000,0.477223,...,0.007441,0.0,0.831648,0.481995,0.048415,0.0,0.841486,0.476432,0.050620,0.0
74,0.408333,0.531742,-1.429652,0.999611,0.437818,0.435860,-1.357315,0.999423,0.465717,0.429591,...,-0.011319,0.0,0.508091,0.392806,0.002513,0.0,0.513956,0.381661,0.002143,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
222,0.527006,0.558710,-1.484489,0.997755,0.571118,0.458342,-1.439286,0.995406,0.600523,0.458647,...,-0.023167,0.0,0.669184,0.426582,0.012891,0.0,0.678959,0.416112,0.013225,0.0
207,0.514222,0.563657,-1.484648,0.996096,0.560972,0.463264,-1.441353,0.992173,0.591246,0.465214,...,-0.017647,0.0,0.667296,0.413837,0.019024,0.0,0.677240,0.403065,0.019639,0.0
25,0.724741,0.539646,-1.185694,0.999949,0.762775,0.467780,-1.077408,0.999874,0.777926,0.475775,...,0.005931,0.0,0.828562,0.479450,0.045782,0.0,0.838415,0.473759,0.047890,0.0
163,0.532327,0.626052,-1.994306,0.998781,0.575829,0.521569,-1.965454,0.997111,0.605560,0.524029,...,-0.024665,0.0,0.696852,0.486231,0.019789,0.0,0.706344,0.474358,0.020856,0.0


## 3.2 Train Machine Learning Classification Model

In [48]:
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 

from sklearn.linear_model import LogisticRegression, RidgeClassifier
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [49]:
pipelines = {
    'lr':make_pipeline(StandardScaler(), LogisticRegression()),
    'rc':make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf':make_pipeline(StandardScaler(), RandomForestClassifier()),
    'gb':make_pipeline(StandardScaler(), GradientBoostingClassifier()),
}

In [50]:
fit_models = {}
for algo, pipeline in pipelines.items():
    model = pipeline.fit(X_train, y_train)
    fit_models[algo] = model

In [51]:
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rc': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('ridgeclassifier', RidgeClassifier())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())]),
 'gb': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('gradientboostingclassifier', GradientBoostingClassifier())])}

In [52]:
fit_models['rc'].predict(X_test)

array(['bored', 'sad', 'happy', 'bored', 'bored', 'bored', 'sad', 'sad',
       'bored', 'bored', 'happy', 'happy', 'bored', 'bored', 'bored',
       'bored', 'bored', 'bored', 'bored', 'sad', 'sad', 'happy', 'happy',
       'happy', 'sad', 'sad', 'sad', 'sad', 'happy', 'bored', 'bored',
       'bored', 'happy', 'happy', 'bored', 'happy', 'happy', 'happy',
       'sad', 'bored', 'happy', 'sad', 'bored', 'happy', 'sad', 'happy',
       'bored', 'sad', 'happy', 'bored', 'happy', 'sad', 'sad', 'happy',
       'happy', 'sad', 'sad', 'sad', 'happy', 'sad', 'sad', 'happy',
       'bored', 'sad', 'bored', 'sad', 'sad', 'bored', 'sad', 'happy'],
      dtype='<U5')

## 3.3 Evaluate and Serialize Model 

In [53]:
from sklearn.metrics import accuracy_score # Accuracy metrics 
import pickle 

In [54]:
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    print(algo, accuracy_score(y_test, yhat))

lr 1.0
rc 1.0
rf 1.0
gb 1.0


In [55]:
fit_models['rc'].predict(X_test)

array(['bored', 'sad', 'happy', 'bored', 'bored', 'bored', 'sad', 'sad',
       'bored', 'bored', 'happy', 'happy', 'bored', 'bored', 'bored',
       'bored', 'bored', 'bored', 'bored', 'sad', 'sad', 'happy', 'happy',
       'happy', 'sad', 'sad', 'sad', 'sad', 'happy', 'bored', 'bored',
       'bored', 'happy', 'happy', 'bored', 'happy', 'happy', 'happy',
       'sad', 'bored', 'happy', 'sad', 'bored', 'happy', 'sad', 'happy',
       'bored', 'sad', 'happy', 'bored', 'happy', 'sad', 'sad', 'happy',
       'happy', 'sad', 'sad', 'sad', 'happy', 'sad', 'sad', 'happy',
       'bored', 'sad', 'bored', 'sad', 'sad', 'bored', 'sad', 'happy'],
      dtype='<U5')

In [56]:
y_test

6      bored
205      sad
104    happy
31     bored
74     bored
       ...  
222      sad
207      sad
25     bored
163      sad
132    happy
Name: class, Length: 70, dtype: object

In [57]:
with open('model2.pkl', 'wb') as f:
    pickle.dump(fit_models['rf'], f)

# 4. Make Detections with Model

In [58]:
with open('model2.pkl', 'rb') as f:
    model = pickle.load(f)

In [59]:
model

In [60]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (use FACEMESH_TESSELATION)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concatenate rows
            row = pose_row + face_row
            
            # Make Detections
            X = pd.DataFrame([row])
            body_language_class = model.predict(X)[0]
            body_language_prob = model.predict_proba(X)[0]
            print(body_language_class, body_language_prob)
            
            # Grab ear coords
            coords = tuple(np.multiply(
                            np.array(
                                (results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
                                 results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y))
                        , [640,480]).astype(int))
            
            cv2.rectangle(image, 
                          (coords[0], coords[1]+5), 
                          (coords[0]+len(body_language_class)*20, coords[1]-30), 
                          (245, 117, 16), -1)
            cv2.putText(image, body_language_class, coords, 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Get status box
            cv2.rectangle(image, (0,0), (250, 60), (245, 117, 16), -1)
            
            # Display Class
            cv2.putText(image, 'CLASS', (95,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, body_language_class.split(' ')[0], (90,40), 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Display Probability
            cv2.putText(image, 'PROB', (15,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, str(round(body_language_prob[np.argmax(body_language_prob)],2)), 
                        (10,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()




bored [0.75 0.24 0.01]




bored [0.59 0.4  0.01]




bored [0.6  0.39 0.01]




bored [0.73 0.26 0.01]




bored [0.76 0.23 0.01]
bored [0.67 0.32 0.01]




bored [0.71 0.28 0.01]




bored [0.68 0.31 0.01]
bored [0.72 0.27 0.01]




bored [0.67 0.32 0.01]
bored [0.76 0.23 0.01]




bored [0.71 0.28 0.01]
bored [0.66 0.33 0.01]




bored [0.72 0.27 0.01]




bored [0.72 0.27 0.01]




bored [0.82 0.17 0.01]




bored [0.99 0.01 0.  ]




bored [0.96 0.04 0.  ]




bored [0.95 0.05 0.  ]
bored [0.95 0.05 0.  ]




bored [0.93 0.07 0.  ]




happy [0.47 0.51 0.02]




sad [0.13 0.27 0.6 ]




sad [0.11 0.02 0.87]




sad [0.1  0.01 0.89]
sad [0.08 0.01 0.91]




sad [0.08 0.01 0.91]




sad [0.08 0.01 0.91]




sad [0.08 0.01 0.91]




sad [0.11 0.01 0.88]
sad [0.11 0.01 0.88]




sad [0.11 0.01 0.88]




sad [0.11 0.01 0.88]




happy [0.11 0.82 0.07]




happy [0.13 0.84 0.03]




happy [0.17 0.8  0.03]




happy [0.46 0.53 0.01]




bored [0.52 0.47 0.01]




happy [0.35 0.63 0.02]




happy [0.28 0.7  0.02]




happy [0.31 0.67 0.02]




happy [0.32 0.66 0.02]




happy [0.38 0.6  0.02]


In [61]:
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(454, 202)