# 0. Install and Import Dependencies

In [30]:
!pip install mediapipe opencv-python pandas scikit-learn



In [1]:
import mediapipe as mp # Import mediapipe
import cv2 # Import opencv

In [2]:
mp_drawing = mp.solutions.drawing_utils # Drawing helpers
mp_holistic = mp.solutions.holistic # Mediapipe Solutions

# 1. Make Some Detections

In [4]:
import cv2
import mediapipe as mp

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Start capturing video from the webcam
cap = cv2.VideoCapture(0)

# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed to RGB for Mediapipe processing
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (no FACE_CONNECTIONS, just landmarks)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, 
                                      mp.solutions.holistic.FACEMESH_TESSELATION,  # Use FACEMESH_TESSELATION for face mesh connections
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))
        
        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))
        
        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Show the processed image
        cv2.imshow('Raw Webcam Feed', image)

        # Break the loop if 'q' is pressed
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

# Release the video capture object and close windows
cap.release()
cv2.destroyAllWindows()


In [5]:
import cv2
import mediapipe as mp
import os

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Path to input video
video_path = r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\Vid3.mp4'

# Specify output folder and file
output_folder = 'output_videos'
if not os.path.exists(output_folder):
    os.makedirs(output_folder)
output_video_path = os.path.join(output_folder, r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\Vid3Processed.mp4')

# Start capturing video from the file
cap = cv2.VideoCapture(video_path)

# Get frame width, height, and FPS for saving the output video
frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
fps = int(cap.get(cv2.CAP_PROP_FPS))

# Define the codec and create VideoWriter object to save the video
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter(output_video_path, fourcc, fps, (frame_width, frame_height))

# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    while cap.isOpened():
        ret, frame = cap.read()
        if not ret:
            break
        
        # Recolor Feed to RGB for Mediapipe processing
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, 
                                      mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))
        
        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))
        
        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Write the processed frame to the output video
        out.write(image)
        
        # Show the processed image (optional)
        cv2.imshow('Processed Video Feed', image)

        # Break the loop if 'q' is pressed
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

# Release the video capture and writer objects, and close windows
cap.release()
out.release()
cv2.destroyAllWindows()


In [5]:
results.pose_landmarks.landmark[0].visibility

0.999747633934021

In [6]:
results.face_landmarks.landmark[0].visibility

0.0

In [7]:
print(results.face_landmarks.landmark[0])
results.face_landmarks.landmark[0].x

x: 0.5599642992019653
y: 0.4843197762966156
z: -0.05199878662824631



0.5599642992019653

# 2. Capture Landmarks & Export to CSV
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<!--<img src="https://i.imgur.com/AzKNp7A.png">-->
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<img src="https://i.imgur.com/AzKNp7A.png">

In [8]:
import csv
import os
import numpy as np

In [9]:
num_coords = len(results.pose_landmarks.landmark)+len(results.face_landmarks.landmark)
num_coords

501

In [10]:
landmarks = ['class']
for val in range(1, num_coords+1):
    landmarks += ['x{}'.format(val), 'y{}'.format(val), 'z{}'.format(val), 'v{}'.format(val)]

In [11]:
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [18]:
with open('coords1.csv', mode='w', newline='') as f:
    csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
    csv_writer.writerow(landmarks)

In [22]:
class_name = "sad"

In [23]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (use FACEMESH_TESSELATION)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concatenate rows
            row = pose_row + face_row
            
            # Append class name 
            row.insert(0, class_name)
            
            # Export to CSV
            with open('coords1.csv', mode='a', newline='') as f:
                csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
                csv_writer.writerow(row) 
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()


# 3. Train Custom Model Using Scikit Learn

## 3.1 Read in Collected Data and Process

In [24]:
import pandas as pd
from sklearn.model_selection import train_test_split

In [25]:
df = pd.read_csv('coords1.csv')

In [26]:
df.head()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,bored,0.694425,0.352597,-0.976673,0.999997,0.736778,0.297052,-0.887116,0.999994,0.751022,...,0.000773,0.0,0.80006,0.310798,0.035983,0.0,0.808742,0.307553,0.037656,0.0
1,bored,0.703496,0.352618,-1.023966,0.999997,0.742252,0.296995,-0.926303,0.999993,0.756884,...,0.00255,0.0,0.801517,0.310639,0.038213,0.0,0.810123,0.306749,0.039845,0.0
2,bored,0.706086,0.35219,-0.99668,0.999997,0.744198,0.296603,-0.899047,0.999993,0.759114,...,0.002594,0.0,0.798954,0.310396,0.038584,0.0,0.807744,0.306233,0.040279,0.0
3,bored,0.698201,0.351792,-1.010329,0.999996,0.73573,0.296363,-0.915542,0.999992,0.752029,...,0.002823,0.0,0.78425,0.317261,0.037959,0.0,0.793174,0.312882,0.039717,0.0
4,bored,0.690306,0.351668,-1.100166,0.999996,0.727081,0.296299,-1.002947,0.999992,0.744378,...,0.000848,0.0,0.779506,0.318352,0.035752,0.0,0.788316,0.314476,0.037358,0.0


In [27]:
df.tail()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
234,sad,0.561855,0.462289,-1.557456,0.999888,0.600518,0.373373,-1.511698,0.999705,0.625138,...,-0.019291,0.0,0.652669,0.377001,0.006581,0.0,0.658384,0.369852,0.006854,0.0
235,sad,0.562187,0.465611,-1.567497,0.99989,0.600602,0.376257,-1.521221,0.999709,0.625194,...,-0.021074,0.0,0.653176,0.374369,0.003752,0.0,0.658856,0.367696,0.003865,0.0
236,sad,0.562579,0.466379,-1.547644,0.999894,0.600685,0.376944,-1.502247,0.99972,0.625277,...,-0.02121,0.0,0.654468,0.374081,0.003786,0.0,0.660139,0.367363,0.003872,0.0
237,sad,0.562673,0.467256,-1.526024,0.999895,0.600747,0.377724,-1.496971,0.999723,0.625322,...,-0.020912,0.0,0.65452,0.373876,0.004131,0.0,0.660181,0.366999,0.004222,0.0
238,sad,0.563302,0.4676,-1.506186,0.999894,0.601059,0.378289,-1.476859,0.99972,0.625542,...,-0.020453,0.0,0.653945,0.37365,0.005079,0.0,0.659624,0.366633,0.005235,0.0


In [29]:
df[df['class']=='bored']

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,bored,0.694425,0.352597,-0.976673,0.999997,0.736778,0.297052,-0.887116,0.999994,0.751022,...,0.000773,0.0,0.800060,0.310798,0.035983,0.0,0.808742,0.307553,0.037656,0.0
1,bored,0.703496,0.352618,-1.023966,0.999997,0.742252,0.296995,-0.926303,0.999993,0.756884,...,0.002550,0.0,0.801517,0.310639,0.038213,0.0,0.810123,0.306749,0.039845,0.0
2,bored,0.706086,0.352190,-0.996680,0.999997,0.744198,0.296603,-0.899047,0.999993,0.759114,...,0.002594,0.0,0.798954,0.310396,0.038584,0.0,0.807744,0.306233,0.040279,0.0
3,bored,0.698201,0.351792,-1.010329,0.999996,0.735730,0.296363,-0.915542,0.999992,0.752029,...,0.002823,0.0,0.784250,0.317261,0.037959,0.0,0.793174,0.312882,0.039717,0.0
4,bored,0.690306,0.351668,-1.100166,0.999996,0.727081,0.296299,-1.002947,0.999992,0.744378,...,0.000848,0.0,0.779506,0.318352,0.035752,0.0,0.788316,0.314476,0.037358,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
113,bored,0.457134,0.386801,-1.502363,0.999937,0.489515,0.303442,-1.433758,0.999853,0.515754,...,-0.015792,0.0,0.545208,0.279116,0.002231,0.0,0.551421,0.269484,0.002392,0.0
114,bored,0.456926,0.387755,-1.462176,0.999937,0.489446,0.304027,-1.394551,0.999854,0.516117,...,-0.015957,0.0,0.548348,0.279135,0.002580,0.0,0.554459,0.269513,0.002739,0.0
115,bored,0.456814,0.387789,-1.410782,0.999936,0.489377,0.304029,-1.343379,0.999853,0.516305,...,-0.016126,0.0,0.549584,0.277376,0.002738,0.0,0.555512,0.267955,0.002884,0.0
116,bored,0.456622,0.387769,-1.350590,0.999933,0.489169,0.303983,-1.284831,0.999847,0.516097,...,-0.015099,0.0,0.546089,0.275018,0.003790,0.0,0.551901,0.266118,0.003827,0.0


In [30]:
X = df.drop('class', axis=1) # features
y = df['class'] # target value

In [31]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=1234)

In [32]:
X_test

Unnamed: 0,x1,y1,z1,v1,x2,y2,z2,v2,x3,y3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
93,0.468520,0.385747,-1.379474,0.999955,0.500877,0.300105,-1.312755,0.999894,0.528273,0.291912,...,-0.019063,0.0,0.554017,0.279259,-0.001907,0.0,0.559818,0.271301,-0.002192,0.0
92,0.468497,0.385415,-1.370816,0.999955,0.500833,0.299252,-1.305767,0.999893,0.528228,0.291164,...,-0.018955,0.0,0.552442,0.278263,-0.000969,0.0,0.558239,0.270909,-0.001229,0.0
31,0.714048,0.350654,-1.111664,0.999993,0.752616,0.293404,-1.012097,0.999987,0.767830,0.299694,...,-0.001599,0.0,0.801553,0.307743,0.030660,0.0,0.810749,0.303455,0.032013,0.0
40,0.711681,0.351736,-1.006486,0.999993,0.748593,0.293364,-0.920763,0.999987,0.763279,0.299487,...,-0.002572,0.0,0.801621,0.305910,0.029480,0.0,0.810696,0.301901,0.030720,0.0
220,0.562103,0.426140,-1.286074,0.999848,0.601837,0.344829,-1.230263,0.999611,0.626630,0.341864,...,-0.013884,0.0,0.652080,0.337389,0.013957,0.0,0.657961,0.331684,0.014348,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
179,0.385755,0.421586,-0.654067,0.999560,0.428014,0.350954,-0.726972,0.998834,0.448691,0.345941,...,-0.018769,0.0,0.449630,0.340673,-0.053870,0.0,0.455768,0.332731,-0.058386,0.0
168,0.393135,0.422759,-0.655401,0.999670,0.433418,0.352269,-0.714543,0.999104,0.453114,0.347320,...,-0.020063,0.0,0.455219,0.339812,-0.055535,0.0,0.461574,0.331528,-0.060089,0.0
181,0.410346,0.428461,-0.818742,0.999540,0.446225,0.353593,-0.868136,0.998753,0.467521,0.347836,...,-0.020777,0.0,0.508739,0.340945,-0.043273,0.0,0.515283,0.328882,-0.046553,0.0
22,0.716191,0.350627,-1.021315,0.999994,0.756097,0.294446,-0.928348,0.999988,0.772471,0.301772,...,-0.001018,0.0,0.820290,0.308112,0.032783,0.0,0.829120,0.304075,0.034267,0.0


## 3.2 Train Machine Learning Classification Model

In [33]:
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 

from sklearn.linear_model import LogisticRegression, RidgeClassifier
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [34]:
pipelines = {
    'lr':make_pipeline(StandardScaler(), LogisticRegression()),
    'rc':make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf':make_pipeline(StandardScaler(), RandomForestClassifier()),
    'gb':make_pipeline(StandardScaler(), GradientBoostingClassifier()),
}

In [35]:
fit_models = {}
for algo, pipeline in pipelines.items():
    model = pipeline.fit(X_train, y_train)
    fit_models[algo] = model

In [36]:
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rc': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('ridgeclassifier', RidgeClassifier())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())]),
 'gb': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('gradientboostingclassifier', GradientBoostingClassifier())])}

In [37]:
fit_models['rc'].predict(X_test)

array(['bored', 'bored', 'bored', 'bored', 'sad', 'bored', 'bored', 'sad',
       'bored', 'bored', 'bored', 'sad', 'sad', 'bored', 'sad', 'sad',
       'bored', 'sad', 'bored', 'sad', 'bored', 'bored', 'bored', 'bored',
       'bored', 'bored', 'sad', 'sad', 'bored', 'sad', 'bored', 'sad',
       'bored', 'sad', 'bored', 'sad', 'sad', 'bored', 'bored', 'sad',
       'sad', 'bored', 'sad', 'sad', 'bored', 'sad', 'sad', 'bored',
       'bored', 'sad', 'bored', 'sad', 'bored', 'bored', 'sad', 'sad',
       'sad', 'sad', 'sad', 'sad', 'bored', 'bored', 'bored', 'sad',
       'bored', 'sad', 'bored', 'sad', 'sad', 'sad', 'bored', 'sad'],
      dtype='<U5')

## 3.3 Evaluate and Serialize Model 

In [38]:
from sklearn.metrics import accuracy_score # Accuracy metrics 
import pickle 

In [39]:
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    print(algo, accuracy_score(y_test, yhat))

lr 1.0
rc 1.0
rf 1.0
gb 1.0


In [43]:
fit_models['rc'].predict(X_test)

array(['bored', 'bored', 'bored', 'bored', 'sad', 'bored', 'bored', 'sad',
       'bored', 'bored', 'bored', 'sad', 'sad', 'bored', 'sad', 'sad',
       'bored', 'sad', 'bored', 'sad', 'bored', 'bored', 'bored', 'bored',
       'bored', 'bored', 'sad', 'sad', 'bored', 'sad', 'bored', 'sad',
       'bored', 'sad', 'bored', 'sad', 'sad', 'bored', 'bored', 'sad',
       'sad', 'bored', 'sad', 'sad', 'bored', 'sad', 'sad', 'bored',
       'bored', 'sad', 'bored', 'sad', 'bored', 'bored', 'sad', 'sad',
       'sad', 'sad', 'sad', 'sad', 'bored', 'bored', 'bored', 'sad',
       'bored', 'sad', 'bored', 'sad', 'sad', 'sad', 'bored', 'sad'],
      dtype='<U5')

In [44]:
y_test

93     bored
92     bored
31     bored
40     bored
220      sad
       ...  
179      sad
168      sad
181      sad
22     bored
144      sad
Name: class, Length: 72, dtype: object

In [45]:
with open('model1.pkl', 'wb') as f:
    pickle.dump(fit_models['rf'], f)

# 4. Make Detections with Model

In [46]:
with open('model1.pkl', 'rb') as f:
    model = pickle.load(f)

In [47]:
model

In [50]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (use FACEMESH_TESSELATION)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concatenate rows
            row = pose_row + face_row
            
            # Make Detections
            X = pd.DataFrame([row])
            body_language_class = model.predict(X)[0]
            body_language_prob = model.predict_proba(X)[0]
            print(body_language_class, body_language_prob)
            
            # Grab ear coords
            coords = tuple(np.multiply(
                            np.array(
                                (results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
                                 results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y))
                        , [640,480]).astype(int))
            
            cv2.rectangle(image, 
                          (coords[0], coords[1]+5), 
                          (coords[0]+len(body_language_class)*20, coords[1]-30), 
                          (245, 117, 16), -1)
            cv2.putText(image, body_language_class, coords, 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Get status box
            cv2.rectangle(image, (0,0), (250, 60), (245, 117, 16), -1)
            
            # Display Class
            cv2.putText(image, 'CLASS', (95,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, body_language_class.split(' ')[0], (90,40), 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Display Probability
            cv2.putText(image, 'PROB', (15,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, str(round(body_language_prob[np.argmax(body_language_prob)],2)), 
                        (10,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()




sad [0.02 0.98]




sad [0.03 0.97]
sad [0.04 0.96]




sad [0.04 0.96]




sad [0.03 0.97]




sad [0.01 0.99]




sad [0.01 0.99]
sad [0. 1.]




sad [0. 1.]
sad [0. 1.]




sad [0. 1.]




sad [0. 1.]




sad [0. 1.]
sad [0. 1.]




sad [0. 1.]




sad [0. 1.]




sad [0.11 0.89]




sad [0.16 0.84]
sad [0.17 0.83]




sad [0.19 0.81]




sad [0.2 0.8]




sad [0.21 0.79]




sad [0.25 0.75]




sad [0.26 0.74]




sad [0.26 0.74]
sad [0.28 0.72]




sad [0.28 0.72]




sad [0.27 0.73]




sad [0.26 0.74]
sad [0.26 0.74]
sad [0.26 0.74]




sad [0.26 0.74]




sad [0.25 0.75]
sad [0.23 0.77]




sad [0.25 0.75]
sad [0.3 0.7]




sad [0.3 0.7]




sad [0.3 0.7]
sad [0.31 0.69]




sad [0.34 0.66]
sad [0.37 0.63]




sad [0.49 0.51]
bored [0.56 0.44]




bored [0.54 0.46]
bored [0.52 0.48]




bored [0.51 0.49]
bored [0.5 0.5]




sad [0.49 0.51]




sad [0.47 0.53]
sad [0.47 0.53]




sad [0.47 0.53]
sad [0.46 0.54]




sad [0.46 0.54]
sad [0.43 0.57]




sad [0.41 0.59]
sad [0.37 0.63]




sad [0.37 0.63]




sad [0.34 0.66]
sad [0.33 0.67]
sad [0.25 0.75]




sad [0.23 0.77]
sad [0.23 0.77]




sad [0.22 0.78]
sad [0.21 0.79]




sad [0.21 0.79]




sad [0.21 0.79]
sad [0.21 0.79]




sad [0.21 0.79]




sad [0.21 0.79]




sad [0.25 0.75]




sad [0.48 0.52]




bored [0.51 0.49]




bored [0.5 0.5]
bored [0.5 0.5]




sad [0.49 0.51]
bored [0.5 0.5]




bored [0.5 0.5]
bored [0.5 0.5]




bored [0.5 0.5]




bored [0.5 0.5]




bored [0.5 0.5]
bored [0.5 0.5]




bored [0.51 0.49]




sad [0.49 0.51]
sad [0.47 0.53]




sad [0.47 0.53]




sad [0.43 0.57]




sad [0.43 0.57]




sad [0.44 0.56]




sad [0.43 0.57]




sad [0.43 0.57]




sad [0.45 0.55]
sad [0.44 0.56]
sad [0.44 0.56]




sad [0.44 0.56]
sad [0.43 0.57]




sad [0.44 0.56]




sad [0.44 0.56]




sad [0.25 0.75]




sad [0.21 0.79]
sad [0.19 0.81]




sad [0.19 0.81]
sad [0.18 0.82]




In [51]:
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(415, 201)