# 0. Install and Import Dependencies

In [30]:
!pip install mediapipe opencv-python pandas scikit-learn



In [31]:
import mediapipe as mp # Import mediapipe
import cv2 # Import opencv

In [32]:
mp_drawing = mp.solutions.drawing_utils # Drawing helpers
mp_holistic = mp.solutions.holistic # Mediapipe Solutions

# 1. Make Some Detections

In [33]:
import cv2
import mediapipe as mp

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Start capturing video from the webcam
cap = cv2.VideoCapture(0)

# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed to RGB for Mediapipe processing
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (no FACE_CONNECTIONS, just landmarks)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, 
                                      mp.solutions.holistic.FACEMESH_TESSELATION,  # Use FACEMESH_TESSELATION for face mesh connections
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))
        
        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))
        
        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Show the processed image
        cv2.imshow('Raw Webcam Feed', image)

        # Break the loop if 'q' is pressed
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

# Release the video capture object and close windows
cap.release()
cv2.destroyAllWindows()


In [22]:
import cv2
import mediapipe as mp
import os

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Path to input video
video_path = r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\Run.mp4'

# Specify output folder and file
output_folder = 'output_videos'
if not os.path.exists(output_folder):
    os.makedirs(output_folder)
output_video_path = os.path.join(output_folder, r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\RunProcessed.mp4')

# Start capturing video from the file
cap = cv2.VideoCapture(video_path)

# Get frame width, height, and FPS for saving the output video
frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
fps = int(cap.get(cv2.CAP_PROP_FPS))

# Define the codec and create VideoWriter object to save the video
fourcc = cv2.VideoWriter_fourcc(*'mp4v')
out = cv2.VideoWriter(output_video_path, fourcc, fps, (frame_width, frame_height))

# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    while cap.isOpened():
        ret, frame = cap.read()
        if not ret:
            break
        
        # Recolor Feed to RGB for Mediapipe processing
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, 
                                      mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))
        
        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))
        
        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Write the processed frame to the output video
        out.write(image)
        
        # Show the processed image (optional)
        cv2.imshow('Processed Video Feed', image)

        # Break the loop if 'q' is pressed
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

# Release the video capture and writer objects, and close windows
cap.release()
out.release()
cv2.destroyAllWindows()


In [34]:
results.pose_landmarks.landmark[0].visibility

0.8834391832351685

In [35]:
results.face_landmarks.landmark[0].visibility

0.0

In [37]:
print(results.face_landmarks.landmark[0])
results.face_landmarks.landmark[0].x

x: 0.6861182451248169
y: 0.4856717586517334
z: -0.042298201471567154



0.6861182451248169

# 2. Capture Landmarks & Export to CSV
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<!--<img src="https://i.imgur.com/AzKNp7A.png">-->
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<!--<img src="https://i.imgur.com/AzKNp7A.png">-->

In [38]:
import csv
import os
import numpy as np

In [39]:
num_coords = len(results.pose_landmarks.landmark)+len(results.face_landmarks.landmark)
num_coords

501

In [40]:
landmarks = ['class']
for val in range(1, num_coords+1):
    landmarks += ['x{}'.format(val), 'y{}'.format(val), 'z{}'.format(val), 'v{}'.format(val)]

In [41]:
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [42]:
with open('coords.csv', mode='w', newline='') as f:
    csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
    csv_writer.writerow(landmarks)

In [43]:
class_name = "cough"

In [78]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (use FACEMESH_TESSELATION)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concatenate rows
            row = pose_row + face_row
            
            # Append class name 
            row.insert(0, class_name)
            
            # Export to CSV
            with open('coords.csv', mode='a', newline='') as f:
                csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
                csv_writer.writerow(row) 
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()


# 3. Train Custom Model Using Scikit Learn

## 3.1 Read in Collected Data and Process

In [79]:
import pandas as pd
from sklearn.model_selection import train_test_split

In [80]:
df = pd.read_csv('coords.csv')

In [81]:
df.head()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,sad,0.553035,0.49889,-1.466447,0.999054,0.585991,0.426179,-1.390513,0.998633,0.607517,...,-0.01061,0.0,0.657822,0.401433,0.015453,0.0,0.664554,0.390399,0.01614,0.0
1,sad,0.459598,0.495241,-1.687205,0.999114,0.4875,0.422675,-1.67651,0.998759,0.508403,...,-0.02154,0.0,0.534175,0.406746,-0.02629,0.0,0.540744,0.392593,-0.02845,0.0
2,sad,0.465693,0.494824,-1.591422,0.999083,0.491563,0.422632,-1.562784,0.998722,0.511949,...,-0.017707,0.0,0.538163,0.404281,-0.018237,0.0,0.544776,0.391026,-0.019965,0.0
3,sad,0.475315,0.489554,-1.587022,0.999071,0.500395,0.419452,-1.544876,0.998745,0.519864,...,-0.0145,0.0,0.584368,0.392841,-0.001627,0.0,0.590864,0.379803,-0.002119,0.0
4,sad,0.545305,0.48389,-1.67704,0.999021,0.582484,0.413149,-1.606523,0.998665,0.604808,...,-0.006782,0.0,0.663153,0.400816,0.020523,0.0,0.669844,0.390941,0.021188,0.0


In [82]:
df.tail()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
59,cough,0.592634,0.559022,-1.379131,0.998987,0.624417,0.475038,-1.341297,0.998728,0.640185,...,-0.008509,0.0,0.718874,0.414894,0.025999,0.0,0.72541,0.403676,0.027455,0.0
60,cough,0.574677,0.509051,-1.27031,0.999355,0.605702,0.436911,-1.175613,0.999178,0.620231,...,-0.014935,0.0,0.694986,0.397888,0.016921,0.0,0.700621,0.387299,0.018126,0.0
61,cough,0.567858,0.503025,-1.324689,0.999494,0.602605,0.430036,-1.235161,0.999339,0.619402,...,-0.012861,0.0,0.693811,0.397174,0.021451,0.0,0.699528,0.387235,0.022801,0.0
62,cough,0.567101,0.502444,-1.222134,0.999523,0.60216,0.429532,-1.139177,0.999357,0.619373,...,-0.010614,0.0,0.691038,0.403482,0.02577,0.0,0.696649,0.393954,0.027233,0.0
63,cough,0.565351,0.500558,-1.227669,0.999557,0.601015,0.427727,-1.149352,0.999395,0.618935,...,-0.010845,0.0,0.693963,0.400383,0.02445,0.0,0.699429,0.3906,0.025888,0.0


In [83]:
df[df['class']=='sad']

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,sad,0.553035,0.49889,-1.466447,0.999054,0.585991,0.426179,-1.390513,0.998633,0.607517,...,-0.01061,0.0,0.657822,0.401433,0.015453,0.0,0.664554,0.390399,0.01614,0.0
1,sad,0.459598,0.495241,-1.687205,0.999114,0.4875,0.422675,-1.67651,0.998759,0.508403,...,-0.02154,0.0,0.534175,0.406746,-0.02629,0.0,0.540744,0.392593,-0.02845,0.0
2,sad,0.465693,0.494824,-1.591422,0.999083,0.491563,0.422632,-1.562784,0.998722,0.511949,...,-0.017707,0.0,0.538163,0.404281,-0.018237,0.0,0.544776,0.391026,-0.019965,0.0
3,sad,0.475315,0.489554,-1.587022,0.999071,0.500395,0.419452,-1.544876,0.998745,0.519864,...,-0.0145,0.0,0.584368,0.392841,-0.001627,0.0,0.590864,0.379803,-0.002119,0.0
4,sad,0.545305,0.48389,-1.67704,0.999021,0.582484,0.413149,-1.606523,0.998665,0.604808,...,-0.006782,0.0,0.663153,0.400816,0.020523,0.0,0.669844,0.390941,0.021188,0.0
5,sad,0.544347,0.482915,-1.613517,0.99907,0.582492,0.411865,-1.537072,0.998718,0.604813,...,-0.005397,0.0,0.665699,0.402594,0.02309,0.0,0.672079,0.392387,0.023854,0.0
6,sad,0.552304,0.483127,-1.651171,0.999057,0.590429,0.411894,-1.570296,0.998702,0.611478,...,0.00284,0.0,0.667921,0.358789,0.031032,0.0,0.67368,0.344718,0.032454,0.0
7,sad,0.553305,0.484776,-1.679841,0.999012,0.592359,0.413135,-1.602408,0.998641,0.613485,...,0.003031,0.0,0.671301,0.352839,0.033106,0.0,0.677452,0.340067,0.034441,0.0
8,sad,0.555947,0.484811,-1.633462,0.999031,0.594115,0.413506,-1.543746,0.998672,0.614406,...,0.00181,0.0,0.670451,0.351798,0.031609,0.0,0.67664,0.339026,0.032966,0.0
9,sad,0.557094,0.484562,-1.623167,0.999064,0.594656,0.413528,-1.529322,0.998739,0.614545,...,0.000836,0.0,0.675254,0.357856,0.031298,0.0,0.68151,0.344796,0.032792,0.0


In [84]:
X = df.drop('class', axis=1) # features
y = df['class'] # target value

In [85]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=1234)

In [86]:
X_test

Unnamed: 0,x1,y1,z1,v1,x2,y2,z2,v2,x3,y3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
22,0.556,0.482466,-1.661009,0.999106,0.593846,0.413191,-1.570206,0.998886,0.613877,0.41879,...,0.000914,0.0,0.679897,0.37247,0.031986,0.0,0.685991,0.362271,0.033453,0.0
32,0.56585,0.513967,-1.60753,0.999353,0.59899,0.438952,-1.531564,0.999163,0.615548,0.444124,...,-0.016522,0.0,0.66072,0.393902,-7.6e-05,0.0,0.669269,0.382828,-0.00016,0.0
33,0.565777,0.513796,-1.554085,0.999394,0.599268,0.438921,-1.474537,0.99922,0.616131,0.44407,...,-0.016554,0.0,0.659515,0.395319,-0.001157,0.0,0.668187,0.38431,-0.001188,0.0
8,0.555947,0.484811,-1.633462,0.999031,0.594115,0.413506,-1.543746,0.998672,0.614406,0.418032,...,0.00181,0.0,0.670451,0.351798,0.031609,0.0,0.67664,0.339026,0.032966,0.0
6,0.552304,0.483127,-1.651171,0.999057,0.590429,0.411894,-1.570296,0.998702,0.611478,0.415757,...,0.00284,0.0,0.667921,0.358789,0.031032,0.0,0.67368,0.344718,0.032454,0.0
56,0.570374,0.502859,-1.338266,0.998419,0.600457,0.43154,-1.277196,0.997912,0.615644,0.435741,...,-0.010408,0.0,0.702587,0.398507,0.02543,0.0,0.708661,0.386651,0.027039,0.0
40,0.53495,0.503335,-1.525194,0.99936,0.571772,0.434327,-1.472899,0.999242,0.588589,0.440122,...,-0.019426,0.0,0.607345,0.388919,-0.021011,0.0,0.617014,0.378802,-0.022521,0.0
20,0.555962,0.481989,-1.694436,0.999161,0.593885,0.412817,-1.610087,0.998951,0.613909,0.418195,...,9.9e-05,0.0,0.678428,0.366941,0.031144,0.0,0.684593,0.356021,0.032547,0.0
4,0.545305,0.48389,-1.67704,0.999021,0.582484,0.413149,-1.606523,0.998665,0.604808,0.417344,...,-0.006782,0.0,0.663153,0.400816,0.020523,0.0,0.669844,0.390941,0.021188,0.0
21,0.55596,0.483312,-1.74983,0.999122,0.593863,0.413627,-1.6635,0.99891,0.613896,0.419145,...,-0.000641,0.0,0.679801,0.366996,0.030828,0.0,0.685866,0.356388,0.032242,0.0


## 3.2 Train Machine Learning Classification Model

In [87]:
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 

from sklearn.linear_model import LogisticRegression, RidgeClassifier
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [88]:
pipelines = {
    'lr':make_pipeline(StandardScaler(), LogisticRegression()),
    'rc':make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf':make_pipeline(StandardScaler(), RandomForestClassifier()),
    'gb':make_pipeline(StandardScaler(), GradientBoostingClassifier()),
}

In [89]:
fit_models = {}
for algo, pipeline in pipelines.items():
    model = pipeline.fit(X_train, y_train)
    fit_models[algo] = model

In [90]:
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rc': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('ridgeclassifier', RidgeClassifier())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())]),
 'gb': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('gradientboostingclassifier', GradientBoostingClassifier())])}

In [91]:
fit_models['rc'].predict(X_test)

array(['sad', 'happy', 'happy', 'sad', 'sad', 'cough', 'happy', 'sad',
       'sad', 'sad', 'cough', 'cough', 'happy', 'sad', 'happy', 'cough',
       'happy', 'sad', 'happy', 'cough'], dtype='<U5')

## 3.3 Evaluate and Serialize Model 

In [92]:
from sklearn.metrics import accuracy_score # Accuracy metrics 
import pickle 

In [93]:
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    print(algo, accuracy_score(y_test, yhat))

lr 1.0
rc 1.0
rf 1.0
gb 0.95


In [94]:
fit_models['rc'].predict(X_test)

array(['sad', 'happy', 'happy', 'sad', 'sad', 'cough', 'happy', 'sad',
       'sad', 'sad', 'cough', 'cough', 'happy', 'sad', 'happy', 'cough',
       'happy', 'sad', 'happy', 'cough'], dtype='<U5')

In [95]:
y_test

22      sad
32    happy
33    happy
8       sad
6       sad
56    cough
40    happy
20      sad
4       sad
21      sad
50    cough
54    cough
29    happy
18      sad
45    happy
55    cough
36    happy
13      sad
25    happy
57    cough
Name: class, dtype: object

In [96]:
with open('body_language.pkl', 'wb') as f:
    pickle.dump(fit_models['rf'], f)

# 4. Make Detections with Model

In [114]:
with open('body_language.pkl', 'rb') as f:
    model = pickle.load(f)

In [115]:
model

In [118]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks (use FACEMESH_TESSELATION)
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp.solutions.holistic.FACEMESH_TESSELATION, 
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
        
        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concatenate rows
            row = pose_row + face_row
            
            # Make Detections
            X = pd.DataFrame([row])
            body_language_class = model.predict(X)[0]
            body_language_prob = model.predict_proba(X)[0]
            print(body_language_class, body_language_prob)
            
            # Grab ear coords
            coords = tuple(np.multiply(
                            np.array(
                                (results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
                                 results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y))
                        , [640,480]).astype(int))
            
            cv2.rectangle(image, 
                          (coords[0], coords[1]+5), 
                          (coords[0]+len(body_language_class)*20, coords[1]-30), 
                          (245, 117, 16), -1)
            cv2.putText(image, body_language_class, coords, 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Get status box
            cv2.rectangle(image, (0,0), (250, 60), (245, 117, 16), -1)
            
            # Display Class
            cv2.putText(image, 'CLASS', (95,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, body_language_class.split(' ')[0], (90,40), 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Display Probability
            cv2.putText(image, 'PROB', (15,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, str(round(body_language_prob[np.argmax(body_language_prob)],2)), 
                        (10,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()




happy [0.34 0.58 0.08]
happy [0.3  0.49 0.21]




happy [0.31 0.49 0.2 ]
happy [0.31 0.47 0.22]




happy [0.32 0.46 0.22]
happy [0.26 0.53 0.21]




happy [0.27 0.53 0.2 ]
happy [0.23 0.51 0.26]




happy [0.24 0.51 0.25]
happy [0.24 0.51 0.25]




happy [0.28 0.5  0.22]
happy [0.23 0.54 0.23]




happy [0.22 0.52 0.26]
happy [0.3  0.47 0.23]




happy [0.24 0.5  0.26]
happy [0.24 0.5  0.26]




happy [0.24 0.52 0.24]




cough [0.43 0.35 0.22]
cough [0.42 0.35 0.23]




happy [0.35 0.45 0.2 ]
happy [0.34 0.48 0.18]




happy [0.35 0.48 0.17]
happy [0.33 0.48 0.19]
happy [0.34 0.45 0.21]




happy [0.35 0.44 0.21]
cough [0.4  0.39 0.21]




cough [0.45 0.34 0.21]
cough [0.45 0.32 0.23]




cough [0.42 0.33 0.25]
cough [0.43 0.32 0.25]




cough [0.43 0.34 0.23]
cough [0.43 0.37 0.2 ]




cough [0.43 0.35 0.22]
happy [0.4  0.41 0.19]




cough [0.41 0.37 0.22]
cough [0.4  0.39 0.21]




cough [0.41 0.39 0.2 ]
cough [0.41 0.38 0.21]




cough [0.39 0.39 0.22]
cough [0.4 0.4 0.2]




cough [0.4  0.39 0.21]
cough [0.41 0.37 0.22]




cough [0.42 0.36 0.22]
cough [0.42 0.36 0.22]




cough [0.4  0.39 0.21]
cough [0.43 0.35 0.22]




cough [0.4  0.38 0.22]
cough [0.4  0.39 0.21]




happy [0.4  0.41 0.19]
cough [0.41 0.4  0.19]




cough [0.41 0.4  0.19]
happy [0.39 0.41 0.2 ]




happy [0.36 0.45 0.19]
happy [0.35 0.47 0.18]




happy [0.32 0.47 0.21]
happy [0.36 0.47 0.17]




happy [0.34 0.45 0.21]




happy [0.33 0.45 0.22]
happy [0.37 0.41 0.22]




cough [0.39 0.38 0.23]
cough [0.48 0.27 0.25]




cough [0.54 0.2  0.26]
cough [0.55 0.2  0.25]




cough [0.59 0.16 0.25]
cough [0.63 0.12 0.25]




cough [0.59 0.14 0.27]
cough [0.55 0.17 0.28]




cough [0.43 0.35 0.22]
happy [0.35 0.42 0.23]




happy [0.33 0.48 0.19]
happy [0.34 0.46 0.2 ]




happy [0.33 0.46 0.21]
happy [0.36 0.44 0.2 ]




happy [0.34 0.44 0.22]
happy [0.34 0.45 0.21]




happy [0.34 0.46 0.2 ]
happy [0.33 0.47 0.2 ]




happy [0.32 0.46 0.22]
happy [0.33 0.45 0.22]




happy [0.37 0.42 0.21]
happy [0.38 0.45 0.17]




happy [0.37 0.43 0.2 ]
happy [0.37 0.45 0.18]




cough [0.41 0.38 0.21]
happy [0.39 0.4  0.21]




cough [0.41 0.41 0.18]
cough [0.4 0.4 0.2]




cough [0.42 0.38 0.2 ]
cough [0.43 0.38 0.19]




cough [0.43 0.38 0.19]
happy [0.39 0.4  0.21]




happy [0.4  0.42 0.18]
happy [0.38 0.43 0.19]




cough [0.43 0.36 0.21]
cough [0.42 0.35 0.23]




happy [0.17 0.58 0.25]




sad [0.12 0.34 0.54]




sad [0.12 0.41 0.47]
sad [0.13 0.34 0.53]




sad [0.15 0.29 0.56]
sad [0.13 0.28 0.59]




sad [0.13 0.29 0.58]
sad [0.14 0.21 0.65]




sad [0.13 0.28 0.59]
sad [0.15 0.28 0.57]




sad [0.15 0.33 0.52]
sad [0.12 0.38 0.5 ]




sad [0.13 0.38 0.49]
sad [0.12 0.38 0.5 ]




sad [0.13 0.37 0.5 ]
sad [0.13 0.38 0.49]




sad [0.13 0.39 0.48]
sad [0.13 0.28 0.59]




sad [0.12 0.37 0.51]
sad [0.12 0.37 0.51]




cough [0.41 0.41 0.18]




cough [0.47 0.32 0.21]
cough [0.46 0.33 0.21]




cough [0.42 0.39 0.19]
cough [0.52 0.24 0.24]




cough [0.56 0.2  0.24]




cough [0.56 0.19 0.25]
cough [0.59 0.19 0.22]




cough [0.6  0.18 0.22]
cough [0.61 0.2  0.19]




cough [0.61 0.19 0.2 ]
cough [0.61 0.19 0.2 ]




cough [0.6 0.2 0.2]
cough [0.6  0.18 0.22]




cough [0.58 0.19 0.23]




cough [0.58 0.19 0.23]
cough [0.56 0.2  0.24]




cough [0.6  0.18 0.22]
cough [0.56 0.18 0.26]




cough [0.58 0.18 0.24]
cough [0.41 0.4  0.19]




happy [0.34 0.48 0.18]


In [119]:
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(442, 225)