# 0. Install and Import Dependencies

In [30]:
!pip install mediapipe opencv-python pandas scikit-learn



In [1]:
import mediapipe as mp # Import mediapipe
import cv2 # Import opencv

In [2]:
# Short aliases for the two MediaPipe sub-modules used by every cell below
mp_drawing = mp.solutions.drawing_utils # Drawing helpers
mp_holistic = mp.solutions.holistic # Mediapipe Solutions

# 1. Make Some Detections

In [3]:
import cv2
import mediapipe as mp

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Start capturing video from the webcam (device index 0)
cap = cv2.VideoCapture(0)

try:
    # Initiate holistic model
    with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                # The read failed (camera unplugged / busy): `frame` is not a
                # usable image, so stop instead of crashing inside cvtColor.
                break

            # Recolor Feed to RGB for Mediapipe processing
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Make Detections
            results = holistic.process(image)

            # Recolor image back to BGR for rendering
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Draw face landmarks joined by the face-mesh tessellation
            if results.face_landmarks:
                mp_drawing.draw_landmarks(image, results.face_landmarks,
                                          mp_holistic.FACEMESH_TESSELATION,
                                          mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                          # channel values are 8-bit, so 255 is the maximum
                                          mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1))

            # 2. Right hand
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

            # 3. Left Hand
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

            # 4. Pose Detections
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

            # Show the processed image
            cv2.imshow('Raw Webcam Feed', image)

            # Break the loop if 'q' is pressed
            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the preview window, even when the loop
    # above raised or the kernel was interrupted.
    cap.release()
    cv2.destroyAllWindows()


In [102]:
import cv2
import mediapipe as mp
import os

# Initialize mediapipe holistic model and drawing utilities
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Path to input video
# NOTE(review): machine-specific absolute path; point this at your own clip.
video_path = r'C:\Users\Admin\Downloads\Body Language Detection with mediapipe\output_videos\Vid3.mp4'

# Specify output folder and file.
# The file name must be relative: os.path.join() discards `output_folder`
# when the second component is an absolute path, so the folder created here
# and the location actually written to would not match.
output_folder = 'output_videos'
os.makedirs(output_folder, exist_ok=True)
output_video_path = os.path.join(output_folder, 'Vid3Processed.mp4')

# Start capturing video from the file
cap = cv2.VideoCapture(video_path)
out = None

try:
    if not cap.isOpened():
        raise IOError('Could not open input video: {}'.format(video_path))

    # Get frame width, height, and FPS for saving the output video
    frame_width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
    frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
    # Keep the fractional frame rate (e.g. 29.97) and fall back to 30 when the
    # container does not report one; a rate of 0 makes the writer unusable.
    fps = cap.get(cv2.CAP_PROP_FPS) or 30.0

    # Define the codec and create VideoWriter object to save the video
    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
    out = cv2.VideoWriter(output_video_path, fourcc, fps, (frame_width, frame_height))
    if not out.isOpened():
        raise IOError('Could not open output video for writing: {}'.format(output_video_path))

    # Initiate holistic model
    with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:
        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                # End of file (or a decode failure): nothing more to process
                break

            # Recolor Feed to RGB for Mediapipe processing
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Make Detections
            results = holistic.process(image)

            # Recolor image back to BGR for rendering
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Draw face landmarks joined by the face-mesh tessellation
            if results.face_landmarks:
                mp_drawing.draw_landmarks(image, results.face_landmarks,
                                          mp_holistic.FACEMESH_TESSELATION,
                                          mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                          # channel values are 8-bit, so 255 is the maximum
                                          mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1))

            # 2. Right hand
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

            # 3. Left Hand
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

            # 4. Pose Detections
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

            # Write the processed frame to the output video
            out.write(image)

            # Show the processed image (optional)
            cv2.imshow('Processed Video Feed', image)

            # Break the loop if 'q' is pressed
            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Release the video capture and writer objects, and close windows, even if
    # processing failed part-way (otherwise the output file is left unfinalised).
    cap.release()
    if out is not None:
        out.release()
    cv2.destroyAllWindows()


In [4]:
# Visibility score of the first pose landmark in the most recent `results`
results.pose_landmarks.landmark[0].visibility

0.9956830143928528

In [5]:
# Same field on the first face landmark; the recorded output for this cell is 0.0
results.face_landmarks.landmark[0].visibility

0.0

In [6]:
# Print the whole first face landmark, then display its x coordinate on its own
print(results.face_landmarks.landmark[0])
results.face_landmarks.landmark[0].x

x: 0.7129311561584473
y: 0.5160745978355408
z: -0.038663674145936966



0.7129311561584473

# 2. Capture Landmarks & Export to CSV
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<!--<img src="https://i.imgur.com/AzKNp7A.png">-->
<!--<img src="https://i.imgur.com/8bForKY.png">-->
<img src="https://i.imgur.com/AzKNp7A.png">

In [7]:
import csv
import os
import numpy as np

In [8]:
# Number of landmarks per sample = pose landmarks + face landmarks.
# `results` is whatever the last processed frame produced; when that frame had
# no pose or face detection the attribute is None, so fail with an actionable
# message instead of an opaque AttributeError.
if results.pose_landmarks is None or results.face_landmarks is None:
    raise RuntimeError(
        "The last processed frame has no pose and/or face landmarks; "
        "re-run a detection cell with your face and upper body in view."
    )
num_coords = len(results.pose_landmarks.landmark) + len(results.face_landmarks.landmark)
num_coords

501

In [9]:
# CSV header: the label column first, then x/y/z/v column names for each
# landmark, numbered from 1 up to num_coords.
landmarks = ['class']
for val in range(1, num_coords + 1):
    landmarks.extend('{}{}'.format(axis, val) for axis in 'xyzv')

In [10]:
# Inspect the generated column names
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [11]:
# Create (or truncate) coords.csv so that it contains only the header row
with open('coords.csv', mode='w', newline='') as f:
    csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL).writerow(landmarks)

In [12]:
# Label stored in the first CSV column of every row written by the capture cell below
class_name = "sad"

In [13]:
cap = cv2.VideoCapture(0)

try:
    # Open the CSV once for the whole session (append mode keeps the header and
    # rows from earlier classes) instead of reopening it for every frame.
    with open('coords.csv', mode='a', newline='') as f:
        csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)

        # Initiate holistic model
        with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:

            while cap.isOpened():
                ret, frame = cap.read()
                if not ret:
                    # The read failed: `frame` is not a usable image, so stop
                    # instead of crashing inside cvtColor.
                    break

                # Recolor Feed
                image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                image.flags.writeable = False

                # Make Detections
                results = holistic.process(image)

                # Recolor image back to BGR for rendering
                image.flags.writeable = True
                image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

                # 1. Draw face landmarks (use FACEMESH_TESSELATION)
                if results.face_landmarks:
                    mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION,
                                              mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                              # channel values are 8-bit, so 255 is the maximum
                                              mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1))

                # 2. Right hand
                mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                         mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                         mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

                # 3. Left Hand
                mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                         mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                         mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

                # 4. Pose Detections
                mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                         mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                         mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

                # Export coordinates. A row is only meaningful when BOTH pose and
                # face were detected; test for that explicitly rather than hiding
                # every possible error (including failed writes) behind a bare except.
                if results.pose_landmarks is not None and results.face_landmarks is not None:
                    # Extract Pose landmarks
                    pose = results.pose_landmarks.landmark
                    pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())

                    # Extract Face landmarks
                    face = results.face_landmarks.landmark
                    face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())

                    # Label first, then pose values, then face values -- the same
                    # order as the header row
                    csv_writer.writerow([class_name] + pose_row + face_row)

                cv2.imshow('Raw Webcam Feed', image)

                if cv2.waitKey(10) & 0xFF == ord('q'):
                    break
finally:
    # Always free the camera and close the preview window
    cap.release()
    cv2.destroyAllWindows()


# 3. Train Custom Model Using Scikit Learn

## 3.1 Read in Collected Data and Process

In [14]:
import pandas as pd
from sklearn.model_selection import train_test_split

In [15]:
# Load the landmark samples collected in coords.csv
df = pd.read_csv('coords.csv')

In [16]:
# First rows of the collected data
df.head()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,sad,0.673883,0.606078,-1.513018,0.998811,0.70182,0.522578,-1.416662,0.997406,0.721743,...,-0.000915,0.0,0.770042,0.501003,0.045191,0.0,0.777396,0.492871,0.047277,0.0
1,sad,0.673756,0.605776,-1.602976,0.998288,0.70056,0.521706,-1.481247,0.997074,0.720726,...,-0.001793,0.0,0.767857,0.499251,0.043503,0.0,0.774546,0.491796,0.045474,0.0
2,sad,0.672151,0.605527,-1.659409,0.998057,0.697928,0.521139,-1.536518,0.996966,0.718747,...,-0.001387,0.0,0.764472,0.497448,0.043428,0.0,0.771108,0.489933,0.045337,0.0
3,sad,0.671193,0.605522,-1.722264,0.997797,0.69611,0.520594,-1.599508,0.996804,0.717311,...,-0.001856,0.0,0.765807,0.49735,0.042415,0.0,0.772435,0.489599,0.044355,0.0
4,sad,0.671179,0.605909,-1.797587,0.997611,0.696093,0.520555,-1.673583,0.996649,0.717304,...,-0.000357,0.0,0.766631,0.496793,0.044155,0.0,0.773426,0.488797,0.046108,0.0


In [17]:
# Last rows of the collected data
df.tail()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
19,sad,0.50432,0.622547,-1.553665,0.994527,0.546405,0.521492,-1.488438,0.99398,0.576042,...,-0.008654,0.0,0.59937,0.485452,-0.01226,0.0,0.607536,0.472993,-0.01429,0.0
20,sad,0.516787,0.618693,-1.640543,0.994485,0.555269,0.52027,-1.549209,0.993969,0.584949,...,-0.006789,0.0,0.659042,0.476493,0.015047,0.0,0.665804,0.465347,0.015208,0.0
21,sad,0.566741,0.611077,-1.686461,0.99472,0.598177,0.516136,-1.574126,0.994257,0.623813,...,-0.002872,0.0,0.694509,0.474532,0.030244,0.0,0.700897,0.46443,0.031377,0.0
22,sad,0.609985,0.606968,-1.690077,0.994707,0.63293,0.514866,-1.573542,0.994322,0.652723,...,0.003946,0.0,0.724913,0.478644,0.051095,0.0,0.730734,0.470254,0.05336,0.0
23,sad,0.635079,0.601488,-1.686964,0.994535,0.651106,0.513079,-1.56965,0.994209,0.668871,...,0.004167,0.0,0.736976,0.48002,0.055205,0.0,0.7423,0.471265,0.057794,0.0


In [70]:
# Rows labelled 'wave'; the recorded output for this cell has a header but no rows
df[df['class']=='wave']

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501


In [71]:
# Separate the label column from the landmark columns
y = df['class'] # target value
X = df.drop(columns=['class']) # features

In [72]:
# Hold out 30% of the samples for evaluation; the fixed random_state keeps the split repeatable
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=1234)

In [73]:
# Inspect the held-out feature rows
X_test

Unnamed: 0,x1,y1,z1,v1,x2,y2,z2,v2,x3,y3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
263,0.529031,0.539838,-1.208879,0.999475,0.559137,0.480468,-1.138925,0.998923,0.582513,0.481862,...,-0.001608,0.0,0.590233,0.468628,0.020492,0.0,0.595983,0.461490,0.021075,0.0
77,0.392653,0.559100,-1.430887,0.999548,0.422583,0.490989,-1.331480,0.999476,0.440784,0.495545,...,-0.016099,0.0,0.474671,0.503379,0.003644,0.0,0.481827,0.494505,0.003946,0.0
163,0.559856,0.604692,-1.537517,0.998916,0.585246,0.524771,-1.457976,0.997477,0.600971,0.523674,...,-0.013425,0.0,0.635077,0.517787,0.017497,0.0,0.639931,0.511390,0.018394,0.0
206,0.520391,0.588952,-1.338330,0.999192,0.553459,0.508157,-1.278191,0.998464,0.576750,0.505051,...,-0.014673,0.0,0.594599,0.517553,0.000154,0.0,0.600545,0.508007,0.000044,0.0
167,0.561019,0.605435,-1.474053,0.998663,0.585978,0.525987,-1.401680,0.996999,0.601071,0.525276,...,-0.015614,0.0,0.635474,0.519326,0.012322,0.0,0.640690,0.512325,0.012918,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
51,0.371020,0.545866,-1.415979,0.999313,0.410275,0.486595,-1.311429,0.999225,0.430361,0.492007,...,-0.014271,0.0,0.457727,0.509061,0.008053,0.0,0.464680,0.501833,0.008377,0.0
284,0.518099,0.543335,-1.290829,0.999371,0.547564,0.482061,-1.218027,0.998729,0.570402,0.482558,...,0.002969,0.0,0.604905,0.480979,0.030421,0.0,0.610917,0.475190,0.031543,0.0
205,0.522656,0.580285,-1.336037,0.999226,0.555130,0.502012,-1.273325,0.998561,0.578338,0.499466,...,-0.015013,0.0,0.594865,0.516136,-0.000913,0.0,0.600881,0.505847,-0.000949,0.0
9,0.628595,0.573134,-1.218545,0.999945,0.660316,0.490308,-1.145461,0.999928,0.678244,0.490302,...,-0.014698,0.0,0.720123,0.471514,0.018277,0.0,0.726254,0.463033,0.019299,0.0


## 3.2 Train Machine Learning Classification Model

In [74]:
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 

from sklearn.linear_model import LogisticRegression, RidgeClassifier
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [75]:
# Candidate classifiers, each preceded by feature standardisation.
# The two tree ensembles are randomised, so they get a fixed seed (the same
# value used for the train/test split) to make training reproducible across
# kernel restarts.
pipelines = {
    'lr':make_pipeline(StandardScaler(), LogisticRegression()),
    'rc':make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf':make_pipeline(StandardScaler(), RandomForestClassifier(random_state=1234)),
    'gb':make_pipeline(StandardScaler(), GradientBoostingClassifier(random_state=1234)),
}

In [76]:
# Fit every candidate pipeline on the training split and keep the fitted
# pipelines in a dict keyed by the same short algorithm name.
fit_models = {}
for algo, pipeline in pipelines.items():
    model = pipeline.fit(X_train, y_train)
    fit_models[algo] = model

In [77]:
# Inspect the fitted pipelines
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rc': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('ridgeclassifier', RidgeClassifier())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())]),
 'gb': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('gradientboostingclassifier', GradientBoostingClassifier())])}

In [78]:
# Predicted labels from the ridge-classifier pipeline on the held-out split
fit_models['rc'].predict(X_test)

array(['sad', 'bored', 'sad', 'sad', 'sad', 'bored', 'sad', 'sad', 'sad',
       'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad',
       'bored', 'bored', 'bored', 'bored', 'bored', 'sad', 'bored',
       'bored', 'sad', 'sad', 'sad', 'bored', 'bored', 'bored', 'bored',
       'sad', 'bored', 'sad', 'sad', 'sad', 'sad', 'bored', 'sad', 'sad',
       'bored', 'sad', 'sad', 'bored', 'bored', 'sad', 'sad', 'sad',
       'bored', 'sad', 'sad', 'sad', 'sad', 'bored', 'sad', 'bored',
       'sad', 'bored', 'bored', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad',
       'bored', 'bored', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad',
       'sad', 'bored', 'bored', 'bored', 'sad', 'sad', 'sad', 'bored',
       'bored', 'sad', 'bored', 'sad', 'sad', 'bored', 'bored'],
      dtype='<U5')

## 3.3 Evaluate and Serialize Model 

In [19]:
from sklearn.metrics import accuracy_score # Accuracy metrics 
import pickle 

In [80]:
# Print the held-out accuracy of every fitted pipeline.
# NOTE(review): every model scores 1.0 in the recorded output. The rows are
# presumably consecutive webcam frames, so a random split may put near-duplicate
# frames in both train and test -- confirm before trusting these numbers.
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    print(algo, accuracy_score(y_test, yhat))

lr 1.0
rc 1.0
rf 1.0
gb 1.0


In [81]:
# Ridge-classifier predictions on the held-out split, for side-by-side comparison with y_test
fit_models['rc'].predict(X_test)

array(['sad', 'bored', 'sad', 'sad', 'sad', 'bored', 'sad', 'sad', 'sad',
       'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad',
       'bored', 'bored', 'bored', 'bored', 'bored', 'sad', 'bored',
       'bored', 'sad', 'sad', 'sad', 'bored', 'bored', 'bored', 'bored',
       'sad', 'bored', 'sad', 'sad', 'sad', 'sad', 'bored', 'sad', 'sad',
       'bored', 'sad', 'sad', 'bored', 'bored', 'sad', 'sad', 'sad',
       'bored', 'sad', 'sad', 'sad', 'sad', 'bored', 'sad', 'bored',
       'sad', 'bored', 'bored', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad',
       'bored', 'bored', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad', 'sad',
       'sad', 'bored', 'bored', 'bored', 'sad', 'sad', 'sad', 'bored',
       'bored', 'sad', 'bored', 'sad', 'sad', 'bored', 'bored'],
      dtype='<U5')

In [82]:
# True labels of the held-out split
y_test

263      sad
77     bored
163      sad
206      sad
167      sad
       ...  
51     bored
284      sad
205      sad
9      bored
83     bored
Name: class, Length: 91, dtype: object

In [83]:
# Serialize the fitted random-forest pipeline to model.pkl
with open('model.pkl', 'wb') as model_file:
    pickle.dump(fit_models['rf'], model_file)

# 4. Make Detections with Model

In [20]:
# Read the pipeline back from model.pkl.
# Unpickling can execute arbitrary code, so only load a file you produced yourself.
with open('model.pkl', 'rb') as model_file:
    model = pickle.load(model_file)

In [21]:
# Display the loaded pipeline
model

In [25]:
cap = cv2.VideoCapture(0)

# Column names the pipeline was fitted with (None when the installed
# scikit-learn does not record them). Building the live sample with the same
# names keeps it consistent with the training frame and avoids scikit-learn's
# feature-name mismatch warning on every frame.
feature_names = getattr(model, 'feature_names_in_', None)

try:
    # Initiate holistic model
    with mp_holistic.Holistic(min_detection_confidence=0.1, min_tracking_confidence=0.1) as holistic:

        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                # The read failed: `frame` is not a usable image, so stop
                # instead of crashing inside cvtColor.
                break

            # Recolor Feed
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Make Detections
            results = holistic.process(image)

            # Recolor image back to BGR for rendering
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Draw face landmarks (use FACEMESH_TESSELATION)
            if results.face_landmarks:
                mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION,
                                          mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                          # channel values are 8-bit, so 255 is the maximum
                                          mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1))

            # 2. Right hand
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

            # 3. Left Hand
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

            # 4. Pose Detections
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                     mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))

            # Classify only when BOTH pose and face were detected (the model was
            # trained on rows containing both). Testing this explicitly replaces
            # the former bare `except: pass`, which also hid genuine errors.
            if results.pose_landmarks is not None and results.face_landmarks is not None:
                # Extract Pose landmarks
                pose = results.pose_landmarks.landmark
                pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())

                # Extract Face landmarks
                face = results.face_landmarks.landmark
                face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())

                # Concatenate rows
                row = pose_row + face_row

                # Make Detections. A dedicated name is used so the training
                # feature matrix `X` from section 3 is not overwritten.
                sample = pd.DataFrame([row], columns=feature_names)
                body_language_class = model.predict(sample)[0]
                body_language_prob = model.predict_proba(sample)[0]
                print(body_language_class, body_language_prob)

                # Grab ear coords: landmark x/y are normalized, so scale them by
                # the real frame size rather than an assumed 640x480.
                frame_height, frame_width = image.shape[:2]
                left_ear = results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR]
                coords = (int(left_ear.x * frame_width), int(left_ear.y * frame_height))

                # Filled label box next to the ear, sized by the label length
                cv2.rectangle(image,
                              (coords[0], coords[1]+5),
                              (coords[0]+len(body_language_class)*20, coords[1]-30),
                              (245, 117, 16), -1)
                cv2.putText(image, body_language_class, coords,
                            cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Get status box
                cv2.rectangle(image, (0,0), (250, 60), (245, 117, 16), -1)

                # Display Class
                cv2.putText(image, 'CLASS', (95,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
                cv2.putText(image, body_language_class.split(' ')[0], (90,40),
                            cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Display Probability (of the most likely class)
                cv2.putText(image, 'PROB', (15,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
                cv2.putText(image, str(round(float(np.max(body_language_prob)), 2)),
                            (10,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

            cv2.imshow('Raw Webcam Feed', image)

            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the preview window
    cap.release()
    cv2.destroyAllWindows()




bored [0.88 0.12]




bored [0.87 0.13]




bored [0.85 0.15]
bored [0.85 0.15]




bored [0.84 0.16]




bored [0.85 0.15]




bored [0.85 0.15]
bored [0.85 0.15]




bored [0.85 0.15]




bored [0.8 0.2]




bored [0.81 0.19]




bored [0.72 0.28]




bored [0.6 0.4]




bored [0.55 0.45]




bored [0.62 0.38]




bored [0.65 0.35]




bored [0.62 0.38]




bored [0.61 0.39]




bored [0.65 0.35]




bored [0.63 0.37]




bored [0.61 0.39]




bored [0.61 0.39]




bored [0.62 0.38]




bored [0.62 0.38]




bored [0.61 0.39]




bored [0.57 0.43]




bored [0.57 0.43]




bored [0.55 0.45]




bored [0.52 0.48]




bored [0.53 0.47]




bored [0.52 0.48]




sad [0.44 0.56]




bored [0.52 0.48]




bored [0.57 0.43]




bored [0.56 0.44]
bored [0.56 0.44]




bored [0.56 0.44]
bored [0.54 0.46]
bored [0.57 0.43]




bored [0.52 0.48]


In [24]:
# Scratch check of the label anchor: LEFT_EAR's (x, y) from the last `results`,
# multiplied by a hard-coded 640x480 frame size and truncated to integers
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(363, 208)