# 0. Install and Import Dependencies

In [1]:
!pip install mediapipe opencv-python pandas scikit-learn



In [1]:
import mediapipe as mp # Import mediapipe
import cv2 # Import opencv

In [2]:
# Short aliases for the two MediaPipe solution modules used by the cells below.
mp_holistic = mp.solutions.holistic      # holistic model (face / pose / hand landmarks)
mp_drawing = mp.solutions.drawing_utils  # helpers that render landmarks onto an image

# 1. Make Some Detections

In [3]:
# Preview cell: run the webcam feed through MediaPipe Holistic and draw every
# detected landmark group on the live image. Press 'q' in the window to stop.
# When the loop ends, `results` still holds the detections of the last frame.
cap = cv2.VideoCapture(1)
try:
    # Initiate holistic model
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:

        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                # No frame was delivered (camera busy, unplugged, stream ended):
                # stop here instead of handing an empty frame to cv2.cvtColor.
                break

            # OpenCV delivers BGR; convert to RGB before running the model.
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Make Detections
            # Result attributes used below: face_landmarks, pose_landmarks,
            # left_hand_landmarks, right_hand_landmarks
            results = holistic.process(image)

            # Recolor image back to BGR for rendering
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Draw face landmarks (channel values kept within 0-255)
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION,
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1)
                                      )

            # 2. Right hand
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                      )

            # 3. Left Hand
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                      )

            # 4. Pose Detections
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                      )

            cv2.imshow('Raw Webcam Feed', image)

            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the window, even if a frame raised.
    cap.release()
    cv2.destroyAllWindows()

In [4]:
# Visibility value of the first face landmark in `results`, i.e. in the
# detections left behind by the last frame of the webcam loop.
# The recorded run shows 0.0 here.
results.face_landmarks.landmark[0].visibility

0.0

# 2. Capture Landmarks & Export to CSV
<img src="https://i.imgur.com/8bForKY.png">
<img src="https://i.imgur.com/AzKNp7A.png">

In [5]:
import csv
import os
import numpy as np

In [6]:
# Inspect the raw face landmark list of the last processed frame
# (each entry prints its x, y and z values).
results.face_landmarks.landmark

[x: 0.554776668548584
y: 0.8044458627700806
z: -0.028675880283117294
, x: 0.5537651777267456
y: 0.7487563490867615
z: -0.0673699900507927
, x: 0.5521619319915771
y: 0.7624728679656982
z: -0.03330077603459358
, x: 0.538690984249115
y: 0.6872466802597046
z: -0.05568819120526314
, x: 0.55340975522995
y: 0.7312408685684204
z: -0.07286413758993149
, x: 0.5517671704292297
y: 0.7060811519622803
z: -0.06937525421380997
, x: 0.546964168548584
y: 0.6422461271286011
z: -0.03995903953909874
, x: 0.4476086497306824
y: 0.6348496675491333
z: 0.002314015757292509
, x: 0.544600248336792
y: 0.5906815528869629
z: -0.034061551094055176
, x: 0.5440767407417297
y: 0.5649400353431702
z: -0.03854047507047653
, x: 0.5408483743667603
y: 0.47757846117019653
z: -0.03296862542629242
, x: 0.5550376176834106
y: 0.8126574754714966
z: -0.02610272727906704
, x: 0.5547488927841187
y: 0.8184000253677368
z: -0.021370626986026764
, x: 0.554135799407959
y: 0.8201895952224731
z: -0.015486016869544983
, x: 0.5548650026321411


In [7]:
# Landmarks captured per frame: pose landmarks plus face landmarks.
num_coords = sum(
    len(group.landmark)
    for group in (results.pose_landmarks, results.face_landmarks)
)
num_coords  # total number of tracked landmarks (501 in the recorded run)

501

In [8]:
# CSV header: the label column followed by x/y/z/v columns for each landmark,
# numbered from 1 to num_coords.
landmarks = ['class'] + [
    '{}{}'.format(axis, val)
    for val in range(1, num_coords + 1)
    for axis in ('x', 'y', 'z', 'v')
]

In [9]:
# Show the generated CSV header as a sanity check.
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [10]:
# Create (or overwrite) the training CSV so that it contains only the header row.
with open('khautrang.csv', mode='w', newline='') as f:
    csv.writer(
        f,
        delimiter=',',
        quotechar='"',
        quoting=csv.QUOTE_MINIMAL,
    ).writerow(landmarks)

In [20]:
# Label written into the first column of every row exported by the capture
# cell; change it and re-run the capture once per class to be recorded.
class_name = "Khong Khau trang"

In [21]:
# Capture cell: for every webcam frame in which both pose and face landmarks
# are detected, append one row (class_name followed by x, y, z, visibility of
# each landmark) to 'khautrang.csv'. Press 'q' in the window to stop.
# `class_name` must be set before running this cell.
cap = cv2.VideoCapture(1)
try:
    # Open the CSV once for the whole session instead of once per frame.
    with open('khautrang.csv', mode='a', newline='') as f:
        csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)

        # Initiate holistic model
        with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:

            while cap.isOpened():
                ret, frame = cap.read()
                if not ret:
                    # No frame was delivered (camera busy, unplugged, stream
                    # ended): stop instead of passing an empty frame on.
                    break

                # OpenCV delivers BGR; convert to RGB before running the model.
                image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                image.flags.writeable = False

                # Make Detections
                results = holistic.process(image)

                # Recolor image back to BGR for rendering
                image.flags.writeable = True
                image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

                # 1. Draw face landmarks (channel values kept within 0-255)
                mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_CONTOURS,
                                          mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                          mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1)
                                          )

                # 2. Right hand
                mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                          mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                          mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                          )

                # 3. Left Hand
                mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                          mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                          mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                          )

                # 4. Pose Detections
                mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                          mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                          mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                          )

                # Export coordinates. Frames without a pose or a face are
                # skipped explicitly; any other problem (undefined class_name,
                # disk error, ...) is raised instead of being silently dropped.
                if results.pose_landmarks is not None and results.face_landmarks is not None:
                    # Extract Pose landmarks
                    pose = results.pose_landmarks.landmark
                    pose_row = np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten().tolist()

                    # Extract Face landmarks
                    face = results.face_landmarks.landmark
                    face_row = np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten().tolist()

                    # Label first, then pose values, then face values
                    row = [class_name] + pose_row + face_row

                    # Export to CSV
                    csv_writer.writerow(row)

                cv2.imshow('Raw Webcam Feed', image)

                if cv2.waitKey(10) & 0xFF == ord('q'):
                    break
finally:
    # Always free the camera and close the window, even if a frame raised.
    cap.release()
    cv2.destroyAllWindows()

# 3. Train Custom Model Using Scikit Learn

## 3.1 Read in Collected Data and Process

In [22]:
import pandas as pd
from sklearn.model_selection import train_test_split

In [23]:
# Load the landmark rows collected by the capture cell.
df = pd.read_csv('khautrang.csv')

In [24]:
# Peek at the first rows of the collected data.
df.head()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,Khau trang,0.415743,0.532489,-0.688768,0.999888,0.452584,0.479172,-0.672577,0.999684,0.476827,...,0.003813,0.0,0.511344,0.473964,0.007217,0.0,0.51821,0.467047,0.006222,0.0
1,Khau trang,0.392152,0.51841,-0.919907,0.999302,0.429105,0.474411,-0.905029,0.998862,0.452077,...,0.000367,0.0,0.442949,0.468498,-0.010705,0.0,0.449468,0.46031,-0.012549,0.0
2,Khau trang,0.373521,0.555362,-0.78349,0.999424,0.401816,0.498657,-0.770004,0.999025,0.424278,...,-0.00097,0.0,0.433719,0.503042,-0.012715,0.0,0.43895,0.494317,-0.014497,0.0
3,Khau trang,0.375491,0.57334,-0.808794,0.999371,0.404824,0.513256,-0.798833,0.998925,0.427186,...,0.000997,0.0,0.434833,0.514211,-0.010075,0.0,0.440819,0.505476,-0.011694,0.0
4,Khau trang,0.372332,0.574253,-0.769505,0.999381,0.404335,0.515017,-0.775106,0.998938,0.427313,...,-0.008161,0.0,0.474618,0.518523,-0.00736,0.0,0.480523,0.509004,-0.008331,0.0


In [25]:
# Peek at the last rows of the collected data.
df.tail()

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
327,Khong Khau trang,0.531576,0.721696,-1.308099,0.999373,0.577723,0.651314,-1.229471,0.998932,0.603296,...,-0.011827,0.0,0.638068,0.656225,0.009833,0.0,0.644787,0.648186,0.010104,0.0
328,Khong Khau trang,0.533415,0.731559,-1.138252,0.999387,0.578885,0.659159,-1.060831,0.998924,0.604365,...,-0.011344,0.0,0.636557,0.655114,0.010105,0.0,0.642957,0.648194,0.010222,0.0
329,Khong Khau trang,0.532794,0.717384,-1.269596,0.999416,0.578374,0.643671,-1.188416,0.998975,0.604012,...,-0.01281,0.0,0.631577,0.618782,0.008069,0.0,0.638196,0.612374,0.008167,0.0
330,Khong Khau trang,0.532623,0.70557,-1.335126,0.999436,0.578175,0.634216,-1.214648,0.999019,0.603218,...,-0.012644,0.0,0.627844,0.587118,0.008403,0.0,0.634772,0.579412,0.008652,0.0
331,Khong Khau trang,0.533065,0.698373,-1.55634,0.999458,0.577814,0.627699,-1.448766,0.999082,0.602801,...,-0.012305,0.0,0.64068,0.599626,0.01137,0.0,0.646905,0.59143,0.011843,0.0


In [31]:
# Select the rows whose label is "Think?".
# NOTE(review): the labels visible elsewhere in this notebook are
# "Khau trang" / "Khong Khau trang" - confirm this filter still matches the current CSV.
df[df['class']=="Think?"]

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
342,Think?,0.428042,0.601111,-1.099079,0.999861,0.480492,0.520044,-1.063433,0.999627,0.506605,...,-0.008373,0.0,0.534677,0.507974,-0.003867,0.0,0.542080,0.502733,-0.004923,0.0
343,Think?,0.429084,0.600968,-1.114720,0.999869,0.480497,0.520141,-1.074123,0.999650,0.506774,...,-0.009833,0.0,0.534964,0.510410,-0.005678,0.0,0.542458,0.505154,-0.006829,0.0
344,Think?,0.429725,0.599402,-1.142413,0.999876,0.480496,0.520026,-1.094620,0.999667,0.506871,...,-0.009799,0.0,0.534555,0.514928,-0.006406,0.0,0.542361,0.508850,-0.007450,0.0
345,Think?,0.429720,0.598336,-1.149945,0.999877,0.479694,0.519797,-1.106555,0.999672,0.506365,...,-0.009003,0.0,0.534233,0.508584,-0.005197,0.0,0.541935,0.502760,-0.006239,0.0
346,Think?,0.430317,0.599545,-1.196663,0.999878,0.480024,0.520684,-1.156068,0.999673,0.507054,...,-0.011339,0.0,0.535130,0.512320,-0.006737,0.0,0.542780,0.506563,-0.007756,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
646,Think?,0.402907,0.544077,-0.830941,0.999726,0.446968,0.476758,-0.836027,0.999326,0.465005,...,-0.006514,0.0,0.473788,0.461975,-0.027024,0.0,0.481094,0.454943,-0.029901,0.0
647,Think?,0.402981,0.543618,-0.821909,0.999673,0.447129,0.476327,-0.830315,0.999212,0.465214,...,-0.005833,0.0,0.473513,0.460780,-0.024232,0.0,0.480819,0.453714,-0.026930,0.0
648,Think?,0.403118,0.543653,-0.763753,0.999674,0.447172,0.476311,-0.768121,0.999217,0.465243,...,-0.007276,0.0,0.470352,0.461953,-0.027758,0.0,0.477743,0.454780,-0.030616,0.0
649,Think?,0.403200,0.543645,-0.794687,0.999666,0.447261,0.476273,-0.795741,0.999201,0.465376,...,-0.007179,0.0,0.470776,0.461828,-0.026986,0.0,0.478176,0.454635,-0.029796,0.0


In [26]:
# Separate the label column from the landmark columns.
y = df['class']                # target value
X = df.drop(columns='class')   # features

In [27]:
# Hold out 30% of the rows for evaluation; the fixed seed keeps the split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.3,
    random_state=1234,
)

In [28]:
# Labels of the held-out test rows.
y_test

146          Khau trang
54           Khau trang
80           Khau trang
90           Khau trang
208    Khong Khau trang
             ...       
69           Khau trang
33           Khau trang
162          Khau trang
167          Khau trang
156          Khau trang
Name: class, Length: 100, dtype: object

## 3.2 Train Machine Learning Classification Model

In [29]:
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 

from sklearn.linear_model import LogisticRegression, RidgeClassifier
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [30]:
# One "scale, then classify" pipeline per candidate algorithm, keyed by a short name.
# RidgeClassifier ('rc') and GradientBoostingClassifier ('gb') are imported but
# currently left out of the comparison.
pipelines = {
    algo: make_pipeline(StandardScaler(), estimator_cls())
    for algo, estimator_cls in (
        ('lr', LogisticRegression),
        ('rf', RandomForestClassifier),
    )
}

In [31]:
# Fit every candidate pipeline on the training split and store the fitted
# pipeline under the same short name.
fit_models = {}
for algo in pipelines:
    model = pipelines[algo].fit(X_train, y_train)
    fit_models[algo] = model

In [32]:
# Show the fitted pipelines.
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())])}

In [33]:
# Labels predicted by the random-forest pipeline for the held-out rows.
fit_models['rf'].predict(X_test)

array(['Khau trang', 'Khau trang', 'Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khau trang', 'Khau trang', 'Khong Khau trang',
       'Khau trang', 'Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khong Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khau trang', 'Khau trang',
       'Khau trang', 'Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khau trang', 'Khau trang', 'Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khau trang', 'Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khong Khau trang',
       'Khong Khau trang', 'Khau trang', 'Khong Khau trang', 'Khau trang',
       '

## 3.3 Evaluate and Serialize Model 

In [34]:
from sklearn.metrics import accuracy_score # Accuracy metrics 
import pickle 

In [35]:
# Report the accuracy of each fitted pipeline on the held-out rows.
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    accuracy = accuracy_score(y_test, yhat)
    print(algo, accuracy)

lr 1.0
rf 0.98


In [36]:
# Random-forest predictions for the held-out rows, to compare against y_test.
fit_models['rf'].predict(X_test)

array(['Khau trang', 'Khau trang', 'Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khau trang', 'Khau trang', 'Khong Khau trang',
       'Khau trang', 'Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khong Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khau trang', 'Khau trang',
       'Khau trang', 'Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khau trang', 'Khau trang', 'Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khau trang', 'Khau trang',
       'Khau trang', 'Khong Khau trang', 'Khong Khau trang', 'Khau trang',
       'Khong Khau trang', 'Khong Khau trang', 'Khong Khau trang',
       'Khong Khau trang', 'Khau trang', 'Khong Khau trang', 'Khau trang',
       '

In [37]:
# True labels of the held-out rows, to compare against the predictions.
y_test

146          Khau trang
54           Khau trang
80           Khau trang
90           Khau trang
208    Khong Khau trang
             ...       
69           Khau trang
33           Khau trang
162          Khau trang
167          Khau trang
156          Khau trang
Name: class, Length: 100, dtype: object

In [38]:
# Serialize the fitted random-forest pipeline to disk for the detection cells.
with open('khautrang.pkl', 'wb') as f:
    f.write(pickle.dumps(fit_models['rf']))

# 4. Make Detections with Model

In [39]:
# Restore the saved pipeline. Unpickling can execute arbitrary code, so only
# load a 'khautrang.pkl' that was produced by this notebook.
with open('khautrang.pkl', 'rb') as f:
    model = pickle.loads(f.read())

In [15]:
# Show the pipeline that was loaded from disk.
model

Pipeline(steps=[('standardscaler', StandardScaler()),
                ('randomforestclassifier', RandomForestClassifier())])

In [17]:
# Live detection cell: classify every webcam frame with the loaded pipeline
# (`model`) and overlay the predicted class and its probability on the feed.
# Press 'q' in the window to stop.
cap = cv2.VideoCapture(1)

# Column names the pipeline was fitted with, when it exposes them. Passing
# them along keeps the live features aligned with the training columns.
feature_names = getattr(model, 'feature_names_in_', None)

try:
    # Initiate holistic model
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:

        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                # No frame was delivered (camera busy, unplugged, stream
                # ended): stop instead of passing an empty frame on.
                break

            # OpenCV delivers BGR; convert to RGB before running the model.
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Make Detections
            results = holistic.process(image)

            # Recolor image back to BGR for rendering
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Draw face landmarks (channel values kept within 0-255)
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_CONTOURS,
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1)
                                      )

            # 2. Right hand
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                      )

            # 3. Left Hand
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                      )

            # 4. Pose Detections
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                      )

            # Classify only when both pose and face were detected. Missing
            # detections are skipped explicitly; real errors (wrong feature
            # count, broken model, ...) are raised instead of being hidden.
            if results.pose_landmarks is not None and results.face_landmarks is not None:
                # Extract Pose landmarks
                pose = results.pose_landmarks.landmark
                pose_row = np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten().tolist()

                # Extract Face landmarks
                face = results.face_landmarks.landmark
                face_row = np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten().tolist()

                # Same column order as the training CSV: pose values, then face values
                row = pose_row + face_row

                # Make Detections. A dedicated name is used so the training
                # matrix `X` is not overwritten by a single live frame.
                frame_features = pd.DataFrame([row], columns=feature_names)

                # Run the model once and derive the class from the probabilities.
                body_language_prob = model.predict_proba(frame_features)[0]
                best_idx = int(np.argmax(body_language_prob))
                body_language_class = str(model.classes_[best_idx])

                # Left-ear position in pixels, scaled by the actual frame size
                frame_height, frame_width = image.shape[:2]
                left_ear = results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR]
                coords = (int(left_ear.x * frame_width), int(left_ear.y * frame_height))

                # Label next to the ear: filled box sized from the text length, then the text
                cv2.rectangle(image,
                              (coords[0], coords[1]+5),
                              (coords[0]+len(body_language_class)*20, coords[1]-30),
                              (245, 117, 16), -1)
                cv2.putText(image, body_language_class, coords,
                            cv2.FONT_HERSHEY_COMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Get status box
                cv2.rectangle(image, (0,0), (250, 60), (245, 117, 16), -1)

                # Display Class (only the first word of the label is shown in the box)
                cv2.putText(image, "CLASS"
                            , (95,12), cv2.FONT_HERSHEY_COMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
                cv2.putText(image, body_language_class.split(' ')[0]
                            , (90,40), cv2.FONT_HERSHEY_COMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Display Probability of the predicted class
                cv2.putText(image, "PROB"
                            , (15,12), cv2.FONT_HERSHEY_COMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
                cv2.putText(image, str(round(float(body_language_prob[best_idx]), 2))
                            , (10,40), cv2.FONT_HERSHEY_COMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

            cv2.imshow('Raw Webcam Feed', image)

            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the window, even if a frame raised.
    cap.release()
    cv2.destroyAllWindows()

In [82]:
# Left-ear landmark of the last processed frame, scaled from its x/y values
# to pixel coordinates by multiplying with [640, 480].
# NOTE(review): this assumes a 640x480 frame - confirm against the camera resolution.
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(438, 278)

In [49]:
# Overlay test cell: same landmark preview as before, with a fixed text
# banner drawn on every frame. Press 'q' in the window to stop.
cap = cv2.VideoCapture(1)
try:
    # Initiate holistic model
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:

        while cap.isOpened():
            ret, frame = cap.read()
            if not ret:
                # No frame was delivered (camera busy, unplugged, stream
                # ended): stop instead of passing an empty frame on.
                break

            # OpenCV delivers BGR; convert to RGB before running the model.
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Make Detections
            results = holistic.process(image)

            # Recolor image back to BGR for rendering
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Draw face landmarks (channel values kept within 0-255)
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_CONTOURS,
                                      mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80,255,121), thickness=1, circle_radius=1)
                                      )

            # 2. Right hand
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                      )

            # 3. Left Hand
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                      )

            # 4. Pose Detections
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                      )

            # Fixed banner text drawn on top of the landmarks
            cv2.putText(image, "DUCK HET BUG R"
                            , (90,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

            cv2.imshow('Raw Webcam Feed', image)

            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the window, even if a frame raised.
    cap.release()
    cv2.destroyAllWindows()