### Install and import Dependencies

In [42]:
import cv2
import mediapipe as mp 

In [43]:
mp_drawing = mp.solutions.drawing_utils
mp_holistic = mp.solutions.holistic

### Make some detection

In [44]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # face_landmarks, pose_landmarks, left_hand_landmarks, right_hand_landmarks
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION, 
                                 mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                 mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1)
                                 )
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                 )
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()



In [45]:
results.face_landmarks.landmark[0]

x: 0.478361
y: 0.69993031
z: -0.0198857784

### Capture Landmarks and Export to CSV

In [46]:
import csv 
import os 
import numpy as np 

In [47]:
num_coords = len(results.pose_landmarks.landmark) + len(results.face_landmarks.landmark)
num_coords

501

In [48]:
landmarks = ['class']
for val in range(1, num_coords+1):
    landmarks += ['x{}'.format(val), 'y{}'.format(val), 'z{}'.format(val), 'v{}'.format(val)]

In [49]:
landmarks[-1]

'v501'

In [50]:
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [None]:
with open('coords.csv', mode='w', newline='') as f:
    csv_writter = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
    csv_writter.writerow(landmarks)

In [None]:
class_name = "Victorious"

In [None]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # face_landmarks, pose_landmarks, left_hand_landmarks, right_hand_landmarks
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION, 
                                 mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                 mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1)
                                 )
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                 )
        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concate rows
            row = pose_row+face_row
            
            # Append class name 
            row.insert(0, class_name)
            
            # Export to CSV
            with open('coords.csv', mode='a', newline='') as f:
                csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
                csv_writer.writerow(row) 
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()

In [None]:
len(row)

In [None]:
# face = results.pose_world_landmarks.landmark

In [None]:
# pose_row = np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten()

In [None]:
# face_row = np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten()

In [None]:
# row = pose_row+face_row

In [None]:
# row.insert(0, class_name)

In [None]:
# len(row) 

### Train Custom Model using scikitlearn

#### Read in collected Data and Process

In [51]:
import pandas as pd 
from sklearn.model_selection import train_test_split 

In [52]:
df = pd.read_csv("coords.csv")
df

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,Happy,0.488605,0.585417,-1.245149,0.999535,0.518417,0.523218,-1.167269,0.998767,0.536462,...,-0.007699,0.0,0.551217,0.524423,0.013217,0.0,0.557298,0.517729,0.014006,0.0
1,Happy,0.488604,0.597173,-1.128628,0.999516,0.518407,0.531122,-1.055943,0.998796,0.536446,...,-0.006456,0.0,0.552950,0.527253,0.014659,0.0,0.558940,0.521474,0.015386,0.0
2,Happy,0.488612,0.608904,-1.085987,0.999507,0.518355,0.539792,-1.014913,0.998834,0.536423,...,-0.009329,0.0,0.554525,0.528685,0.010920,0.0,0.560535,0.522218,0.011635,0.0
3,Happy,0.488656,0.611156,-1.074319,0.999515,0.518355,0.541776,-1.004128,0.998894,0.536440,...,-0.009308,0.0,0.555586,0.532307,0.010802,0.0,0.561680,0.526040,0.011517,0.0
4,Happy,0.491783,0.619147,-1.097466,0.999528,0.520929,0.548552,-1.024631,0.998938,0.538321,...,-0.011321,0.0,0.560200,0.538365,0.008164,0.0,0.566312,0.532468,0.008687,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
477,Victorious,0.511042,0.719340,-1.021762,0.999646,0.536823,0.659338,-0.951616,0.999511,0.548930,...,-0.014132,0.0,0.553147,0.637781,0.003327,0.0,0.557459,0.632397,0.003742,0.0
478,Victorious,0.508381,0.674971,-1.133450,0.999575,0.533355,0.609981,-1.056884,0.999388,0.545310,...,-0.013209,0.0,0.551124,0.607024,0.007416,0.0,0.555608,0.601605,0.008079,0.0
479,Victorious,0.504468,0.661356,-1.186786,0.999523,0.529214,0.593203,-1.109085,0.999316,0.541175,...,-0.010059,0.0,0.547178,0.596913,0.010682,0.0,0.551478,0.591459,0.011340,0.0
480,Victorious,0.497818,0.657158,-1.217317,0.999519,0.522977,0.586601,-1.146403,0.999288,0.535460,...,-0.011913,0.0,0.543697,0.570938,0.009928,0.0,0.547767,0.565948,0.010533,0.0


In [53]:
X = df.drop(columns='class', axis=1)

In [54]:
y = df['class']

In [55]:
X_train, X_test, y_train, y_test = train_test_split(X, y ,test_size=0.3, random_state=1234)

In [56]:
y_test

239           Sad
459    Victorious
329           Sad
278           Sad
381    Victorious
          ...    
99          Happy
423    Victorious
163           Sad
339    Victorious
101         Happy
Name: class, Length: 145, dtype: object

#### Train Machine Learning Classification model

In [57]:
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 
from sklearn.linear_model import LogisticRegression, RidgeClassifier 
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier 

In [58]:
pipelines = {
    'lr': make_pipeline(StandardScaler(), LogisticRegression()),
    'rc': make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf': make_pipeline(StandardScaler(), RandomForestClassifier()),
    'gb': make_pipeline(StandardScaler(), GradientBoostingClassifier())
}

In [59]:
fit_models = {}
for algo, pipeline in pipelines.items():
    model = pipeline.fit(X_train, y_train)
    fit_models[algo] = model 

In [60]:
list(pipelines.values())[0]

In [61]:
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rc': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('ridgeclassifier', RidgeClassifier())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())]),
 'gb': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('gradientboostingclassifier', GradientBoostingClassifier())])}

In [62]:
fit_models['rc'].predict(X_test)

array(['Sad', 'Victorious', 'Sad', 'Sad', 'Victorious', 'Sad',
       'Victorious', 'Sad', 'Happy', 'Sad', 'Victorious', 'Happy',
       'Happy', 'Sad', 'Happy', 'Happy', 'Sad', 'Sad', 'Sad', 'Sad',
       'Victorious', 'Sad', 'Sad', 'Happy', 'Happy', 'Happy', 'Happy',
       'Victorious', 'Sad', 'Sad', 'Sad', 'Victorious', 'Victorious',
       'Sad', 'Happy', 'Happy', 'Happy', 'Sad', 'Victorious', 'Sad',
       'Victorious', 'Sad', 'Sad', 'Happy', 'Happy', 'Happy', 'Sad',
       'Victorious', 'Sad', 'Sad', 'Victorious', 'Sad', 'Victorious',
       'Victorious', 'Victorious', 'Sad', 'Sad', 'Sad', 'Sad',
       'Victorious', 'Sad', 'Happy', 'Victorious', 'Happy', 'Happy',
       'Victorious', 'Sad', 'Victorious', 'Victorious', 'Victorious',
       'Sad', 'Sad', 'Victorious', 'Victorious', 'Sad', 'Happy', 'Happy',
       'Happy', 'Happy', 'Victorious', 'Victorious', 'Victorious', 'Sad',
       'Happy', 'Happy', 'Victorious', 'Sad', 'Victorious', 'Victorious',
       'Victorious', 'Happy'

#### Evaluate and Serialize Model

In [63]:
from sklearn.metrics import accuracy_score 
import pickle 

In [64]:
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    print(algo, accuracy_score(y_test, yhat))

lr 1.0
rc 1.0
rf 1.0
gb 0.993103448275862


In [65]:
fit_models['rf'].predict(X_test)

array(['Sad', 'Victorious', 'Sad', 'Sad', 'Victorious', 'Sad',
       'Victorious', 'Sad', 'Happy', 'Sad', 'Victorious', 'Happy',
       'Happy', 'Sad', 'Happy', 'Happy', 'Sad', 'Sad', 'Sad', 'Sad',
       'Victorious', 'Sad', 'Sad', 'Happy', 'Happy', 'Happy', 'Happy',
       'Victorious', 'Sad', 'Sad', 'Sad', 'Victorious', 'Victorious',
       'Sad', 'Happy', 'Happy', 'Happy', 'Sad', 'Victorious', 'Sad',
       'Victorious', 'Sad', 'Sad', 'Happy', 'Happy', 'Happy', 'Sad',
       'Victorious', 'Sad', 'Sad', 'Victorious', 'Sad', 'Victorious',
       'Victorious', 'Victorious', 'Sad', 'Sad', 'Sad', 'Sad',
       'Victorious', 'Sad', 'Happy', 'Victorious', 'Happy', 'Happy',
       'Victorious', 'Sad', 'Victorious', 'Victorious', 'Victorious',
       'Sad', 'Sad', 'Victorious', 'Victorious', 'Sad', 'Happy', 'Happy',
       'Happy', 'Happy', 'Victorious', 'Victorious', 'Victorious', 'Sad',
       'Happy', 'Happy', 'Victorious', 'Sad', 'Victorious', 'Victorious',
       'Victorious', 'Happy'

In [66]:
y_test

239           Sad
459    Victorious
329           Sad
278           Sad
381    Victorious
          ...    
99          Happy
423    Victorious
163           Sad
339    Victorious
101         Happy
Name: class, Length: 145, dtype: object

In [67]:
with open('body_language.pkl', 'wb') as f:
    pickle.dump(fit_models['rf'], f)

### Make Detections with Model

In [68]:
with open('body_language.pkl', 'rb') as f:
    model = pickle.load(f)

In [69]:
model

In [None]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # face_landmarks, pose_landmarks, left_hand_landmarks, right_hand_landmarks
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION, 
                                 mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                 mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1)
                                 )
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                 )
        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concate rows
            row = pose_row+face_row
            
            # Append class name 
            # row.insert(0, class_name)
            
            # # Export to CSV
            # with open('coords.csv', mode='a', newline='') as f:
            #     csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
            #     csv_writer.writerow(row) 

            # Make Detections
            X = pd.DataFrame([row])
            body_language_class = model.predict(X)[0]
            body_language_prob = model.predict_proba(X)[0]
            print(body_language_class, body_language_prob)

            # Grabs ear coords
            coords = tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x,
                                                results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)),
                                                [640, 480]).astype(int))

            cv2.rectangle(image, (coords[0], coords[1]+5), (coords[0]+len(body_language_class)*20, coords[1]-30),
            (245, 117, 16), -1)
            cv2.putText(image, body_language_class, coords,
            cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()

In [None]:
np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x,
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640, 480]).astype(int)
