In [5]:
!pip install mediapipe opencv-python



In [63]:
import cv2
import mediapipe as mp
import pickle
import joblib
import pandas as pd

In [10]:
# Initialize holistic model
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils
mp_face_mesh = mp.solutions.face_mesh  # Import face mesh for FACEMESH_TESSELATION

cap = cv2.VideoCapture(0)

with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        
        # Make Detections
        results = holistic.process(image)
        
        # Recolor image back to BGR for rendering
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks using FACEMESH_TESSELATION
        if results.face_landmarks:
            mp_drawing.draw_landmarks(image, results.face_landmarks, mp_face_mesh.FACEMESH_TESSELATION, 
                                     mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                     mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1))
        
        # 2. Right hand
        if results.right_hand_landmarks:
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                     mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2))

        # 3. Left Hand
        if results.left_hand_landmarks:
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                     mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2))

        # 4. Pose Detections
        if results.pose_landmarks:
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                     mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                     mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2))
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()




In [12]:
import csv
import os
import numpy as np

In [10]:
# Initialize num_coords to 0
num_coords = 0

# Check if pose_landmarks are detected
if results.pose_landmarks:
    num_coords += len(results.pose_landmarks.landmark)

# Check if face_landmarks are detected
if results.face_landmarks:
    num_coords += len(results.face_landmarks.landmark)

num_coords


501

In [12]:
landmarks = ['class']
for val in range(1, num_coords+1):
    landmarks += ['x{}'.format(val), 'y{}'.format(val), 'z{}'.format(val), 'v{}'.format(val)]

In [14]:
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [16]:
with open('cods.csv', mode='w', newline='') as f:
    csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
    csv_writer.writerow(landmarks)

In [62]:
class_name = "Kill"

In [64]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # face_landmarks, pose_landmarks, left_hand_landmarks, right_hand_landmarks
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION, 
                                 mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                 mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1)
                                 )
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                 )
        # Export coordinates
        try:
            # Extract Pose landmarks
            pose = results.pose_landmarks.landmark
            pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
            face = results.face_landmarks.landmark
            face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concate rows
            row = pose_row+face_row
            
            # Append class name 
            row.insert(0, class_name)
            
            # Export to CSV
            with open('cods.csv', mode='a', newline='') as f:
                csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
                csv_writer.writerow(row) 
            
        except:
            pass
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()

In [38]:
model = joblib.load('body_language.pkl')

In [40]:
model

In [73]:
cap = cv2.VideoCapture(0)
# Initiate holistic model
with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        # print(results.face_landmarks)
        
        # face_landmarks, pose_landmarks, left_hand_landmarks, right_hand_landmarks
        
        # Recolor image back to BGR for rendering
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        
        # 1. Draw face landmarks
        mp_drawing.draw_landmarks(image, results.face_landmarks, mp_holistic.FACEMESH_TESSELATION, 
                                 mp_drawing.DrawingSpec(color=(80,110,10), thickness=1, circle_radius=1),
                                 mp_drawing.DrawingSpec(color=(80,256,121), thickness=1, circle_radius=1)
                                 )
        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )

        # 4. Pose Detections
        mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(245,117,66), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(245,66,230), thickness=2, circle_radius=2)
                                 )
        # Export coordinates
            # Extract Pose landmarks
        pose = results.pose_landmarks.landmark
        pose_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in pose]).flatten())
            
            # Extract Face landmarks
        face = results.face_landmarks.landmark
        face_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in face]).flatten())
            
            # Concate rows
        row = pose_row+face_row
                   

            # Make Detections
        X = pd.DataFrame([row])
        body_language_class = model.predict(X)[0]
        body_language_prob = model.predict_proba(X)[0]
        print(body_language_class, body_language_prob)
        print("Predicted Class:", body_language_class)
        print("Predicted Probabilities:", body_language_prob)
        print(X)
            
            # Grab ear coords
        coords = tuple(np.multiply(
                            np.array(
                                (results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
                                 results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y))
                        , [640,480]).astype(int))
            
        cv2.rectangle(image, 
                          (coords[0], coords[1]+5), 
                          (coords[0]+len(body_language_class)*20, coords[1]-30), 
                          (245, 117, 16), -1)
        cv2.putText(image, body_language_class, coords, 
                        cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Get status box
        cv2.rectangle(image, (0,0), (250, 60), (245, 117, 16), -1)
            
            # Display Class
        cv2.putText(image, 'CLASS'
                        , (95,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
        cv2.putText(image, body_language_class.split(' ')[0]
                        , (90,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Display Probability
        cv2.putText(image, 'PROB'
                        , (15,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
        cv2.putText(image, str(round(body_language_prob[np.argmax(body_language_prob)],2))
                        , (10,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
      
                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()



Sad [0.   0.25 0.01 0.06 0.   0.58 0.   0.09 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.25 0.01 0.06 0.   0.58 0.   0.09 0.01]
      0        1         2         3         4         5         6     \
0  0.44789  0.65539 -1.322682  0.999146  0.482933  0.580237 -1.300415   

       7         8         9     ...      1994  1995     1996      1997  \
0  0.997656  0.501352  0.579238  ... -0.014931   0.0  0.52379  0.555366   

       1998  1999      2000      2001      2002  2003  
0  0.010271   0.0  0.528928  0.550403  0.010616   0.0  

[1 rows x 2004 columns]




Sad [0.   0.24 0.01 0.06 0.   0.59 0.   0.1  0.  ]
Predicted Class: Sad
Predicted Probabilities: [0.   0.24 0.01 0.06 0.   0.59 0.   0.1  0.  ]
      0         1       2         3         4         5         6     \
0  0.45969  0.651747 -1.6474  0.999219  0.489432  0.576489 -1.606315   

       7         8         9     ...      1994  1995      1996      1997  \
0  0.997862  0.509167  0.575617  ... -0.016359   0.0  0.528645  0.561209   

       1998  1999      2000      2001      2002  2003  
0  0.007847   0.0  0.533702  0.556836  0.008031   0.0  

[1 rows x 2004 columns]




Sad [0.   0.23 0.01 0.06 0.   0.6  0.   0.09 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.23 0.01 0.06 0.   0.6  0.   0.09 0.01]
       0         1         2         3         4         5         6     \
0  0.465044  0.649781 -1.541255  0.999278  0.492462  0.573883 -1.497749   

       7         8         9     ...      1994  1995      1996      1997  \
0  0.998036  0.512888  0.573011  ... -0.015382   0.0  0.530834  0.561688   

       1998  1999      2000      2001      2002  2003  
0  0.009794   0.0  0.535956  0.557302  0.010108   0.0  

[1 rows x 2004 columns]




Sad [0.   0.23 0.01 0.06 0.   0.61 0.   0.08 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.23 0.01 0.06 0.   0.61 0.   0.08 0.01]
       0         1         2         3       4         5         6     \
0  0.466415  0.649369 -1.546215  0.999341  0.4932  0.572525 -1.502588   

       7         8         9     ...     1994  1995      1996      1997  \
0  0.998209  0.513714  0.571585  ... -0.01581   0.0  0.535305  0.563219   

       1998  1999      2000      2001      2002  2003  
0  0.010284   0.0  0.540473  0.558524  0.010671   0.0  

[1 rows x 2004 columns]




Sad [0.   0.22 0.01 0.07 0.   0.62 0.   0.07 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.22 0.01 0.07 0.   0.62 0.   0.07 0.01]
       0         1         2         3        4         5         6     \
0  0.469881  0.647215 -1.481682  0.999397  0.49543  0.570738 -1.425318   

       7         8         9     ...      1994  1995      1996      1997  \
0  0.998367  0.515966  0.569822  ... -0.014064   0.0  0.539767  0.564855   

       1998  1999      2000      2001      2002  2003  
0  0.013434   0.0  0.544866  0.560311  0.013985   0.0  

[1 rows x 2004 columns]




Sad [0.   0.23 0.01 0.06 0.   0.62 0.   0.07 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.23 0.01 0.06 0.   0.62 0.   0.07 0.01]
       0         1         2         3         4         5         6     \
0  0.473248  0.648085 -1.519652  0.999442  0.497229  0.571187 -1.475717   

       7        8         9     ...      1994  1995      1996      1997  \
0  0.998495  0.51747  0.570151  ... -0.015287   0.0  0.542629  0.565807   

       1998  1999      2000      2001     2002  2003  
0  0.012821   0.0  0.547611  0.561168  0.01342   0.0  

[1 rows x 2004 columns]




Sad [0.   0.22 0.01 0.06 0.   0.63 0.   0.07 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.22 0.01 0.06 0.   0.63 0.   0.07 0.01]
       0         1         2         3         4         5         6     \
0  0.475917  0.649261 -1.602066  0.999488  0.499146  0.571894 -1.562698   

       7         8         9     ...      1994  1995    1996      1997  \
0  0.998622  0.519118  0.570738  ... -0.014744   0.0  0.5431  0.566956   

       1998  1999      2000      2001      2002  2003  
0  0.013596   0.0  0.547999  0.562498  0.014225   0.0  

[1 rows x 2004 columns]
Sad [0.   0.21 0.01 0.08 0.   0.62 0.   0.07 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.21 0.01 0.08 0.   0.62 0.   0.07 0.01]
       0         1         2         3         4         5         6     \
0  0.478586  0.649084 -1.582328  0.999526  0.502263  0.571575 -1.539471   

       7         8         9     ...      1994  1995      1996      1997  \
0  0.998731  0.522692  0.570445  ... -0.011525  



Sad [0.   0.23 0.01 0.08 0.   0.6  0.   0.07 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.23 0.01 0.08 0.   0.6  0.   0.07 0.01]
      0         1         2         3         4         5         6     \
0  0.48387  0.649873 -1.553116  0.999565  0.508193  0.571984 -1.497565   

       7         8         9     ...      1994  1995     1996      1997  \
0  0.998853  0.528368  0.570623  ... -0.012079   0.0  0.54265  0.569419   

       1998  1999      2000      2001      2002  2003  
0  0.018682   0.0  0.547214  0.564378  0.019564   0.0  

[1 rows x 2004 columns]




Sad [0.   0.2  0.01 0.09 0.   0.65 0.   0.04 0.01]
Predicted Class: Sad
Predicted Probabilities: [0.   0.2  0.01 0.09 0.   0.65 0.   0.04 0.01]
       0         1         2         3         4        5         6     \
0  0.483108  0.649893 -1.658009  0.999595  0.507663  0.57199 -1.611645   

       7         8         9     ...      1994  1995      1996      1997  \
0  0.998933  0.527819  0.570566  ... -0.011642   0.0  0.545219  0.571212   

      1998  1999      2000      2001      2002  2003  
0  0.02044   0.0  0.549685  0.566436  0.021498   0.0  

[1 rows x 2004 columns]


In [24]:
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(353, 252)