In [1]:
import mediapipe as mp # Import mediapipe
import cv2 # Import opencv
from sklearn.metrics import accuracy_score # Accuracy metrics 
import pickle 
import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.pipeline import make_pipeline 
from sklearn.preprocessing import StandardScaler 

from sklearn.linear_model import LogisticRegression, RidgeClassifier
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [2]:
mp_drawing = mp.solutions.drawing_utils # Drawing helpers
mp_holistic = mp.solutions.holistic # Mediapipe Solutions
mp_drawing_styles = mp.solutions.drawing_styles
mp_hands = mp.solutions.hands

In [25]:
cap = cv2.VideoCapture(0)
# Initiate holistic model

with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)

        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        

        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )


                        
        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()

In [26]:
results.right_hand_landmarks

landmark {
  x: 0.14437124133110046
  y: 0.9566307663917542
  z: 9.408352639184159e-07
}
landmark {
  x: 0.11672013998031616
  y: 0.8380743861198425
  z: 0.006609819829463959
}
landmark {
  x: 0.1402462124824524
  y: 0.7217616438865662
  z: -0.011087841354310513
}
landmark {
  x: 0.20241068303585052
  y: 0.6511917114257812
  z: -0.03206909820437431
}
landmark {
  x: 0.25792068243026733
  y: 0.6181348562240601
  z: -0.05177158862352371
}
landmark {
  x: 0.10470138490200043
  y: 0.6677518486976624
  z: -0.057137418538331985
}
landmark {
  x: 0.136560320854187
  y: 0.5119690895080566
  z: -0.09196576476097107
}
landmark {
  x: 0.16239404678344727
  y: 0.42012715339660645
  z: -0.1099366769194603
}
landmark {
  x: 0.1856287717819214
  y: 0.3507571518421173
  z: -0.11938516795635223
}
landmark {
  x: 0.14840954542160034
  y: 0.6993244886398315
  z: -0.07913800328969955
}
landmark {
  x: 0.2165832817554474
  y: 0.538245439529419
  z: -0.11156529188156128
}
landmark {
  x: 0.2637627422809601


In [27]:
results

mediapipe.python.solution_base.SolutionOutputs

In [28]:
len(results.right_hand_landmarks.landmark)

21

In [29]:
num_coords = len(results.right_hand_landmarks.landmark)
num_coords

21

In [30]:
landmarks = ['class']
for val in range(1, num_coords+1):
    landmarks += ['x{}'.format(val), 'y{}'.format(val), 'z{}'.format(val), 'v{}'.format(val)]

In [31]:
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21']

In [10]:
import csv
with open('coords.csv', mode='w', newline='') as f:
    csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
    csv_writer.writerow(landmarks)

In [32]:
class_name = "good"

In [17]:
cap = cv2.VideoCapture(0)
# Initiate holistic model

with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)

        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        

        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS 
                                 
                              #   mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                               #  mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS 
                              #   mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                               #  mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )


        try:
            # Extract Pose landmarks
            hand = results.right_hand_landmarks.landmark
            hand_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in hand]).flatten())
            
            
            # Concate rows
            row = hand_row
            
            # Append class name 
            row.insert(0, class_name)
            
            # Export to CSV
            with open('D:\ApplAi\Hand recognition\coords.csv', mode='a', newline='') as f:
                csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)
                csv_writer.writerow(row) 
            
        except:
            pass

        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()

In [4]:
df = pd.read_csv('D:\ApplAi\Hand recognition\coords.csv')

In [5]:
df[df['class']=='good']

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z19,v19,x20,y20,z20,v20,x21,y21,z21,v21
2282,good,0.249515,0.790073,-4.709165e-07,0.0,0.271229,0.663633,-0.018736,0.0,0.312935,...,-0.052019,0.0,0.451564,0.812190,-0.032942,0.0,0.422280,0.823076,-0.020912,0.0
2283,good,0.232836,0.816452,-5.047947e-07,0.0,0.264075,0.673375,-0.002723,0.0,0.313275,...,-0.047161,0.0,0.451986,0.813645,-0.025983,0.0,0.419992,0.826453,-0.013844,0.0
2284,good,0.233896,0.821059,-4.783585e-07,0.0,0.263487,0.675251,-0.006623,0.0,0.314060,...,-0.041395,0.0,0.451132,0.810017,-0.019613,0.0,0.420271,0.824618,-0.007135,0.0
2285,good,0.236112,0.819890,-4.805428e-07,0.0,0.268307,0.676613,-0.006903,0.0,0.317006,...,-0.043061,0.0,0.453575,0.816200,-0.021359,0.0,0.422065,0.828831,-0.008835,0.0
2286,good,0.236159,0.822350,-4.736905e-07,0.0,0.268447,0.677549,-0.005977,0.0,0.318047,...,-0.036911,0.0,0.452885,0.811910,-0.016052,0.0,0.422070,0.824780,-0.004091,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3324,good,0.258407,0.637694,-3.861919e-07,0.0,0.258411,0.519011,-0.004529,0.0,0.289474,...,-0.064764,0.0,0.478417,0.603240,-0.042876,0.0,0.444502,0.610140,-0.028364,0.0
3325,good,0.259524,0.640742,-3.891307e-07,0.0,0.258837,0.521410,-0.004217,0.0,0.290108,...,-0.058947,0.0,0.479706,0.602599,-0.038200,0.0,0.446094,0.607801,-0.024542,0.0
3326,good,0.259229,0.639149,-4.105003e-07,0.0,0.258203,0.520837,-0.006041,0.0,0.289679,...,-0.060652,0.0,0.478563,0.601662,-0.040086,0.0,0.445030,0.608660,-0.026707,0.0
3327,good,0.258980,0.637045,-4.070019e-07,0.0,0.258610,0.519651,-0.006352,0.0,0.289214,...,-0.062461,0.0,0.479807,0.601246,-0.041612,0.0,0.446166,0.607412,-0.027968,0.0


In [6]:
X = df.drop('class', axis=1) # features
y = df['class'] # target value

In [7]:
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=1234)

In [8]:
y_test

674        1
1084       1
3101    good
936        1
2635    good
        ... 
3049    good
2743    good
686        1
3109    good
1576       2
Name: class, Length: 999, dtype: object

In [10]:
pipelines = {
    'lr':make_pipeline(StandardScaler(), LogisticRegression()),
    'rc':make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf':make_pipeline(StandardScaler(), RandomForestClassifier())
}

In [11]:
fit_models = {}
for algo, pipeline in pipelines.items():
    model = pipeline.fit(X_train, y_train)
    fit_models[algo] = model

STOP: TOTAL NO. of ITERATIONS REACHED LIMIT.

Increase the number of iterations (max_iter) or scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression
  n_iter_i = _check_optimize_result(


In [12]:
fit_models

{'lr': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('logisticregression', LogisticRegression())]),
 'rc': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('ridgeclassifier', RidgeClassifier())]),
 'rf': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('randomforestclassifier', RandomForestClassifier())]),
 'gb': Pipeline(steps=[('standardscaler', StandardScaler()),
                 ('gradientboostingclassifier', GradientBoostingClassifier())])}

In [13]:
fit_models['rc'].predict(X_test)

array(['1', '1', 'good', '1', 'good', '2', 'good', '2', '1', '2', '2',
       '2', '2', 'good', '1', '2', 'good', '1', '1', '2', '1', 'good',
       '1', '1', 'good', '1', '2', '1', '1', 'good', '1', '2', '2', '1',
       '2', '1', '2', '2', 'good', '2', 'good', '2', '1', '1', '2', '1',
       '2', '2', '2', 'good', 'good', '1', '2', '2', '2', '1', 'good',
       '1', 'good', '2', '1', '2', '1', 'good', '2', '2', '1', '2',
       'good', '2', '2', '1', '1', '1', 'good', '1', '2', 'good', '1',
       '2', 'good', '1', 'good', '2', 'good', '1', 'good', '1', 'good',
       '1', '2', 'good', '2', '2', 'good', '1', '1', '1', 'good', '1',
       'good', 'good', '2', '1', '2', 'good', '1', '1', '2', '1', 'good',
       '1', 'good', 'good', 'good', '1', '1', '1', 'good', 'good', 'good',
       '1', '2', '2', 'good', '1', 'good', 'good', 'good', '1', '1', '1',
       'good', '1', '2', '2', '1', '2', '2', '2', 'good', 'good', '1',
       'good', 'good', '1', 'good', '2', '2', '2', '2', '1', 'goo

In [15]:
for algo, model in fit_models.items():
    yhat = model.predict(X_test)
    print(algo, accuracy_score(y_test, yhat))

lr 1.0
rc 0.997997997997998
rf 1.0
gb 0.998998998998999


In [16]:
fit_models['rf'].predict(X_test)

array(['1', '1', 'good', '1', 'good', '2', 'good', '2', '1', '2', '2',
       '2', '2', 'good', '1', '2', 'good', '1', '1', '2', '1', 'good',
       '1', '1', 'good', '1', '2', '1', '1', 'good', '1', '2', '2', '1',
       '2', '1', '2', '2', 'good', '1', 'good', '2', '1', '1', '2', '1',
       '2', '2', '2', 'good', 'good', '1', '2', '2', '2', '1', 'good',
       '1', 'good', '2', '1', '2', '1', 'good', '2', '2', '1', '1',
       'good', '2', '2', '1', '1', '1', 'good', '1', '2', 'good', '1',
       '2', 'good', '1', 'good', '2', 'good', '1', 'good', '1', 'good',
       '1', '2', 'good', '2', '2', 'good', '1', '1', '1', 'good', '1',
       'good', 'good', '2', '1', '2', 'good', '1', '1', '2', '1', 'good',
       '1', 'good', 'good', 'good', '1', '1', '1', 'good', 'good', 'good',
       '1', '2', '2', 'good', '1', 'good', 'good', 'good', '1', '1', '1',
       'good', '1', '2', '2', '1', '2', '2', '2', 'good', 'good', '1',
       'good', 'good', '1', 'good', '2', '2', '2', '2', '1', 'goo

In [17]:
y_test

674        1
1084       1
3101    good
936        1
2635    good
        ... 
3049    good
2743    good
686        1
3109    good
1576       2
Name: class, Length: 999, dtype: object

In [18]:
with open('handsign.pkl', 'wb') as f:
    pickle.dump(fit_models['rf'], f)

In [3]:
with open('handsign.pkl', 'rb') as f:
    model = pickle.load(f)

https://scikit-learn.org/stable/modules/model_persistence.html#security-maintainability-limitations
https://scikit-learn.org/stable/modules/model_persistence.html#security-maintainability-limitations
https://scikit-learn.org/stable/modules/model_persistence.html#security-maintainability-limitations
https://scikit-learn.org/stable/modules/model_persistence.html#security-maintainability-limitations


In [4]:
model

Pipeline(steps=[('standardscaler', StandardScaler()),
                ('randomforestclassifier',
                 RandomForestClassifier(max_features='sqrt'))])

In [5]:
cap = cv2.VideoCapture(0)
# Initiate holistic model

with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
    
    while cap.isOpened():
        ret, frame = cap.read()
        
        # Recolor Feed
        image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
        image.flags.writeable = False        
        
        # Make Detections
        results = holistic.process(image)
        image.flags.writeable = True   
        image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
        

        
        # 2. Right hand
        mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(80,22,10), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(80,44,121), thickness=2, circle_radius=2)
                                 )

        # 3. Left Hand
        mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS, 
                                 mp_drawing.DrawingSpec(color=(121,22,76), thickness=2, circle_radius=4),
                                 mp_drawing.DrawingSpec(color=(121,44,250), thickness=2, circle_radius=2)
                                 )


        try:
            # Extract Pose landmarks
            hand = results.right_hand_landmarks.landmark
            hand_row = list(np.array([[landmark.x, landmark.y, landmark.z, landmark.visibility] for landmark in hand]).flatten())
            
            
            # Concate rows
            row = hand_row

            X = pd.DataFrame([row])
            sign_class = model.predict(X)[0]
            sign_prop = model.predict_proba(X)[0]
            
           
            # Grab ear coords
            coords = tuple(np.multiply(
                            np.array(
                                (results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
                                 results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y))
                        , [640,480]).astype(int))
            
           
            
            # Display Class
            cv2.putText(image, 'CLASS'
                        , (95,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, sign_class.split(' ')[0]
                        , (90,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            # Display Probability
            cv2.putText(image, 'PROB'
                        , (15,12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
            cv2.putText(image, str(round(sign_prop[np.argmax(sign_prop)],2))
                        , (10,40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)
            
            
        except:
            pass

        cv2.imshow('Raw Webcam Feed', image)

        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cap.release()
cv2.destroyAllWindows()

KKKKKKKKKKKKKKKKKKKKKK




In [6]:
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(465, 321)