In [None]:
!pip install mediapipe

# 1. Import

In [1]:
import cv2
import numpy as np
import os
from matplotlib import pyplot as plt
import time
import mediapipe as mp

# 2. Keypoints using Mediapipe Holistic

In [2]:
# MediaPipe solution handles shared by every capture cell in this notebook.
mp_hands = mp.solutions.hands
mp_pose = mp.solutions.pose
mp_holistic = mp.solutions.holistic  # needed by the collection / conversion cells
mp_drawing = mp.solutions.drawing_utils # drawing utils
mp_drawing_styles = mp.solutions.drawing_styles


def mediapipe_detection(image, model):
    """Run a MediaPipe model on one BGR frame.

    Args:
        image: BGR frame as returned by ``cv2.VideoCapture.read``.
        model: any MediaPipe solution object exposing ``process``.

    Returns:
        ``(image, results)`` where ``image`` is a writeable BGR copy of the
        frame and ``results`` is whatever ``model.process`` returned.
    """
    rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    rgb.flags.writeable = False  # lets MediaPipe take the buffer by reference
    results = model.process(rgb)
    rgb.flags.writeable = True
    return cv2.cvtColor(rgb, cv2.COLOR_RGB2BGR), results


def draw_styled_landmarks(image, results):
    """Draw pose and both hand skeletons from Holistic ``results`` onto ``image`` in place.

    Groups that were not detected are skipped.
    """
    if results.pose_landmarks:
        mp_drawing.draw_landmarks(
            image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
            landmark_drawing_spec=mp_drawing_styles.get_default_pose_landmarks_style())
    for hand_landmarks in (results.left_hand_landmarks, results.right_hand_landmarks):
        if hand_landmarks:
            mp_drawing.draw_landmarks(
                image, hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                mp_drawing_styles.get_default_hand_landmarks_style(),
                mp_drawing_styles.get_default_hand_connections_style())

In [8]:
# Live preview: run MediaPipe Hands + Pose on the webcam, draw the landmarks and
# build the 258-value keypoint vector (pose 33*4 + two hands 21*3 each).
cap = cv2.VideoCapture(0)
try:
    with mp_hands.Hands(model_complexity=0,min_detection_confidence=0.5,min_tracking_confidence=0.5) as hands:
        with mp_pose.Pose(min_detection_confidence=0.5,min_tracking_confidence=0.5) as pose:
            while cap.isOpened():
                success, image = cap.read()

                if not success:
                    print("Ignoring empty camera frame.")
                    # If loading a video, use 'break' instead of 'continue'.
                    continue

                # To improve performance, optionally mark the image as not writeable to
                # pass by reference.
                image.flags.writeable = False
                image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
                results = hands.process(image)
                results_pose = pose.process(image)

                # Back to writeable BGR so OpenCV can draw on and display the frame.
                image.flags.writeable = True
                image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

                # One flattened (x, y, z) vector per detected hand, in detection order.
                hand_np = []
                for hand_landmarks in results.multi_hand_landmarks or []:
                    mp_drawing.draw_landmarks(image,hand_landmarks,mp_hands.HAND_CONNECTIONS,mp_drawing_styles.get_default_hand_landmarks_style(),mp_drawing_styles.get_default_hand_connections_style())
                    hand_np.append(np.array([[res.x, res.y, res.z] for res in hand_landmarks.landmark]).flatten())

                # Zero-fill missing hands; the first detection fills the "left" slot
                # and the second the "right" slot.
                hand_np = (hand_np + [np.zeros(21*3), np.zeros(21*3)])[:2]
                lh, rh = hand_np

                # Draw pose annotations
                mp_drawing.draw_landmarks(image,results_pose.pose_landmarks,mp_pose.POSE_CONNECTIONS,landmark_drawing_spec=mp_drawing_styles.get_default_pose_landmarks_style())

                ps = np.array([[res.x, res.y, res.z, res.visibility] for res in results_pose.pose_landmarks.landmark]).flatten() if results_pose.pose_landmarks else np.zeros(33*4)

                extracted_keypoints = np.concatenate([ps, lh, rh])
                print("EXTRACTED_KEYPOINTS: ")
                print(len(extracted_keypoints))

                # Flip the image horizontally for a selfie-view display.
                cv2.imshow('MediaPipe Result', cv2.flip(image, 1))
                if cv2.waitKey(10) & 0xFF == ord('q'):
                    break
finally:
    # Always free the camera and close windows, even if a frame raised.
    # destroyAllWindows lives on the cv2 module, not on VideoCapture.
    cap.release()
    cv2.destroyAllWindows()

EXTRACTED_KEYPOINTS: 
258


error: OpenCV(4.6.0) D:\a\opencv-python\opencv-python\opencv\modules\highgui\src\window.cpp:1267: error: (-2:Unspecified error) The function is not implemented. Rebuild the library with Windows, GTK+ 2.x or Cocoa support. If you are on Ubuntu or Debian, install libgtk2.0-dev and pkg-config, then re-run cmake or configure script in function 'cvShowImage'


# 3. Extract Keypoints Values

In [3]:
def extract_keypoints(results):
    """Flatten Holistic landmarks into one 1-D feature vector.

    The vector is laid out as pose (33 x [x, y, z, visibility]), face
    (468 x [x, y, z]), left hand (21 x [x, y, z]) and right hand
    (21 x [x, y, z]). A group that is missing from ``results`` is replaced
    by zeros of the matching length.
    """
    def _flatten(group, zero_len, with_visibility=False):
        # Missing (falsy) group -> zero block of the expected size.
        if not group:
            return np.zeros(zero_len)
        if with_visibility:
            rows = [[pt.x, pt.y, pt.z, pt.visibility] for pt in group.landmark]
        else:
            rows = [[pt.x, pt.y, pt.z] for pt in group.landmark]
        return np.array(rows).flatten()

    parts = [
        _flatten(results.pose_landmarks, 33*4, with_visibility=True),
        _flatten(results.face_landmarks, 468*3),
        _flatten(results.left_hand_landmarks, 21*3),
        _flatten(results.right_hand_landmarks, 21*3),
    ]
    return np.concatenate(parts)

# 4. Setup Folders for Manual Collection

In [4]:
# Root folder that receives the exported keypoint arrays (.npy files)
DATA_PATH = 'MP_Data_m_noface'

# Sign labels the classifier is trained to recognise; list order defines the class index.
# NOTE(review): the recorded outputs in this notebook show 16 classes, but this
# list currently holds 13 entries - confirm which labels are missing.
actions = [
    'can', 'you', 'help', 'me', 'what', 'name',
    'hamburger', 'french fries', 'thanks', 'bye',
    'hello', 'excuse me', 'sorry',
]

In [5]:
# Number of recorded clips (sequences) per action
no_sequences = 30

# Number of frames kept from every clip
sequence_length = 30

In [6]:
# Number of sign classes currently listed in `actions`.
len(actions)

16

In [19]:
# Write the action labels to actions_list.npy in the current working directory.
np.save('actions_list.npy',actions)

In [13]:
# Create the dataset root and one sub-folder per action. The root comes from
# DATA_PATH so the location is defined in exactly one place.
os.makedirs(DATA_PATH, exist_ok=True)
for action in actions:
    os.makedirs(os.path.join(DATA_PATH, action), exist_ok=True)

In [14]:
# One folder per (action, sequence); sequences are numbered 1..no_sequences.
# exist_ok=True tolerates re-runs while still surfacing real failures
# (permissions, invalid names) that a bare `except: pass` would hide.
for action in actions:
    for sequence in range(1, no_sequences+1):
        os.makedirs(os.path.join(DATA_PATH, action, str(sequence)), exist_ok=True)

# 5. Manual Data Collection

In [18]:
# Record `no_sequences` clips of `sequence_length` frames for every action and
# store one keypoint vector per frame under DATA_PATH/<action>/<sequence>/<frame>.npy.
cap = cv2.VideoCapture(0)
stop_requested = False  # set by 'q' or by a failed camera read; unwinds every loop
try:
    # Set mediapipe model
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:

        # Loop through actions
        for action in actions:
            if stop_requested:
                break

            # Announce the next sign and pause for up to 30 seconds (any key skips the wait).
            ret, frame = cap.read()
            if ret:
                cv2.putText(frame, 'Moving on to the next sign: {}, you have 30 seconds to learn the next sign'.format(action), (15,12),
                           cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 1, cv2.LINE_AA)
                # Show to screen
                cv2.imshow('OpenCV Feed', frame)
                cv2.waitKey(30000)

            # Loop through sequences aka videos
            for sequence in range(1,no_sequences+1):
                if stop_requested:
                    break

                # Loop through video length aka sequence length
                for frame_num in range(sequence_length):

                    # Read feed
                    ret, frame = cap.read()
                    if not ret:
                        # Without a frame there is nothing to detect or save.
                        print('Camera returned no frame; stopping collection.')
                        stop_requested = True
                        break

                    # Make detections
                    image, results = mediapipe_detection(frame, holistic)

                    # Draw landmarks
                    draw_styled_landmarks(image, results)

                    # First frame of a clip gets a banner and a short pause so
                    # the signer can get into position.
                    if frame_num == 0:
                        cv2.putText(image, 'STARTING COLLECTION', (120,200),
                                   cv2.FONT_HERSHEY_SIMPLEX, 1, (0,255, 0), 4, cv2.LINE_AA)
                    cv2.putText(image, 'Collecting frames for {} Video Number {}'.format(action, sequence), (15,12),
                               cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 255), 1, cv2.LINE_AA)
                    # Show to screen
                    cv2.imshow('OpenCV Feed', image)
                    if frame_num == 0:
                        cv2.waitKey(500)

                    # Export keypoints
                    keypoints = extract_keypoints(results)
                    npy_path = os.path.join(DATA_PATH, action, str(sequence), str(frame_num))
                    np.save(npy_path, keypoints)

                    # Break gracefully: leave all three loops, not just this one.
                    if cv2.waitKey(10) & 0xFF == ord('q'):
                        stop_requested = True
                        break
finally:
    # Single cleanup point, reached on normal completion, 'q', or an exception.
    cap.release()
    cv2.destroyAllWindows()

# 6. Use downloaded Dataset

In [None]:
# Project root that holds the downloaded MS-ASL clips. Set the ASLTOENG_ROOT
# environment variable to relocate it; the default is the original machine path.
root = os.environ.get('ASLTOENG_ROOT', 'C:\\Users\\ryanr\\ASLtoEng\\')
MP_DATA_PATH = os.path.join(root,'MP_Data_MSASL')

In [None]:
# Convert every .mp4 under MP_DATA_PATH/<label>/ into a folder of per-frame
# keypoint arrays: MP_DATA_PATH/<label>/<video name>/<frame index>.npy
for label in os.listdir(MP_DATA_PATH):
    LABEL_PATH = os.path.join(MP_DATA_PATH,label)
    for filename in os.listdir(LABEL_PATH):
        if not filename.endswith('.mp4'):
            continue
        print(f'Reading {filename}...')

        # splitext strips only the final extension, so names containing extra
        # dots keep their full stem instead of collapsing into one folder.
        video_name = os.path.splitext(filename)[0]
        VIDEO_PATH = os.path.join(LABEL_PATH,filename)
        VIDEO_FOLDER_PATH = os.path.join(LABEL_PATH,video_name)
        os.makedirs(VIDEO_FOLDER_PATH,exist_ok=True)

        # Capture video
        vidcap = cv2.VideoCapture(VIDEO_PATH)
        try:
            # Set mediapipe model (a fresh instance per video)
            with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:

                # Read feed
                success, frame = vidcap.read()
                frame_num = 0

                while success:
                    # Make detections
                    image, results = mediapipe_detection(frame, holistic)

                    # Export keypoints
                    keypoints = extract_keypoints(results)
                    npy_path = os.path.join(VIDEO_FOLDER_PATH, str(frame_num))
                    np.save(npy_path, keypoints)

                    success,frame = vidcap.read()
                    frame_num += 1

                    # Break gracefully
                    if cv2.waitKey(10) & 0xFF == ord('q'):
                        break

                print('Converted.')
        finally:
            # close the video, including when a frame raised
            vidcap.release()

        # Break gracefully
        if cv2.waitKey(10) & 0xFF == ord('q'):
            break

cv2.destroyAllWindows()

In [None]:
import shutil

In [None]:
# Delete the source .mp4 files once their keypoints have been exported.
for label in os.listdir(MP_DATA_PATH):
    label_dir = os.path.join(MP_DATA_PATH, label)
    video_names = [entry for entry in os.listdir(label_dir) if entry.endswith('.mp4')]
    for video_name in video_names:
        print(f'Deleting {video_name}...')
        os.remove(os.path.join(label_dir, video_name))

In [None]:
# Spot check: print the first stored array of every converted video folder.
for label in os.listdir(MP_DATA_PATH):
    label_dir = os.path.join(MP_DATA_PATH, label)
    for entry in os.listdir(label_dir):
        if entry.endswith('.mp4'):
            continue
        frame_files = os.listdir(os.path.join(label_dir, entry))
        if frame_files:
            # Only the first listed file is inspected per folder.
            print(np.load(os.path.join(label_dir, entry, frame_files[0])))

# 6.* Preprocess Data and Create Labels and Features

In [6]:
from sklearn.model_selection import train_test_split
from tensorflow.keras.utils import to_categorical

In [None]:
# Map every action label to its integer class index (its position in `actions`).
label_map = dict(zip(actions, range(len(actions))))
print(label_map)

In [None]:
# Build one fixed-length window of keypoint vectors per recorded sequence.
# Each stored frame holds 1662 values (pose 132 + face 1404 + hands 126); the
# face block [132:1536] is dropped, leaving 258 features per frame.
sequences, labels = [], []
for action in label_map.keys():
    action_dir = os.path.join(DATA_PATH, action)
    for sequence in os.listdir(action_dir):
        sequence_dir = os.path.join(action_dir, sequence)
        if not os.path.isdir(sequence_dir):
            continue  # ignore stray files next to the sequence folders

        window = []
        # Zero vector is the fallback only when the very first frame is missing;
        # afterwards `res` always holds the most recent frame that exists.
        res = np.zeros((1662,), dtype='float64')
        for frame_num in range(sequence_length):
            frame_path = os.path.join(sequence_dir, "{}.npy".format(frame_num))
            if os.path.exists(frame_path):
                res = np.load(frame_path)
            # else: last-frame padding - reuse the previous `res` unchanged
            window.append(np.concatenate([res[0:132],res[1536:]])) # skip face landmarks
        sequences.append(window)
        labels.append(label_map[action])

In [13]:
# Stack all windows into one array; the recorded run shows shape
# (480, 30, 258), i.e. (sequences, frames, features).
X = np.array(sequences)

In [14]:
# Quick shape check of the feature tensor.
X.shape

(480, 30, 258)

In [None]:
# Cache the feature tensor; np.save does not create missing parent folders.
os.makedirs('cached_data', exist_ok=True)
np.save('cached_data/X_data_m_noface',X)

In [15]:
# One-hot encode the integer labels, one column per entry in `actions`.
y = to_categorical(labels,num_classes=len(actions)).astype(int)

In [None]:
# Cache the one-hot labels; np.save does not create missing parent folders.
os.makedirs('cached_data', exist_ok=True)
np.save('cached_data/y_data_m_noface',y)

In [16]:
# Quick shape check of the one-hot label matrix.
y.shape

(480, 16)

In [17]:
# Hold out 10% for testing, stratified so every class keeps the same share.
# random_state pins the shuffle so a Restart & Run All reproduces the same split.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.1, stratify=y, random_state=42)

In [18]:
# Training samples per class (column sums of the one-hot matrix).
y_train.sum(axis=0)

array([27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27, 27])

# 7. Build and Train LSTM Neural Network

In [19]:
import tensorflow
from tensorflow.keras.models import Sequential
from tensorflow.keras.optimizers import SGD, Adam
from tensorflow.keras.layers import LSTM, Dense, Dropout
from tensorflow.keras.callbacks import TensorBoard
from tensorflow.keras.callbacks import ModelCheckpoint

In [20]:
# TensorBoard event files for this experiment are written below this folder.
log_dir = 'Logs/data_m_noface'
tb_callback = TensorBoard(log_dir=log_dir)

In [21]:
# Weights-only checkpoints; the {epoch:04d} placeholder is left for Keras to fill in.
checkpoint_dir = os.path.join("Logs", "data_m_noface", 'checkpoints')
checkpoint_path = os.path.join(checkpoint_dir, 'cp-{epoch:04d}.ckpt')
cp_callback = ModelCheckpoint(
    filepath=checkpoint_path,
    verbose=1,
    save_weights_only=True,
    save_freq=50*14,  # an integer save_freq is counted in batches, not epochs
)

In [None]:
# Three stacked LSTM layers over the keypoint sequence, followed by a small
# dense head that ends in a softmax over the action labels.
model = Sequential([
    LSTM(16, return_sequences=True, activation='relu', input_shape=(sequence_length,258)),
    LSTM(32, return_sequences=True, activation='relu'),
    LSTM(16, return_sequences=False, activation='relu'),  # emits only the final timestep
    Dense(16, activation='relu'),
    Dense(32, activation='relu'),
    Dense(len(actions), activation='softmax'),
])

In [24]:
# Optimizer choice. Alternatives tried earlier are kept for reference:
# opt = SGD(learning_rate=0.01,momentum=0.9)
# opt = Adam(learning_rate=0.0001)
# The string form selects Adam with Keras' default hyper-parameters.
opt = 'Adam'

In [25]:
# Multi-class setup: one-hot targets, so categorical cross-entropy and categorical accuracy.
model.compile(optimizer=opt, loss='categorical_crossentropy', metrics=['categorical_accuracy'])

In [31]:
# Restore weights from a previously written checkpoint.
# NOTE(review): the path is hard-coded and this cell's execution count (31) is
# later than the fit cell's (26) - it appears to have been run after training; confirm
# the intended order before a Restart & Run All.
model.load_weights('Logs/data_m_noface/checkpoints/cp-0292.ckpt')

<tensorflow.python.training.tracking.util.CheckpointLoadStatus at 0x2759b01d6f0>

In [26]:
# Train with both callbacks: TensorBoard logging (tb_callback was created above
# but never attached) and periodic weight checkpoints.
model.fit(X_train, y_train, epochs=2000, callbacks=[tb_callback, cp_callback])

Epoch 1/2000
Epoch 2/2000
Epoch 3/2000
Epoch 4/2000
Epoch 5/2000
Epoch 6/2000
Epoch 7/2000
Epoch 8/2000
Epoch 9/2000
Epoch 10/2000
Epoch 11/2000
Epoch 12/2000
Epoch 13/2000
Epoch 14/2000
Epoch 15/2000
Epoch 16/2000
Epoch 17/2000
Epoch 18/2000
Epoch 19/2000
Epoch 20/2000
Epoch 21/2000
Epoch 22/2000
Epoch 23/2000
Epoch 24/2000
Epoch 25/2000
Epoch 26/2000
Epoch 27/2000
Epoch 28/2000
Epoch 29/2000
Epoch 30/2000
Epoch 31/2000
Epoch 32/2000
Epoch 33/2000
Epoch 34/2000
Epoch 35/2000
Epoch 36/2000
Epoch 37/2000
Epoch 38/2000
Epoch 39/2000
Epoch 40/2000
Epoch 41/2000
Epoch 42/2000
Epoch 43/2000
Epoch 44/2000
Epoch 45/2000
Epoch 46/2000
Epoch 47/2000
Epoch 47: saving model to Logs\data_m_noface\checkpoints\cp-0047.ckpt
Epoch 48/2000
Epoch 49/2000
Epoch 50/2000
Epoch 51/2000
Epoch 52/2000
Epoch 53/2000
Epoch 54/2000
Epoch 55/2000
Epoch 56/2000
Epoch 57/2000
Epoch 58/2000
Epoch 59/2000
Epoch 60/2000
Epoch 61/2000
Epoch 62/2000
Epoch 63/2000
Epoch 64/2000
Epoch 65/2000
Epoch 66/2000
Epoch 67/2000
E

Epoch 140/2000
 3/14 [=====>........................] - ETA: 2s - loss: 0.5531 - categorical_accuracy: 0.7292
Epoch 140: saving model to Logs\data_m_noface\checkpoints\cp-0140.ckpt
Epoch 141/2000
Epoch 142/2000
Epoch 143/2000
Epoch 144/2000
Epoch 145/2000
Epoch 146/2000
Epoch 147/2000
Epoch 148/2000
Epoch 149/2000
Epoch 150/2000
Epoch 151/2000
Epoch 152/2000
Epoch 153/2000
Epoch 154/2000
Epoch 155/2000
Epoch 156/2000
Epoch 157/2000
Epoch 158/2000
Epoch 159/2000
Epoch 160/2000
Epoch 161/2000
Epoch 162/2000
Epoch 163/2000
Epoch 164/2000
Epoch 165/2000
Epoch 166/2000
Epoch 167/2000
Epoch 168/2000
Epoch 169/2000
Epoch 170/2000
Epoch 171/2000
Epoch 172/2000
Epoch 173/2000
Epoch 174/2000
Epoch 175/2000
Epoch 176/2000
Epoch 177/2000
Epoch 178/2000
Epoch 179/2000
Epoch 180/2000
Epoch 181/2000
Epoch 182/2000
Epoch 183/2000
Epoch 184/2000
Epoch 185/2000
Epoch 186/2000
Epoch 186: saving model to Logs\data_m_noface\checkpoints\cp-0186.ckpt
Epoch 187/2000
Epoch 188/2000
Epoch 189/2000
Epoch 190/200

Epoch 276/2000
Epoch 277/2000
Epoch 278/2000
Epoch 279/2000
Epoch 279: saving model to Logs\data_m_noface\checkpoints\cp-0279.ckpt
Epoch 280/2000
Epoch 281/2000
Epoch 282/2000
Epoch 283/2000
Epoch 284/2000
Epoch 285/2000
Epoch 286/2000
Epoch 287/2000
Epoch 288/2000
Epoch 289/2000
Epoch 290/2000
Epoch 291/2000
Epoch 292/2000
Epoch 293/2000
Epoch 294/2000
Epoch 295/2000
Epoch 296/2000
Epoch 297/2000
Epoch 298/2000
Epoch 299/2000
Epoch 300/2000
Epoch 301/2000
Epoch 302/2000
Epoch 303/2000
Epoch 304/2000
Epoch 305/2000
Epoch 306/2000
Epoch 307/2000
Epoch 308/2000
Epoch 309/2000
Epoch 310/2000
Epoch 311/2000
Epoch 312/2000
Epoch 313/2000
Epoch 314/2000
Epoch 315/2000
Epoch 316/2000
Epoch 317/2000
Epoch 318/2000
Epoch 319/2000
Epoch 320/2000
Epoch 321/2000
Epoch 322/2000
Epoch 323/2000
Epoch 324/2000
Epoch 325/2000
Epoch 325: saving model to Logs\data_m_noface\checkpoints\cp-0325.ckpt
Epoch 326/2000
Epoch 327/2000
Epoch 328/2000
Epoch 329/2000
Epoch 330/2000
Epoch 331/2000
Epoch 332/2000
Epo

Epoch 412/2000
Epoch 413/2000
Epoch 414/2000
Epoch 415/2000
Epoch 416/2000
Epoch 417/2000
Epoch 418/2000
Epoch 418: saving model to Logs\data_m_noface\checkpoints\cp-0418.ckpt
Epoch 419/2000
Epoch 420/2000
Epoch 421/2000
Epoch 422/2000
Epoch 423/2000
Epoch 424/2000
Epoch 425/2000
Epoch 426/2000
Epoch 427/2000
Epoch 428/2000
Epoch 429/2000
Epoch 430/2000
Epoch 431/2000
Epoch 432/2000
Epoch 433/2000
Epoch 434/2000
Epoch 435/2000
Epoch 436/2000
Epoch 437/2000
Epoch 438/2000
Epoch 439/2000
Epoch 440/2000
Epoch 441/2000
Epoch 442/2000
Epoch 443/2000
Epoch 444/2000
Epoch 445/2000
Epoch 446/2000
Epoch 447/2000
Epoch 448/2000
Epoch 449/2000
Epoch 450/2000
Epoch 451/2000
Epoch 452/2000
Epoch 453/2000
Epoch 454/2000
Epoch 455/2000
Epoch 456/2000
Epoch 457/2000
Epoch 458/2000
Epoch 459/2000
Epoch 460/2000
Epoch 461/2000
Epoch 462/2000
Epoch 463/2000
Epoch 464/2000
Epoch 465/2000
 3/14 [=====>........................] - ETA: 2s - loss: 0.0019 - categorical_accuracy: 1.0000
Epoch 465: saving model 

Epoch 546/2000
Epoch 547/2000
Epoch 548/2000
Epoch 549/2000
Epoch 550/2000
Epoch 551/2000
Epoch 552/2000
Epoch 553/2000
Epoch 554/2000
Epoch 555/2000
Epoch 556/2000
Epoch 557/2000
Epoch 558/2000
 1/14 [=>............................] - ETA: 2s - loss: 3.6883e-04 - categorical_accuracy: 1.0000
Epoch 558: saving model to Logs\data_m_noface\checkpoints\cp-0558.ckpt
Epoch 559/2000
Epoch 560/2000
Epoch 561/2000
Epoch 562/2000
Epoch 563/2000
Epoch 564/2000
Epoch 565/2000
Epoch 566/2000
Epoch 567/2000
Epoch 568/2000
Epoch 569/2000
Epoch 570/2000
Epoch 571/2000
Epoch 572/2000
Epoch 573/2000
Epoch 574/2000
Epoch 575/2000
Epoch 576/2000
Epoch 577/2000
Epoch 578/2000
Epoch 579/2000
Epoch 580/2000
Epoch 581/2000
Epoch 582/2000
Epoch 583/2000
Epoch 584/2000
Epoch 585/2000
Epoch 586/2000
Epoch 587/2000
Epoch 588/2000
Epoch 589/2000
Epoch 590/2000
Epoch 591/2000
Epoch 592/2000
Epoch 593/2000
Epoch 594/2000
Epoch 595/2000
Epoch 596/2000

KeyboardInterrupt: 

In [None]:
# Print the layer-by-layer architecture and parameter counts.
model.summary()

# 8. Make Predictions

In [None]:
# Class probabilities for the held-out split: one row per test sample.
res = model.predict(X_test)
res.shape

In [None]:
# Predicted label for test sample 2.
actions[np.argmax(res[2])]

In [None]:
# Ground-truth label for test sample 2, for comparison with the prediction.
actions[np.argmax(y_test[2])]

# 9. Save Weights

In [None]:
# Save the full model in HDF5 format; the target folder must exist beforehand.
os.makedirs('weights', exist_ok=True)
model.save('weights/data_m_noface.h5')

In [None]:
# Export the architecture as JSON to model.json in the working directory.
model_json = model.to_json()
with open("model.json", "w") as json_file:
    json_file.write(model_json)

In [None]:
# Drop the in-memory model and rebuild it from the HDF5 file saved above.
# A bare `del model` left the following export / load_weights / predict cells
# failing with NameError; reloading also verifies that the saved file is usable.
del model
model = tensorflow.keras.models.load_model('weights/data_m_noface.h5')

In [None]:
# Export the Keras model (architecture + weights) in TensorFlow SavedModel format to saved_model/1.
tensorflow.saved_model.save(model,'saved_model/1')
# To convert the SavedModel to ONNX for deployment, run:
#   !python -m tf2onnx.convert --saved-model C:\Users\ryanr\ASLtoEng\saved_model\1 --output model.onnx

In [None]:
# Load weights from the HDF5 file written by the model.save cell above.
model.load_weights('weights/data_m_noface.h5')

# 10. Evaluation using Confusion Matrix and Accuracy

In [None]:
from sklearn.metrics import multilabel_confusion_matrix, accuracy_score

In [None]:
# Class probabilities for the test split (converted to class indices in the next cell).
yhat = model.predict(X_test)

In [None]:
# Collapse one-hot targets and predicted probabilities to class-index lists.
# `yhat` is rebound here, so re-run the predict cell before running this one again.
ytrue = np.argmax(y_test, axis=1).tolist()
yhat = np.argmax(yhat, axis=1).tolist()

In [None]:
# One 2x2 (one-vs-rest) confusion matrix per class.
multilabel_confusion_matrix(ytrue, yhat)

In [None]:
# Fraction of test sequences whose predicted class matches the true class.
accuracy_score(ytrue, yhat)

# 11. Test in Real Time

In [None]:
from scipy import stats

In [25]:
colors = [(245,117,16), (117,245,16), (16,117,245)]
def prob_viz(res, actions, input_frame, colors):
    """Overlay one horizontal probability bar per class on a copy of the frame.

    Args:
        res: 1-D sequence of class probabilities, aligned with ``actions``.
        actions: class labels drawn on top of the bars.
        input_frame: image to annotate; it is copied, not modified.
        colors: bar colours, cycled when there are more classes than colours.

    Returns:
        The annotated copy of ``input_frame``.
    """
    output_frame = input_frame.copy()
    for num, prob in enumerate(res):
        top = 60 + num*40  # each class gets a 40 px row starting at y=60
        # Bar length is the probability scaled to 0..100 px.
        cv2.rectangle(output_frame, (0, top), (int(prob*100), top + 30), colors[num % len(colors)], -1)
        cv2.putText(output_frame, actions[num], (0, top + 25), cv2.FONT_HERSHEY_SIMPLEX, 1, (255,255,255), 2, cv2.LINE_AA)

    return output_frame

In [None]:
# Preview the probability overlay on the most recent captured frame.
# prob_viz needs a single probability vector, so take the first row when `res`
# is the 2-D batch returned by model.predict(X_test). OpenCV frames are BGR
# while matplotlib expects RGB, hence the colour conversion.
plt.figure(figsize=(18,18))
plt.imshow(cv2.cvtColor(prob_viz(np.atleast_2d(res)[0], actions, image, colors), cv2.COLOR_BGR2RGB))

In [None]:
# 1. New detection variables
sequence = []      # rolling window of the latest keypoint vectors
sentence = []      # recognised signs shown in the banner (last 4 kept)
predictions = []   # recent predicted class indices, used for the stability check
threshold = 0.5    # minimum probability for a prediction to be accepted

cap = cv2.VideoCapture(1)
try:
    # Set mediapipe models. This loop uses Hands + Pose, so both are opened here;
    # the instances from the earlier demo cell are already closed.
    # NOTE(review): the collected training data took left/right hands from
    # Holistic, whereas here the first/second Hands detection fills the
    # left/right slots - confirm the two layouts agree.
    with mp_hands.Hands(model_complexity=0,min_detection_confidence=0.5,min_tracking_confidence=0.5) as hands:
        with mp_pose.Pose(min_detection_confidence=0.5,min_tracking_confidence=0.5) as pose:
            while cap.isOpened():

                # Read feed
                ret, frame = cap.read()
                if not ret:
                    print("Ignoring empty camera frame.")
                    continue

                # To improve performance, optionally mark the image as not writeable to
                # pass by reference.
                image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                image.flags.writeable = False
                results = hands.process(image)
                results_pose = pose.process(image)

                # Back to writeable BGR for drawing and display.
                image.flags.writeable = True
                image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

                # One flattened (x, y, z) vector per detected hand, in detection order.
                hand_np = []
                for hand_landmarks in results.multi_hand_landmarks or []:
                    mp_drawing.draw_landmarks(image,hand_landmarks,mp_hands.HAND_CONNECTIONS,mp_drawing_styles.get_default_hand_landmarks_style(),mp_drawing_styles.get_default_hand_connections_style())
                    hand_np.append(np.array([[res.x, res.y, res.z] for res in hand_landmarks.landmark]).flatten())

                # Zero-fill missing hands and keep at most two.
                hand_np = (hand_np + [np.zeros(21*3), np.zeros(21*3)])[:2]
                lh, rh = hand_np

                # Draw pose annotations
                mp_drawing.draw_landmarks(image,results_pose.pose_landmarks,mp_pose.POSE_CONNECTIONS,landmark_drawing_spec=mp_drawing_styles.get_default_pose_landmarks_style())

                ps = np.array([[res.x, res.y, res.z, res.visibility] for res in results_pose.pose_landmarks.landmark]).flatten() if results_pose.pose_landmarks else np.zeros(33*4)

                # 2. Prediction logic: classify once the window is full.
                keypoints = np.concatenate([ps, lh, rh])
                sequence.append(keypoints)
                sequence = sequence[-sequence_length:]

                if len(sequence) == sequence_length:
                    res = model.predict(np.expand_dims(sequence, axis=0))[0]
                    best = int(np.argmax(res))
                    print(actions[best])
                    predictions.append(best)
                    predictions = predictions[-10:]  # only the last 10 are ever inspected

                    #3. Viz logic: accept a sign only when the recent predictions
                    # all agree and the winning probability clears the threshold.
                    if len(np.unique(predictions)) == 1 and res[best] > threshold:
                        if not sentence or actions[best] != sentence[-1]:
                            sentence.append(actions[best])

                    if len(sentence) > 4:
                        sentence = sentence[-4:]

                    # Viz probabilities
                    image = prob_viz(res, actions, image, colors)

                cv2.rectangle(image, (0,0), (640, 40), (245, 117, 16), -1)
                cv2.putText(image, ' '.join(sentence), (3,30),
                               cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Show to screen
                cv2.imshow('OpenCV Feed', image)

                # Break gracefully
                if cv2.waitKey(10) & 0xFF == ord('q'):
                    break
finally:
    # Release the camera and close windows on every exit path.
    cap.release()
    cv2.destroyAllWindows()