In [2]:
import cv2
import mediapipe as mp
import time

class HandDetector():
    """Convenience wrapper around the MediaPipe Hands solution.

    Typical use is to call :meth:`findHands` on every frame (which runs the
    model and optionally draws the hand skeleton) and then
    :meth:`findPosition` to obtain pixel coordinates of one hand's landmarks.
    """

    def __init__(self, mode=False, max_hands=2, modelComplexity=1, detection_confidence=0.5, tracking_confidence=0.5):
        """Create the underlying MediaPipe ``Hands`` object.

        Args:
            mode: Forwarded as ``static_image_mode``.
            max_hands: Forwarded as ``max_num_hands``.
            modelComplexity: Forwarded as ``model_complexity``.
            detection_confidence: Forwarded as ``min_detection_confidence``.
            tracking_confidence: Forwarded as ``min_tracking_confidence``.
        """
        self.mode = mode
        self.max_hands = max_hands
        self.modelComplex = modelComplexity
        self.detection_confidence = detection_confidence
        self.tracking_confidence = tracking_confidence
        self.mp_hands = mp.solutions.hands

        # Pass every option by keyword so a change in the positional order of
        # Hands() between MediaPipe releases cannot silently misassign values.
        self.hands = self.mp_hands.Hands(
            static_image_mode=self.mode,
            max_num_hands=self.max_hands,
            model_complexity=self.modelComplex,
            min_detection_confidence=self.detection_confidence,
            min_tracking_confidence=self.tracking_confidence,
        )

        # helper used to draw the landmarks and their connections
        self.mp_draw = mp.solutions.drawing_utils

        # Result of the most recent findHands() call; None until the first
        # frame is processed so findPosition() can be called safely first.
        self.results = None

    def findHands(self, image, draw=True):
        """Run hand detection on a BGR frame and optionally draw the result.

        Args:
            image: Frame in BGR channel order (it is converted to RGB before
                being handed to the model).
            draw: When true, draw each detected hand's landmarks and
                connections onto ``image`` in place.

        Returns:
            The same ``image`` object that was passed in.
        """
        # the model is fed RGB, while the frame arrives as BGR
        rgb_img = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)

        # keep the result so findPosition() can read it afterwards
        self.results = self.hands.process(rgb_img)

        if draw and self.results.multi_hand_landmarks:
            # draw_landmarks renders a whole hand, so call it once per hand
            # rather than once per landmark
            for hand_landmarks in self.results.multi_hand_landmarks:
                self.mp_draw.draw_landmarks(image, hand_landmarks, self.mp_hands.HAND_CONNECTIONS)
        return image

    def findPosition(self, image, handNo=0, draw=True):
        """Return pixel coordinates of one detected hand's landmarks.

        Uses the result stored by the last :meth:`findHands` call.

        Args:
            image: Frame whose ``shape`` supplies the height and width used
                to scale the normalised landmark coordinates; also the
                drawing target when ``draw`` is true.
            handNo: Index of the hand within the detection result.
            draw: When true, draw a filled circle on ``image`` at every
                landmark position.

        Returns:
            A list of ``[id, x, y]`` entries, one per landmark. The list is
            empty when no frame has been processed yet, no hand was detected,
            or ``handNo`` does not refer to a detected hand.
        """
        lm_list = []

        # nothing to report before the first findHands() call or when the
        # frame contains no hand
        if self.results is None or not self.results.multi_hand_landmarks:
            return lm_list

        try:
            my_hand = self.results.multi_hand_landmarks[handNo]
        except IndexError:
            # fewer hands in the frame than the requested index
            return lm_list

        # Only height and width are needed; slicing also accepts 2-D frames.
        h, w = image.shape[:2]

        for ID, lm in enumerate(my_hand.landmark):
            # scale the landmark's x/y by the frame size to get pixels
            cx = int(lm.x * w)
            cy = int(lm.y * h)
            lm_list.append([ID, cx, cy])
            if draw:
                cv2.circle(image, (cx, cy), 13, (255, 0, 255), cv2.FILLED)

        return lm_list

# vid.release()
# cv2.destroyAllWindows()


def main():
    """Run a live webcam demo of ``HandDetector``.

    Reads frames from capture device 0, runs hand detection on each one,
    prints landmark 4 of the first detected hand, overlays the measured
    frames-per-second value and shows the frame in a window. The loop ends
    when 'c' is pressed or when a frame can no longer be read. The capture
    device and the display windows are always released on exit.
    """
    landmark_id = 4  # index of the landmark that is printed each frame
    prev_time = 0
    vid = cv2.VideoCapture(0)
    detector = HandDetector()

    try:
        while True:
            ret, image = vid.read()
            if not ret:
                # no frame was grabbed; stop instead of passing an invalid
                # frame on to the detector
                break

            image = detector.findHands(image)
            lm_list = detector.findPosition(image)
            if len(lm_list) > landmark_id:
                print(lm_list[landmark_id])

            cur_time = time.time()
            elapsed = cur_time - prev_time
            # two reads of the clock can return the same value; avoid
            # dividing by zero in that case
            fps = 1 / elapsed if elapsed > 0 else 0
            prev_time = cur_time

            cv2.putText(image, str(int(fps)), (10, 70), cv2.FONT_HERSHEY_SIMPLEX, 1.0, (255, 255, 255), 2, cv2.LINE_AA)
            cv2.imshow('Hand Tracking', image)

            if cv2.waitKey(1) & 0xFF == ord('c'):
                break
    finally:
        # free the camera and close the window even if the loop raised
        vid.release()
        cv2.destroyAllWindows()

# Start the webcam demo only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()

[4, 376, 319]
[4, 389, 262]
[4, 395, 220]
[4, 389, 173]
[4, 388, 169]
[4, 387, 166]
[4, 384, 158]
[4, 382, 154]
[4, 382, 152]
[4, 379, 149]
[4, 375, 145]
[4, 316, 122]
[4, 298, 123]
[4, 304, 117]
[4, 332, 150]
[4, 332, 152]
[4, 333, 153]
[4, 336, 153]
[4, 337, 152]
[4, 337, 152]
[4, 338, 152]
[4, 338, 151]
[4, 338, 150]
[4, 339, 147]
[4, 342, 146]
[4, 339, 148]
[4, 331, 177]
[4, 331, 177]
[4, 327, 190]
[4, 325, 187]
[4, 322, 190]
[4, 323, 189]
[4, 321, 191]
[4, 324, 191]
[4, 330, 193]
[4, 354, 197]
[4, 370, 192]
[4, 377, 186]
[4, 379, 188]
[4, 380, 188]
[4, 380, 187]
[4, 380, 186]
[4, 378, 187]
[4, 376, 186]
[4, 382, 185]
[4, 387, 185]
[4, 396, 184]
[4, 409, 184]
[4, 423, 187]
[4, 423, 186]
[4, 447, 186]
[4, 458, 189]
[4, 472, 189]
[4, 488, 190]
[4, 504, 192]
[4, 518, 192]
[4, 531, 193]
[4, 546, 195]
[4, 556, 197]
[4, 557, 196]
[4, 568, 197]
[4, 579, 200]
[4, 586, 202]
[4, 597, 205]
[4, 604, 206]
[4, 613, 208]
[4, 615, 212]
[4, 619, 213]
[4, 622, 214]
[4, 629, 219]
[4, 629, 220]
[4, 64