## Digital

This python notebook contains the digital software project, which has an ML model that recognizes the numbers your hands are holding up in real time

In [1]:
import cv2 as cv
import numpy as np
import time
import mediapipe as mp
from mediapipe.tasks import python
from mediapipe.tasks.python import vision
from mediapipe.tasks.python.vision import HandLandmarkerResult

mp_drawing = vision.drawing_utils
mp_hands = vision.HandLandmarksConnections
BaseOptions = mp.tasks.BaseOptions
HandLandmarker = mp.tasks.vision.HandLandmarker
HandLandmarkerOptions = mp.tasks.vision.HandLandmarkerOptions
VisionRunningMode = mp.tasks.vision.RunningMode

In [2]:
detection_res = None

In [3]:
# Supporting functions

def print_result(result: HandLandmarkerResult, output_image: mp.Image, timestamp_ms: int):
    global detection_res
    detection_res = result

    if result.hand_landmarks:
        print('Hands found!: ', result)


In [4]:
base_opt = python.BaseOptions(model_asset_path='models/hand_landmarker.task')
options = vision.HandLandmarkerOptions(base_options=base_opt, num_hands=2, running_mode=mp.tasks.vision.RunningMode.LIVE_STREAM, result_callback=print_result)

In [6]:
with HandLandmarker.create_from_options(options) as detector:
    cap = cv.VideoCapture(0)
    start_time = time.time()

    while cap.isOpened():
        success, frame = cap.read()
        frame = cv.flip(frame, 1)

        if not success:
            print("Can't receive frame :( exiting...")
            break

        timestamp_ms = int((time.time() - start_time)* 1000)

        frame_rgb = cv.cvtColor(frame, cv.COLOR_BGR2RGB)
        mp_image = mp.Image(image_format=mp.ImageFormat.SRGB, data=frame_rgb)
        
        detector.detect_async(mp_image, timestamp_ms) 

        if detection_res and detection_res.hand_landmarks:
            for hand_landmarks in detection_res.hand_landmarks:
                mp_drawing.draw_landmarks(
                    frame,
                    hand_landmarks,
                    mp_hands.HAND_CONNECTIONS,
                    mp_drawing.DrawingSpec(color=(0,255,0), thickness=6, circle_radius=4),
                    mp_drawing.DrawingSpec(thickness=2, circle_radius=2),
                )

        cv.imshow('frame',frame)

        if cv.waitKey(1) == ord('q'):
            break

cap.release()
cv.destroyAllWindows()

I0000 00:00:1770617675.834657 11437279 gl_context.cc:407] GL version: 2.1 (2.1 Metal - 90.5), renderer: Apple M4 Pro
W0000 00:00:1770617675.840696 11437286 inference_feedback_manager.cc:121] Feedback manager requires a model with a single signature inference. Disabling support for feedback tensors.
W0000 00:00:1770617675.849404 11437291 inference_feedback_manager.cc:121] Feedback manager requires a model with a single signature inference. Disabling support for feedback tensors.


Hands found!:  HandLandmarkerResult(handedness=[[Category(index=0, score=0.9888301491737366, display_name='Right', category_name='Right')]], hand_landmarks=[[NormalizedLandmark(x=0.1193666011095047, y=0.9225441813468933, z=2.824217517627403e-07, visibility=None, presence=None, name=None), NormalizedLandmark(x=0.20801648497581482, y=0.9328297972679138, z=-0.013832202181220055, visibility=None, presence=None, name=None), NormalizedLandmark(x=0.2756817638874054, y=0.9428302645683289, z=-0.03819844126701355, visibility=None, presence=None, name=None), NormalizedLandmark(x=0.32186564803123474, y=0.9486649036407471, z=-0.06350305676460266, visibility=None, presence=None, name=None), NormalizedLandmark(x=0.3517228662967682, y=0.9258574843406677, z=-0.08862517774105072, visibility=None, presence=None, name=None), NormalizedLandmark(x=0.28228074312210083, y=0.8118768930435181, z=-0.06424436718225479, visibility=None, presence=None, name=None), NormalizedLandmark(x=0.3223402798175812, y=0.972004