In [6]:
pip install --upgrade tensorflow numpy mediapipe

Collecting numpy
  Obtaining dependency information for numpy from https://files.pythonhosted.org/packages/93/fd/3f826c6d15d3bdcf65b8031e4835c52b7d9c45add25efa2314b53850e1a2/numpy-1.26.0-cp311-cp311-win_amd64.whl.metadata
  Using cached numpy-1.26.0-cp311-cp311-win_amd64.whl.metadata (61 kB)
Note: you may need to restart the kernel to use updated packages.


In [8]:
import cv2
import numpy as np
import os
from matplotlib import pyplot as plt
import time
import mediapipe as mp

In [11]:
# Short aliases for the MediaPipe sub-modules used by the helper functions below.
mp_holistic = mp.solutions.holistic # Holistic model
mp_drawing = mp.solutions.drawing_utils # Drawing utilities

In [12]:
def mediapipe_detection(image, model):
    """Run ``model`` on a BGR frame and return the frame together with the results.

    Args:
        image: Frame in BGR channel order (it is converted with
            ``cv2.COLOR_BGR2RGB`` before being handed to the model).
        model: Object exposing ``process(rgb_image)``.

    Returns:
        Tuple ``(bgr_image, results)``: the frame converted back to BGR and
        whatever ``model.process`` returned.
    """
    rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)   # the model is fed RGB data
    rgb.flags.writeable = False                    # lock the buffer while the model reads it
    results = model.process(rgb)
    rgb.flags.writeable = True                     # unlock it again before converting back
    return cv2.cvtColor(rgb, cv2.COLOR_RGB2BGR), results

In [13]:
def draw_landmarks(image, results):
    """Draw face, pose and both hand landmark groups on ``image`` with default styling.

    Args:
        image: Image handed to ``mp_drawing.draw_landmarks`` as the drawing target.
        results: Holistic results object providing ``face_landmarks``,
            ``pose_landmarks``, ``left_hand_landmarks`` and ``right_hand_landmarks``.
    """
    # (landmark list, connection set) pairs, drawn in this order.
    layers = (
        (results.face_landmarks, mp_holistic.FACEMESH_TESSELATION),    # face
        (results.pose_landmarks, mp_holistic.POSE_CONNECTIONS),        # pose
        (results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS),   # left hand
        (results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS),  # right hand
    )
    for landmark_list, connections in layers:
        mp_drawing.draw_landmarks(image, landmark_list, connections)

In [14]:
def draw_styled_landmarks(image, results):
    """Draw face, pose and hand landmarks on ``image`` using a distinct colour scheme per group.

    Args:
        image: Image handed to ``mp_drawing.draw_landmarks`` as the drawing
            target; the function returns nothing, so the annotation is
            visible only through this object.
        results: Holistic results object providing ``face_landmarks``,
            ``pose_landmarks``, ``left_hand_landmarks`` and ``right_hand_landmarks``.
    """
    spec = mp_drawing.DrawingSpec

    # One row per landmark group:
    # (landmark list, connection set, landmark style, connection style).
    layers = (
        # Face. The connection colour previously used 256 for one channel,
        # which is outside the 8-bit 0-255 range; 255 is the valid maximum.
        (results.face_landmarks, mp_holistic.FACEMESH_TESSELATION,
         spec(color=(80, 110, 10), thickness=1, circle_radius=1),
         spec(color=(80, 255, 121), thickness=1, circle_radius=1)),
        # Pose
        (results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
         spec(color=(80, 22, 10), thickness=2, circle_radius=4),
         spec(color=(80, 44, 121), thickness=2, circle_radius=2)),
        # Left hand
        (results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
         spec(color=(121, 22, 76), thickness=2, circle_radius=4),
         spec(color=(121, 44, 250), thickness=2, circle_radius=2)),
        # Right hand
        (results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
         spec(color=(245, 117, 66), thickness=2, circle_radius=4),
         spec(color=(245, 66, 230), thickness=2, circle_radius=2)),
    )

    for landmark_list, connections, landmark_style, connection_style in layers:
        mp_drawing.draw_landmarks(image, landmark_list, connections,
                                  landmark_style, connection_style)

In [15]:
def extract_keypoints(results):
    """Flatten the holistic landmarks in ``results`` into one 1-D feature vector.

    Layout of the returned array, in order:
        * pose:       33 landmarks x (x, y, z, visibility)
        * face:       468 landmarks x (x, y, z)
        * left hand:  21 landmarks x (x, y, z)
        * right hand: 21 landmarks x (x, y, z)

    A group whose landmarks are missing (falsy) contributes zeros of the
    size listed above.

    Args:
        results: Object providing ``pose_landmarks``, ``face_landmarks``,
            ``left_hand_landmarks`` and ``right_hand_landmarks``; each is
            either falsy or has a ``landmark`` iterable.

    Returns:
        The concatenation of the four flattened groups.
    """
    def _flatten(group, fields, expected_count):
        # Missing group -> zero block with the size a detected group would have.
        if not group:
            return np.zeros(expected_count * len(fields))
        rows = [[getattr(point, name) for name in fields] for point in group.landmark]
        return np.array(rows).flatten()

    xyz = ("x", "y", "z")
    parts = [
        _flatten(results.pose_landmarks, xyz + ("visibility",), 33),
        _flatten(results.face_landmarks, xyz, 468),
        _flatten(results.left_hand_landmarks, xyz, 21),
        _flatten(results.right_hand_landmarks, xyz, 21),
    ]
    # Alternative kept from the original as a comment: leave out the face
    # block and concatenate only pose, left hand and right hand.
    return np.concatenate(parts)

# Criando pasta para armazenar os dados

In [16]:
# For each action, create a folder containing one sub-folder per video index.
def criarPastas(actions, numeros_videos_por_action, data_path=None):
    """Create the ``<root>/<action>/<video index>`` directory tree.

    Args:
        actions: Iterable of action names; each gets its own folder.
        numeros_videos_por_action: Number of video sub-folders (named
            ``0 .. n-1``) created inside every action folder.
        data_path: Root directory of the tree. Defaults to the module-level
            ``DATA_PATH`` when omitted.

    Raises:
        OSError: If a directory cannot be created for a reason other than
            already existing (e.g. missing permissions). Existing
            directories are left untouched, so the call can be repeated.
    """
    root = DATA_PATH if data_path is None else data_path
    for action in actions:
        for index_video in range(numeros_videos_por_action):
            # exist_ok=True tolerates re-runs without hiding real failures,
            # which the previous bare ``except: pass`` silently discarded.
            os.makedirs(os.path.join(root, str(action), str(index_video)), exist_ok=True)

In [17]:
# Root folder for the exported data (numpy arrays)
DATA_PATH = 'MP_Data'

# Targets (signs) to be detected
actions = np.array([
    "Acontecer", "Aluno", "Amarelo", "America", "Aproveitar", "Bala",
    "Banco", "Banheiro", "Cinco", "Conhecer", "Espelho",
])

# Number of videos for each target
numeros_videos_por_action = 5

# Build the folder tree: one folder per target, one sub-folder per video index
criarPastas(actions, numeros_videos_por_action)


# Capturar vídeos

In [18]:
import cv2
import mediapipe as mp
import numpy as np

# Initialize MediaPipe (same aliases as the ones assigned near the top of the notebook)
mp_holistic = mp.solutions.holistic
mp_drawing = mp.solutions.drawing_utils

# Upper bound on the number of frames capturarVideos processes per video
max_frames_per_video = 100
# NOTE(review): desired_fps is not referenced by any code visible in this part of the notebook — confirm it is still needed
desired_fps = 30

In [22]:
def capturarVideos():
    """Extract holistic keypoints from every training video and save them frame by frame.

    For each action in ``actions`` (its name is printed first) and each video
    index in ``range(numeros_videos_por_action)``, this opens
    ``./treino/<action>/<index>.mp4``, runs MediaPipe Holistic on at most
    ``max_frames_per_video`` frames, shows the annotated frame in a window
    named 'Video' and saves the vector returned by ``extract_keypoints``
    with ``np.save`` under ``<DATA_PATH>/<action>/<index>/<frame number>``
    (frame numbers start at 1).

    Videos that yield fewer than ``max_frames_per_video`` frames are padded
    with all-zero vectors, so every opened video produces the same number of
    files. Videos that cannot be opened are reported and skipped. Pressing
    'q' in the preview window stops the current video (it is still padded)
    and skips the remaining videos of the current action.

    NOTE(review): a later cell defines ``capturarVideos`` again, without the
    action print-out and without the zero padding; once that cell runs it
    shadows this definition. Confirm which version is intended.
    """
    for action in actions:
        print(action)
        for index_video in range(numeros_videos_por_action):
            video_path = f'./treino/{action}/{index_video}.mp4'
            cap = cv2.VideoCapture(video_path)

            if not cap.isOpened():
                print(f"Erro ao abrir o vídeo {video_path}.")
                cap.release()
                continue

            output_dir = os.path.join(DATA_PATH, action, str(index_video))
            frame_count = 0
            stop_processing = False  # set when the user presses 'q'
            keypoints = None         # reset per video so padding never reuses stale data

            try:
                # The context manager closes the Holistic instance even if a
                # frame raises; a new instance is created for every video.
                with mp_holistic.Holistic() as holistic:
                    while frame_count < max_frames_per_video and not stop_processing:
                        ret, frame = cap.read()
                        if not ret:
                            break  # no more frames could be read

                        rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                        results = holistic.process(rgb_frame)

                        # Draw on a copy so the frame given to the model stays untouched.
                        annotated_frame = rgb_frame.copy()
                        draw_landmarks(annotated_frame, results)
                        cv2.imshow('Video', cv2.cvtColor(annotated_frame, cv2.COLOR_RGB2BGR))

                        frame_count += 1
                        keypoints = extract_keypoints(results)
                        np.save(os.path.join(output_dir, str(frame_count)), keypoints)

                        if cv2.waitKey(1) & 0xFF == ord('q'):
                            stop_processing = True

                # Pad short videos with zero vectors. When no frame was read
                # there is no vector to mirror, so fall back to the layout
                # extract_keypoints produces (pose 33*4, face 468*3, two
                # hands of 21*3 each); previously this case raised NameError
                # or silently reused the previous video's vector.
                if keypoints is None:
                    padding = np.zeros(33 * 4 + 468 * 3 + 21 * 3 + 21 * 3)
                else:
                    padding = np.zeros_like(keypoints)
                for frame_number in range(frame_count + 1, max_frames_per_video + 1):
                    np.save(os.path.join(output_dir, str(frame_number)), padding)
            finally:
                # Always free the capture handle and preview window.
                cap.release()
                cv2.destroyAllWindows()

            if stop_processing:
                break  # leave the video loop and move on to the next action

In [26]:
def capturarVideos():
    """Extract holistic keypoints from every training video and save them frame by frame.

    For each action in ``actions`` and each video index in
    ``range(numeros_videos_por_action)``, this opens
    ``./treino/<action>/<index>.mp4``, runs MediaPipe Holistic on at most
    ``max_frames_per_video`` frames, shows the annotated frame in a window
    named 'Video' and saves the vector returned by ``extract_keypoints``
    with ``np.save`` under ``<DATA_PATH>/<action>/<index>/<frame number>``
    (frame numbers start at 1).

    Videos that cannot be opened are reported and skipped. Pressing 'q' in
    the preview window stops the current video and skips the remaining
    videos of the current action.

    NOTE(review): this redefines the ``capturarVideos`` from the previous
    cell and shadows it. Unlike that version, it neither prints the action
    name nor pads short videos with zero vectors, so videos may produce
    fewer than ``max_frames_per_video`` files. Confirm which version is
    intended and remove the other.
    """
    for action in actions:
        for index_video in range(numeros_videos_por_action):
            video_path = f'./treino/{action}/{index_video}.mp4'
            cap = cv2.VideoCapture(video_path)

            if not cap.isOpened():
                print(f"Erro ao abrir o vídeo {video_path}.")
                cap.release()
                continue

            output_dir = os.path.join(DATA_PATH, action, str(index_video))
            frame_count = 0
            stop_processing = False  # set when the user presses 'q'

            try:
                # The context manager closes the Holistic instance even if a
                # frame raises; a new instance is created for every video.
                with mp_holistic.Holistic() as holistic:
                    while frame_count < max_frames_per_video and not stop_processing:
                        ret, frame = cap.read()
                        if not ret:
                            break  # no more frames could be read

                        rgb_frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
                        results = holistic.process(rgb_frame)

                        # Draw on a copy so the frame given to the model stays untouched.
                        annotated_frame = rgb_frame.copy()
                        draw_landmarks(annotated_frame, results)
                        cv2.imshow('Video', cv2.cvtColor(annotated_frame, cv2.COLOR_RGB2BGR))

                        frame_count += 1
                        keypoints = extract_keypoints(results)
                        np.save(os.path.join(output_dir, str(frame_count)), keypoints)

                        if cv2.waitKey(1) & 0xFF == ord('q'):
                            stop_processing = True
            finally:
                # Always free the capture handle and preview window.
                cap.release()
                cv2.destroyAllWindows()

            if stop_processing:
                break  # leave the video loop and move on to the next action

In [None]:
# Run the keypoint extraction over all configured actions and videos.
# NOTE(review): the recorded output below lists video indices up to 24, while the
# configuration cell sets numeros_videos_por_action = 5 — presumably the output
# comes from an earlier kernel state; re-run on a fresh kernel to confirm.
capturarVideos()

Acontecer
Erro ao abrir o vídeo ./treino/Acontecer/0.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/6.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/7.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/8.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/9.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/10.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/11.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/12.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/13.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/14.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/15.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/16.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/17.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/18.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/19.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/20.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/21.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/22.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/23.mp4.
Erro ao abrir o vídeo ./treino/Acontecer/24.mp4.
Erro ao abrir o