# Install and Import

In [1]:
!pip install mediapipe opencv-python pandas scikit-learn



You should consider upgrading via the 'e:\media_pipe_ml\venv\scripts\python.exe -m pip install --upgrade pip' command.


In [2]:
import numpy as np
import cv2  #opencv
import mediapipe as mp

In [3]:
mp_drawing = mp.solutions.drawing_utils  # drawing helpers
mp_holistic = mp.solutions.holistic  # detection tool  ## covers face, left hand, right hand and body pose

# Detection & Landmark Drawing

In [4]:
# Live preview: run MediaPipe Holistic on the default webcam and draw the
# detected face, hand and pose landmarks until 'q' is pressed.
cap = cv2.VideoCapture(0)  # default camera

# Older MediaPipe releases export FACE_CONNECTIONS; newer ones export
# FACEMESH_CONTOURS instead. Use whichever this installation provides.
face_connections = (getattr(mp_holistic, 'FACE_CONNECTIONS', None)
                    or mp_holistic.FACEMESH_CONTOURS)

try:
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
        while cap.isOpened():  # keep going while the camera is open
            ret, frame = cap.read()
            if not ret:
                # No frame was delivered; stop instead of handing None to cvtColor.
                break

            # OpenCV delivers BGR frames; the detector is fed RGB.
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Run detection; `results` carries every detected landmark set.
            results = holistic.process(image)

            # Make the frame writable again and convert back to BGR for drawing/display.
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Face landmarks (colour channels must stay within 0-255)
            mp_drawing.draw_landmarks(image, results.face_landmarks, face_connections,
                                      mp_drawing.DrawingSpec(color=(80, 110, 50), thickness=2, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80, 255, 121), thickness=2, circle_radius=1))

            # 2. Right-hand landmarks
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=2))

            # 3. Left-hand landmarks
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=2))

            # 4. Body-pose landmarks
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(245, 117, 66), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(245, 66, 230), thickness=2, circle_radius=2))

            cv2.imshow('Webcam', image)  # show the annotated frame

            # Quit when 'q' is pressed.
            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the window, even if the loop raised.
    cap.release()
    cv2.destroyAllWindows()

In [5]:
# Inspect the pose landmarks of the last frame processed by the webcam loop.
results.pose_landmarks

landmark {
  x: 0.43682972
  y: 0.55097556
  z: -2.0030084
  visibility: 0.99991983
}
landmark {
  x: 0.46994862
  y: 0.47047308
  z: -1.9190626
  visibility: 0.9998486
}
landmark {
  x: 0.4959982
  y: 0.46982518
  z: -1.9192078
  visibility: 0.9998401
}
landmark {
  x: 0.5184617
  y: 0.46937478
  z: -1.9193327
  visibility: 0.9998259
}
landmark {
  x: 0.39588073
  y: 0.4724785
  z: -1.919343
  visibility: 0.9998366
}
landmark {
  x: 0.36914793
  y: 0.47261193
  z: -1.9194758
  visibility: 0.9998337
}
landmark {
  x: 0.3435267
  y: 0.47255197
  z: -1.9192808
  visibility: 0.99984187
}
landmark {
  x: 0.5518226
  y: 0.49624258
  z: -1.2953064
  visibility: 0.9998221
}
landmark {
  x: 0.31136805
  y: 0.4997644
  z: -1.2892039
  visibility: 0.9998103
}
landmark {
  x: 0.48457608
  y: 0.6382698
  z: -1.7545841
  visibility: 0.9998975
}
landmark {
  x: 0.3884548
  y: 0.64096487
  z: -1.7524166
  visibility: 0.99990183
}
landmark {
  x: 0.6963558
  y: 0.8938364
  z: -0.812101
  visibility: 0

# 2. Capture Landmarks & Export to CSV
<img src='https://google.github.io/mediapipe/images/mobile/pose_tracking_full_body_landmarks.png' >

In [6]:
import csv
import os
import numpy as np

In [7]:
# coord = coordinate
# Number of landmarks stored per sample: pose landmarks + face landmarks.
# `results` only holds the last frame processed by the webcam loop, and a
# landmark list is None when that part was not detected in that frame, so fall
# back to fixed landmark counts instead of raising AttributeError.
POSE_LANDMARK_COUNT = 33   # MediaPipe Pose landmark count
FACE_LANDMARK_COUNT = 468  # MediaPipe Face Mesh landmark count (no refinement)


def _landmark_count(landmark_list, default):
    """Return len(landmark_list.landmark), or `default` when the list is None."""
    return default if landmark_list is None else len(landmark_list.landmark)


num_coords = (_landmark_count(results.pose_landmarks, POSE_LANDMARK_COUNT)
              + _landmark_count(results.face_landmarks, FACE_LANDMARK_COUNT))
num_coords

501

In [8]:
# Prepare the data layout for training: build the CSV header, i.e. the label
# column followed by x/y/z/v (visibility) column names for each of the
# num_coords landmarks, numbered from 1.
landmarks = ['class'] + [
    '{}{}'.format(axis, idx)
    for idx in range(1, num_coords + 1)
    for axis in 'xyzv'
]
landmarks

['class',
 'x1',
 'y1',
 'z1',
 'v1',
 'x2',
 'y2',
 'z2',
 'v2',
 'x3',
 'y3',
 'z3',
 'v3',
 'x4',
 'y4',
 'z4',
 'v4',
 'x5',
 'y5',
 'z5',
 'v5',
 'x6',
 'y6',
 'z6',
 'v6',
 'x7',
 'y7',
 'z7',
 'v7',
 'x8',
 'y8',
 'z8',
 'v8',
 'x9',
 'y9',
 'z9',
 'v9',
 'x10',
 'y10',
 'z10',
 'v10',
 'x11',
 'y11',
 'z11',
 'v11',
 'x12',
 'y12',
 'z12',
 'v12',
 'x13',
 'y13',
 'z13',
 'v13',
 'x14',
 'y14',
 'z14',
 'v14',
 'x15',
 'y15',
 'z15',
 'v15',
 'x16',
 'y16',
 'z16',
 'v16',
 'x17',
 'y17',
 'z17',
 'v17',
 'x18',
 'y18',
 'z18',
 'v18',
 'x19',
 'y19',
 'z19',
 'v19',
 'x20',
 'y20',
 'z20',
 'v20',
 'x21',
 'y21',
 'z21',
 'v21',
 'x22',
 'y22',
 'z22',
 'v22',
 'x23',
 'y23',
 'z23',
 'v23',
 'x24',
 'y24',
 'z24',
 'v24',
 'x25',
 'y25',
 'z25',
 'v25',
 'x26',
 'y26',
 'z26',
 'v26',
 'x27',
 'y27',
 'z27',
 'v27',
 'x28',
 'y28',
 'z28',
 'v28',
 'x29',
 'y29',
 'z29',
 'v29',
 'x30',
 'y30',
 'z30',
 'v30',
 'x31',
 'y31',
 'z31',
 'v31',
 'x32',
 'y32',
 'z32',
 'v32',
 '

In [9]:
# Create a new csv file named 'coords.csv' and write the header row into it.
# Mode 'w' truncates an existing file, so re-running this cell discards any
# samples already recorded. The csv.writer defaults (comma delimiter,
# double-quote quotechar, minimal quoting) are the settings used for the rows.
with open('coords.csv', mode='w', newline='') as csv_file:
    csv.writer(csv_file).writerow(landmarks)
    
    
    

In [14]:
# This walkthrough records three classes --> [Happy,Sad,Yeah!!!]
# Each class has to be captured once (one recording run per class)
# so that the program reads the landmarks and writes them to the csv
# NOTE(review): the recorded data shown further down uses the labels
# 'YA!!!!!!!!!', 'sad' and 'muscle' — the class list above looks outdated.

class_name = 'sad'
 

In [15]:
# Recording loop: run MediaPipe Holistic on the default webcam, draw the
# landmarks, and append one labelled row (class_name + pose + face landmarks)
# to coords.csv for every frame in which both pose and face were detected.
# Press 'q' to stop.
cap = cv2.VideoCapture(0)  # default camera

# Older MediaPipe releases export FACE_CONNECTIONS; newer ones export
# FACEMESH_CONTOURS instead. Use whichever this installation provides.
face_connections = (getattr(mp_holistic, 'FACE_CONNECTIONS', None)
                    or mp_holistic.FACEMESH_CONTOURS)

try:
    # Open the CSV once for the whole session instead of once per frame.
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic, \
            open('coords.csv', mode='a', newline='') as f:
        csv_writer = csv.writer(f, delimiter=',', quotechar='"', quoting=csv.QUOTE_MINIMAL)

        while cap.isOpened():  # keep going while the camera is open
            ret, frame = cap.read()
            if not ret:
                # No frame was delivered; stop instead of handing None to cvtColor.
                break

            # OpenCV delivers BGR frames; the detector is fed RGB.
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Run detection; `results` carries every detected landmark set.
            results = holistic.process(image)

            # Make the frame writable again and convert back to BGR for drawing/display.
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Face landmarks (colour channels must stay within 0-255)
            mp_drawing.draw_landmarks(image, results.face_landmarks, face_connections,
                                      mp_drawing.DrawingSpec(color=(80, 110, 50), thickness=2, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80, 255, 121), thickness=2, circle_radius=1))

            # 2. Right-hand landmarks
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=2))

            # 3. Left-hand landmarks
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=2))

            # 4. Body-pose landmarks
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(245, 117, 66), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(245, 66, 230), thickness=2, circle_radius=2))

            # Export coordinates. A row is written only when both pose and face
            # were detected; this explicit check replaces the former bare
            # `except: pass`, so genuine errors (e.g. a failed write) surface.
            if results.pose_landmarks is not None and results.face_landmarks is not None:
                # Row layout: label first, then x, y, z, visibility for every
                # pose landmark followed by every face landmark (flat list).
                row = [class_name]
                for landmark_list in (results.pose_landmarks, results.face_landmarks):
                    for landmark in landmark_list.landmark:
                        row.extend((landmark.x, landmark.y, landmark.z, landmark.visibility))
                csv_writer.writerow(row)

            cv2.imshow('Webcam', image)  # show the annotated frame

            # Quit when 'q' is pressed.
            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the window, even if the loop raised.
    cap.release()
    cv2.destroyAllWindows()

# 訓練模型 Train Model
## using Scikit Learn

##  1.分割資料

In [16]:
import pandas as pd
from sklearn.model_selection import train_test_split  
#分割訓練資料和測試資料
#用來判斷模型正確率

In [17]:
# Load every recorded sample (label column + landmark columns) from coords.csv.
train_data = pd.read_csv('coords.csv')
train_data

Unnamed: 0,class,x1,y1,z1,v1,x2,y2,z2,v2,x3,...,z499,v499,x500,y500,z500,v500,x501,y501,z501,v501
0,YA!!!!!!!!!,0.481813,0.435055,-1.248385,0.999972,0.507619,0.382357,-1.151800,0.999927,0.523704,...,-0.000408,0.0,0.528172,0.373698,0.018688,0.0,0.532397,0.369108,0.019277,0.0
1,YA!!!!!!!!!,0.482197,0.435647,-1.285806,0.999973,0.507889,0.382609,-1.190105,0.999929,0.523668,...,-0.000980,0.0,0.529386,0.374116,0.018620,0.0,0.533631,0.369841,0.019149,0.0
2,YA!!!!!!!!!,0.482323,0.435649,-1.294325,0.999974,0.507955,0.382375,-1.197827,0.999933,0.523591,...,-0.000769,0.0,0.529878,0.373594,0.018533,0.0,0.534111,0.369205,0.019059,0.0
3,YA!!!!!!!!!,0.482954,0.434791,-1.290047,0.999976,0.508101,0.381200,-1.193818,0.999937,0.523575,...,-0.001414,0.0,0.529240,0.374880,0.017639,0.0,0.533582,0.370540,0.018141,0.0
4,YA!!!!!!!!!,0.482985,0.434206,-1.306946,0.999977,0.508078,0.380597,-1.210468,0.999940,0.523327,...,-0.001335,0.0,0.528885,0.375427,0.017765,0.0,0.533241,0.371132,0.018235,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
376,sad,0.455059,0.630906,-1.853804,0.999832,0.489969,0.560557,-1.823537,0.999776,0.512362,...,-0.015006,0.0,0.516929,0.577725,0.003058,0.0,0.521510,0.569701,0.003504,0.0
377,sad,0.452463,0.652548,-2.151999,0.999835,0.485073,0.577570,-2.121454,0.999784,0.507086,...,-0.014382,0.0,0.514854,0.585377,0.004813,0.0,0.519252,0.577263,0.005258,0.0
378,sad,0.448316,0.679415,-2.173855,0.999839,0.479163,0.601709,-2.142796,0.999792,0.501291,...,-0.015745,0.0,0.514966,0.601031,0.004544,0.0,0.519709,0.591203,0.005228,0.0
379,sad,0.444029,0.715778,-2.485679,0.999855,0.473919,0.629846,-2.436769,0.999812,0.496611,...,-0.018390,0.0,0.513823,0.627394,0.002008,0.0,0.519048,0.617644,0.002383,0.0


In [18]:
# Features are every column except the label; the target is the 'class' column.
x = train_data.drop('class',axis=1)
y = train_data['class']    
# Hold out 30% of the rows for testing; the fixed seed makes the split repeatable.
# NOTE(review): one row is recorded per video frame, so neighbouring rows are
# near-duplicates. A random row-level split may put almost identical frames in
# both train and test and inflate accuracy — TODO confirm with a separately
# recorded session.
X_train ,X_test ,Y_train,Y_test = train_test_split(x,y,test_size = 0.3,random_state=1234)

## 2.訓練模型


In [19]:
#管線 --> 建構模型鏈
from sklearn.pipeline import make_pipeline 

#將資料常態分布化，平均值會變為0, 標準差變為1，使離群值影響降低
from sklearn.preprocessing import StandardScaler 

#線性分類
from sklearn.linear_model import LogisticRegression, RidgeClassifier

#集成學習
from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier

In [20]:
## Build the model pipelines
# Each candidate classifier is preceded by a StandardScaler. The tree ensembles
# are randomised, so they get a fixed seed (the same value used for the
# train/test split) to make training reproducible across kernel restarts.
RANDOM_STATE = 1234

pipelines = {
    'lr' : make_pipeline(StandardScaler(), LogisticRegression(max_iter=1000)),
    'rc' : make_pipeline(StandardScaler(), RidgeClassifier()),
    'rf' : make_pipeline(StandardScaler(), RandomForestClassifier(random_state=RANDOM_STATE)),
    'gb' : make_pipeline(StandardScaler(), GradientBoostingClassifier(random_state=RANDOM_STATE))
}

In [21]:
## Train the models
# Fit every pipeline on the training split and store it in the fit_models
# dict under its short name.
fit_models = {}

for algo, pipeline in pipelines.items():
    fit_models[algo] = pipeline.fit(X_train, Y_train)

# A warning may appear because the solver stopped at its iteration limit.
# Three ways to resolve it:
#   1. Raise the iteration limit (max_iter defaults to 100)
#      --> LogisticRegression() is created with max_iter=1000
#   2. Scale the data
#   3. Switch to a different solver
# (Kept as comments: a bare string literal at the end of the cell would be
# echoed as the cell's output.)

'\n解決方法三種：\n\n增加迭代總數（max_iter 參數預設為 100）\n-->將LogisticRegression() 參數max_iter設為1000\n\n縮放資料規模（scale）\n更換其他求解器（solver）\n\n'

In [22]:
# Predicted labels of the random-forest pipeline for the held-out test rows.
fit_models['rf'].predict(X_test)

array(['sad', 'sad', 'muscle', 'sad', 'muscle', 'muscle', 'muscle',
       'muscle', 'muscle', 'muscle', 'muscle', 'muscle', 'sad',
       'YA!!!!!!!!!', 'YA!!!!!!!!!', 'YA!!!!!!!!!', 'sad', 'sad', 'sad',
       'sad', 'muscle', 'muscle', 'YA!!!!!!!!!', 'muscle', 'sad',
       'muscle', 'YA!!!!!!!!!', 'muscle', 'muscle', 'muscle',
       'YA!!!!!!!!!', 'muscle', 'YA!!!!!!!!!', 'muscle', 'sad', 'muscle',
       'sad', 'sad', 'sad', 'YA!!!!!!!!!', 'muscle', 'YA!!!!!!!!!',
       'YA!!!!!!!!!', 'muscle', 'muscle', 'muscle', 'sad', 'sad', 'sad',
       'muscle', 'YA!!!!!!!!!', 'muscle', 'muscle', 'sad', 'muscle',
       'YA!!!!!!!!!', 'sad', 'YA!!!!!!!!!', 'muscle', 'sad',
       'YA!!!!!!!!!', 'muscle', 'sad', 'YA!!!!!!!!!', 'sad',
       'YA!!!!!!!!!', 'YA!!!!!!!!!', 'muscle', 'YA!!!!!!!!!',
       'YA!!!!!!!!!', 'sad', 'sad', 'muscle', 'sad', 'muscle', 'muscle',
       'muscle', 'sad', 'YA!!!!!!!!!', 'YA!!!!!!!!!', 'muscle', 'muscle',
       'sad', 'muscle', 'YA!!!!!!!!!', 'sad', 'muscl

# 評估、序列化模型
## Evaluate and Serialize Model

In [23]:
from sklearn.metrics import accuracy_score
import pickle


In [25]:
# Model accuracy: print each fitted model's accuracy on the held-out test split.

for name in fit_models:
    predictions = fit_models[name].predict(X_test)
    print(name, accuracy_score(Y_test, predictions))

lr 1.0
rc 1.0
rf 1.0
gb 1.0


In [26]:
# Serialize the fitted random-forest pipeline to body_language.pkl.
with open('body_language.pkl','wb') as f:
    pickle.dump(fit_models['rf'],f)

# 檢測

In [27]:
# Load the pickled pipeline back as `model` for live inference.
# NOTE: unpickling can execute arbitrary code, so only load a pickle file that
# this notebook wrote itself; never load one from an untrusted source.
with open('body_language.pkl','rb') as f:
    model = pickle.load(f)
    

In [31]:
# Live inference: run MediaPipe Holistic on the default webcam, classify each
# frame's pose + face landmarks with `model`, and overlay the predicted class
# and its probability on the video. Press 'q' to stop.
cap = cv2.VideoCapture(0)  # default camera

# Older MediaPipe releases export FACE_CONNECTIONS; newer ones export
# FACEMESH_CONTOURS instead. Use whichever this installation provides.
face_connections = (getattr(mp_holistic, 'FACE_CONNECTIONS', None)
                    or mp_holistic.FACEMESH_CONTOURS)

# Column names the model was fitted with, when the estimator exposes them;
# passing them avoids a feature-name mismatch warning at predict time.
# None (older scikit-learn) keeps pandas' default integer columns.
feature_names = getattr(model, 'feature_names_in_', None)

try:
    with mp_holistic.Holistic(min_detection_confidence=0.5, min_tracking_confidence=0.5) as holistic:
        while cap.isOpened():  # keep going while the camera is open
            ret, frame = cap.read()
            if not ret:
                # No frame was delivered; stop instead of handing None to cvtColor.
                break

            # OpenCV delivers BGR frames; the detector is fed RGB.
            image = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)
            image.flags.writeable = False

            # Run detection; `results` carries every detected landmark set.
            results = holistic.process(image)

            # Make the frame writable again and convert back to BGR for drawing/display.
            image.flags.writeable = True
            image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)

            # 1. Face landmarks (colour channels must stay within 0-255)
            mp_drawing.draw_landmarks(image, results.face_landmarks, face_connections,
                                      mp_drawing.DrawingSpec(color=(80, 110, 50), thickness=2, circle_radius=1),
                                      mp_drawing.DrawingSpec(color=(80, 255, 121), thickness=2, circle_radius=1))

            # 2. Right-hand landmarks
            mp_drawing.draw_landmarks(image, results.right_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=2))

            # 3. Left-hand landmarks
            mp_drawing.draw_landmarks(image, results.left_hand_landmarks, mp_holistic.HAND_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(80, 22, 10), thickness=2, circle_radius=2))

            # 4. Body-pose landmarks
            mp_drawing.draw_landmarks(image, results.pose_landmarks, mp_holistic.POSE_CONNECTIONS,
                                      mp_drawing.DrawingSpec(color=(245, 117, 66), thickness=2, circle_radius=4),
                                      mp_drawing.DrawingSpec(color=(245, 66, 230), thickness=2, circle_radius=2))

            # Classify only when both pose and face were detected. This explicit
            # check replaces the former bare `except: pass`, so genuine errors
            # (e.g. a feature-count mismatch) are no longer hidden.
            if results.pose_landmarks is not None and results.face_landmarks is not None:
                # Feature row in the training layout: x, y, z, visibility for
                # every pose landmark followed by every face landmark.
                row = []
                for landmark_list in (results.pose_landmarks, results.face_landmarks):
                    for landmark in landmark_list.landmark:
                        row.extend((landmark.x, landmark.y, landmark.z, landmark.visibility))

                X = pd.DataFrame([row], columns=feature_names)
                # Predicted label
                body_language_class = model.predict(X)[0]
                # Probability of each label
                body_language_prob = model.predict_proba(X)[0]
                print(body_language_class, body_language_prob)

                ##### Show the prediction on the frame #####
                # 1. Left-ear position, so the label is drawn next to the ear.
                #    Landmark coordinates are normalised, so scale them by the
                #    actual frame size rather than an assumed 640x480.
                frame_height, frame_width = image.shape[:2]
                left_ear = results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR]
                coords = (int(left_ear.x * frame_width), int(left_ear.y * frame_height))

                cv2.rectangle(image,
                              (coords[0], coords[1] + 5),
                              (coords[0] + len(body_language_class) * 20, coords[1] - 30),
                              (245, 117, 16), -1)
                cv2.putText(image, body_language_class, coords,
                            cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Status box in the top-left corner
                cv2.rectangle(image, (0, 0), (250, 60), (245, 117, 16), -1)

                # Display class
                cv2.putText(image, 'CLASS',
                            (95, 12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
                cv2.putText(image, body_language_class.split(' ')[0],
                            (90, 40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

                # Display probability of the most likely class
                cv2.putText(image, 'PROB',
                            (15, 12), cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 0, 0), 1, cv2.LINE_AA)
                cv2.putText(image, str(round(body_language_prob[np.argmax(body_language_prob)], 2)),
                            (10, 40), cv2.FONT_HERSHEY_SIMPLEX, 1, (255, 255, 255), 2, cv2.LINE_AA)

            cv2.imshow('Webcam', image)  # show the annotated frame

            # Quit when 'q' is pressed.
            if cv2.waitKey(10) & 0xFF == ord('q'):
                break
finally:
    # Always free the camera and close the window, even if the loop raised.
    cap.release()
    cv2.destroyAllWindows()

muscle [0.17 0.81 0.02]
muscle [0.15 0.83 0.02]
muscle [0.29 0.69 0.02]
muscle [0.29 0.69 0.02]
muscle [0.32 0.66 0.02]
muscle [0.27 0.71 0.02]
muscle [0.22 0.76 0.02]
muscle [0.17 0.81 0.02]
muscle [0.16 0.82 0.02]
muscle [0.08 0.9  0.02]
muscle [0.06 0.92 0.02]
muscle [0.06 0.92 0.02]
muscle [0.1  0.88 0.02]
muscle [0.12 0.86 0.02]
muscle [0.09 0.89 0.02]
muscle [0.1  0.88 0.02]
muscle [0.08 0.9  0.02]
muscle [0.11 0.87 0.02]
muscle [0.1  0.88 0.02]
muscle [0.14 0.84 0.02]
muscle [0.17 0.82 0.01]
muscle [0.18 0.8  0.02]
muscle [0.18 0.8  0.02]
muscle [0.18 0.8  0.02]
muscle [0.2  0.78 0.02]
muscle [0.16 0.83 0.01]
muscle [0.17 0.82 0.01]
muscle [0.17 0.82 0.01]
muscle [0.18 0.81 0.01]
muscle [0.08 0.9  0.02]
muscle [0.07 0.91 0.02]
muscle [0.1  0.88 0.02]
muscle [0.13 0.81 0.06]
muscle [0.17 0.77 0.06]
muscle [0.17 0.77 0.06]
muscle [0.1  0.84 0.06]
muscle [0.09 0.86 0.05]
muscle [0.13 0.82 0.05]
muscle [0.09 0.86 0.05]
muscle [0.1  0.85 0.05]
muscle [0.05 0.9  0.05]
muscle [0.05 0.9

In [32]:
# Left-ear position of the last processed frame: the landmark's x and y are
# multiplied by [640,480] and truncated to integers.
# NOTE(review): 640x480 is hard-coded; presumably the camera's frame size — confirm.
tuple(np.multiply(np.array((results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].x, 
results.pose_landmarks.landmark[mp_holistic.PoseLandmark.LEFT_EAR].y)), [640,480]).astype(int))

(331, 212)