In [1]:
# Mount Google Drive at /content/drive so the cells below can reach the project
# files under /content/drive/MyDrive/ (Colab-only: relies on google.colab).

from google.colab import drive
drive.mount('/content/drive')

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [2]:
# Install the project's EMG_gestures package from its Drive folder so the custom
# functions imported below (EMG_gestures.utils / EMG_gestures.analysis) are available.
# NOTE(review): in-tree builds are believed to be pip's default since pip 21.3, so
# --use-feature=in-tree-build may be redundant (or rejected) on newer pip -- confirm.
%pip install /content/drive/MyDrive/EMG_gestures/ --use-feature=in-tree-build

Processing ./drive/MyDrive/EMG_gestures
Building wheels for collected packages: EMG-gestures
  Building wheel for EMG-gestures (setup.py) ... [?25l[?25hdone
  Created wheel for EMG-gestures: filename=EMG_gestures-0.1.0-py3-none-any.whl size=47152 sha256=34ccc88e34cf0e28bd7e0eb8b1c20c599c86b82b086ddb287e6b7a13547e62da
  Stored in directory: /tmp/pip-ephem-wheel-cache-57vcie0k/wheels/a2/b7/61/2147fa082a9e51bef5dcc38dd3f0898fe0554d62203c0e383e
Successfully built EMG-gestures
Installing collected packages: EMG-gestures
  Attempting uninstall: EMG-gestures
    Found existing installation: EMG-gestures 0.1.0
    Uninstalling EMG-gestures-0.1.0:
      Successfully uninstalled EMG-gestures-0.1.0
Successfully installed EMG-gestures-0.1.0


In [3]:
#import necessary packages

#our workhorses
import numpy as np
import pandas as pd
import scipy

#to visualize
%matplotlib inline
import seaborn as sns
import matplotlib.pyplot as plt
#style params for figures
sns.set(font_scale = 2)
plt.style.use('seaborn-white')
plt.rc("axes", labelweight="bold")
from IPython.display import display, HTML

#to load files
import os
import sys
import h5py

#import custom functions
from EMG_gestures.utils import *
from EMG_gestures.analysis import within_subject_rnn_performance


In [4]:
#define where the data files are located
data_folder = '/content/drive/MyDrive/EMG_gestures/EMG_data/'
results_folder = '/content/drive/MyDrive/EMG_gestures/results_data/single_subject_training/RNN/'

nsubjects = 36 #subject folders are named 01..nsubjects inside data_folder


# User-defined parameters
lo_freq = 20 #lower bound of bandpass filter
hi_freq = 450 #upper bound of bandpass filter

win_size = 100 #define window size over which to compute time-domain features
step = win_size #keeping this parameter in case we want to re-run later with some overlap

nreps = 10 #number of times the true/permuted evaluation is repeated per subject
exclude = [0,7]#labels to exclude

#for RNN training
verbose = 0
epochs = 200
batch_size = 2
es_patience = 5
#number of permutations to use for training
n_shuffled_sets = 20
model_dict = {'fe_layers':1, 'fe_activation':'tanh'}
#performance metrics
score_list = ['f1','accuracy']


def _build_result_frames(train_scores, test_scores, train_info_dict, subject_id, rep, shuffled):
    """Package the scores of one training call as a Train and a Test DataFrame.

    Replaces four copy-pasted dictionary constructions; the column names and
    their order are unchanged.

    Parameters
    ----------
    train_scores, test_scores : 2-D arrays indexed as [split, score]; score
        columns are named after the entries of the cell-level ``score_list``.
    train_info_dict : mapping with 'train_loss', 'val_loss' and
        'epochs_trained' entries (assumed to hold one value per split --
        TODO confirm against within_subject_rnn_performance).
    subject_id : subject number stored in the 'Subject' column.
    rep : zero-based repetition index; stored one-based in the 'Rep' column.
    shuffled : True when the model was trained on permuted labels.

    Returns
    -------
    list
        ``[train_frame, test_frame]``, one row per split in each.

    Notes
    -----
    Reads ``epochs``, ``batch_size`` and ``score_list`` from the cell above.
    The training-info columns are the same in both frames because they come
    from the same training call.
    """
    #split/score counts are taken from the training scores, as before
    n_splits, n_scores = train_scores.shape
    frames = []
    for split_type, scores in (('Train', train_scores), ('Test', test_scores)):
        data_dict = {'Fold':np.arange(n_splits)+1,
                     'Rep':[rep+1]*n_splits,
                     'Type':[split_type]*n_splits,
                     'Shuffled':[shuffled]*n_splits,
                     'Subject':[subject_id]*n_splits,
                     'Epochs':[epochs]*n_splits,
                     'Batch_Size':[batch_size]*n_splits,
                     'Train_Loss':train_info_dict['train_loss'],
                     'Val_Loss':train_info_dict['val_loss'],
                     'Epochs_Trained':train_info_dict['epochs_trained'],
                     }
        for sidx in range(n_scores):
            data_dict['%s_score'%(score_list[sidx])] = scores[:,sidx]
        frames.append(pd.DataFrame(data_dict))
    return frames


#make sure the output folder exists before any training starts, so a missing
#directory cannot cost a full subject's worth of training at save time
os.makedirs(results_folder, exist_ok=True)

for subject_id in range(1,nsubjects+1):

    subject_folder = os.path.join(data_folder,'%02d'%(subject_id))
    print('=======================')
    print(subject_folder)

    # Process data and get features
    #get features across segments and corresponding info
    feature_matrix_sub, target_labels_sub, window_tstamps_sub, \
    block_labels_sub, series_labels_sub = get_subject_data_for_classification(subject_folder, lo_freq, hi_freq, \
                                                                    win_size, step)
    #re-seed NumPy's global RNG for every subject, for reproducibility
    #NOTE(review): this seeds NumPy only; if the RNN backend keeps its own RNG,
    #training may still vary between runs -- confirm
    np.random.seed(1)
    #per-subject list of frames; results_df itself is only ever a DataFrame, so
    #after an interrupted run it still holds the last completed subject
    subject_frames = []

    for rep in range(nreps):
        #--- labels as recorded ---
        print('Subject %d|Rep %d'%(subject_id, rep+1))
        print('True Data')
        train_scores, test_scores, train_info_dict = within_subject_rnn_performance(feature_matrix_sub, target_labels_sub, block_labels_sub,\
                                                                series_labels_sub, model_dict, exclude, score_list,\
                                                                n_shuffled_sets = n_shuffled_sets,\
                                                                verbose = verbose, epochs = epochs, batch_size = batch_size, es_patience = es_patience)
        subject_frames.extend(_build_result_frames(train_scores, test_scores, train_info_dict,
                                                   subject_id, rep, shuffled=False))

        #--- permuted labels: same pipeline, used as the control condition ---
        print('Subject %d|Rep %d'%(subject_id, rep+1))
        print('Permuted Data')
        target_labels_sub_perm = permute_class_within_sub(target_labels_sub, block_labels_sub, series_labels_sub, exclude)
        train_scores, test_scores, train_info_dict = within_subject_rnn_performance(feature_matrix_sub, target_labels_sub_perm, block_labels_sub,\
                                                                series_labels_sub, model_dict, exclude, score_list,\
                                                                n_shuffled_sets = n_shuffled_sets,\
                                                                verbose = verbose, epochs = epochs, batch_size = batch_size, es_patience = es_patience)
        subject_frames.extend(_build_result_frames(train_scores, test_scores, train_info_dict,
                                                   subject_id, rep, shuffled=True))

    #rows are ordered per rep: Train/Test on true labels, then Train/Test on permuted labels
    results_df = pd.concat(subject_frames, axis = 0)
    #save results to file (one HDF5 file per subject, overwritten on re-run)
    results_fn = 'subject_%02d_within_subject_results.h5'%(subject_id)
    results_df.to_hdf(os.path.join(results_folder,results_fn), key='results_df', mode='w')

        



[1;30;43mStreaming output truncated to the last 5000 lines.[0m
Epochs Trained: 33
Evaluate Model
Subject 12|Rep 3
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 6
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 7
Evaluate Model
Subject 12|Rep 4
True Data
Split Count: 1
Training Model
Epochs Trained: 22
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 23
Evaluate Model
Subject 12|Rep 4
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 7
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 6
Evaluate Model
Subject 12|Rep 5
True Data
Split Count: 1
Training Model
Epochs Trained: 30
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 36
Evaluate Model
Subject 12|Rep 5
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 6
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 6
Evaluate Model
Subject 12|Rep 6
True Data
Split Count: 1
Training Model
Epochs Trained: 23
Evaluate Model
Split Count: 2
Training Model

In [9]:
# Mean of every column for each (Type, Shuffled) combination.
# results_df is rebound for each subject inside the training loop, so this
# summarises only the subject whose frame it currently holds, not all subjects.
# Fold, Rep, Subject, Epochs and Batch_Size are averaged as well; those means
# are bookkeeping values, not performance metrics.
results_df.groupby(['Type','Shuffled']).mean()

Unnamed: 0_level_0,Unnamed: 1_level_0,Fold,Rep,Subject,Epochs,Batch_Size,Train_Loss,Val_Loss,Epochs_Trained,f1_score,accuracy_score
Type,Shuffled,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1
Test,False,1.5,5.5,11.0,200.0,2.0,0.069822,0.005311,101.9,0.994666,0.994673
Test,True,1.5,5.5,11.0,200.0,2.0,1.333502,0.646427,6.25,0.138239,0.16004
Train,False,1.5,5.5,11.0,200.0,2.0,0.069822,0.005311,101.9,1.0,1.0
Train,True,1.5,5.5,11.0,200.0,2.0,1.333502,0.646427,6.25,0.568712,0.621756


In [None]:
# ---- locations of the input recordings and of the saved results ----
data_folder = '/content/drive/MyDrive/EMG_gestures/EMG_data/'
results_folder = '/content/drive/MyDrive/EMG_gestures/results_data/single_subject_training/RNN/'

nsubjects = 36

# ---- user-defined parameters ----
lo_freq = 20   # lower bound of bandpass filter
hi_freq = 450  # upper bound of bandpass filter

win_size = 100   # window size over which time-domain features are computed
step = win_size  # kept separate so a later run can use overlapping windows

nreps = 10
exclude = [0, 7]  # labels to exclude

# ---- RNN training ----
verbose = 0
epochs = 100
batch_size = 2
es_patience = 5
n_shuffled_sets = 20  # number of permutations to use for training
model_dict = {'fe_layers': 1, 'fe_activation': 'tanh'}
score_list = ['f1', 'accuracy']  # performance metrics

# Permuted-label runs only: for every subject, train/evaluate nreps times on
# permuted labels and write one results file per subject.
# (To try a single subject, set subject_id by hand instead of looping.)
for subject_id in range(1, nsubjects + 1):

    subject_folder = os.path.join(data_folder, '%02d'%(subject_id))
    print('=======================')
    print(subject_folder)

    # features across segments plus the labels/bookkeeping that go with them
    (feature_matrix_sub, target_labels_sub, window_tstamps_sub,
     block_labels_sub, series_labels_sub) = get_subject_data_for_classification(
        subject_folder, lo_freq, hi_freq, win_size, step)

    np.random.seed(1)  # for reproducibility
    results_df = []    # collects one DataFrame per (rep, Train/Test)

    for rep in range(nreps):

        print('Subject %d|Rep %d'%(subject_id, rep+1))
        print('Permuted Data')
        target_labels_sub_perm = permute_class_within_sub(
            target_labels_sub, block_labels_sub, series_labels_sub, exclude)
        train_scores, test_scores, train_info_dict = within_subject_rnn_performance(
            feature_matrix_sub, target_labels_sub_perm, block_labels_sub,
            series_labels_sub, model_dict, exclude, score_list,
            n_shuffled_sets=n_shuffled_sets,
            verbose=verbose, epochs=epochs, batch_size=batch_size,
            es_patience=es_patience)
        n_splits, n_scores = train_scores.shape

        # one frame for the training scores, then one for the test scores;
        # both carry the same training-info columns from this call
        for split_type, split_scores in (('Train', train_scores), ('Test', test_scores)):
            data_dict = {
                'Fold': np.arange(n_splits) + 1,
                'Rep': [rep + 1] * n_splits,
                'Type': [split_type] * n_splits,
                'Shuffled': [True] * n_splits,
                'Subject': [subject_id] * n_splits,
                'Epochs': [epochs] * n_splits,
                'Batch_Size': [batch_size] * n_splits,
                'Train_Loss': train_info_dict['train_loss'],
                'Val_Loss': train_info_dict['val_loss'],
                'Epochs_Trained': train_info_dict['epochs_trained'],
            }
            for sidx in range(n_scores):
                data_dict['%s_score'%(score_list[sidx])] = split_scores[:, sidx]
            results_df.append(pd.DataFrame(data_dict))

    # stack this subject's frames and save them to file
    results_df = pd.concat(results_df, axis=0)
    results_fn = 'subject_%02d_within_subject_permuted_data_results.h5'%(subject_id)
    results_df.to_hdf(os.path.join(results_folder, results_fn), key='results_df', mode='w')

    



/content/drive/MyDrive/EMG_gestures/EMG_data/01
Subject 1|Rep 1
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 6
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 6
Evaluate Model
Subject 1|Rep 2
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 8
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 7
Evaluate Model
Subject 1|Rep 3
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 6
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 8
Evaluate Model
Subject 1|Rep 4
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 6
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 6
Evaluate Model
Subject 1|Rep 5
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 7
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 6
Evaluate Model
Subject 1|Rep 6
Permuted Data
Split Count: 1
Training Model
Epochs Trained: 6
Evaluate Model
Split Count: 2
Training Model
Epochs Trained: 6
Evaluate Model
Subject 1|Rep 7
