# Running Injury Clinic PhD data

Reginaldo K Fukuchi, Jan 2023, reginaldo.fukuchi@ufabc.edu.br

This notebook imports a MAT file containing the static and dynamic data from the running trials that I collected at the RIC during my PhD in 2012.

In [1]:
# Prepare environment
import os
import scipy.io as spio
import numpy as np
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
%matplotlib notebook

In [2]:
# Relative path of the folder that holds the data files read below
pathname = r'../data'

## Import mat file data
### Helper functions to prepare data
Adapted from: https://stackoverflow.com/questions/7008608/scipy-io-loadmat-nested-structures-i-e-dictionaries

In [7]:
def loadmat(filename):
    '''
    Load a MAT file and return its contents as nested Python containers.

    This function should be called instead of direct spio.loadmat, which
    hands MATLAB structs back as mat_struct objects. Here every struct
    becomes a dictionary and every array found inside a struct becomes a
    (nested) list. Top-level cell/struct arrays that hold structs are
    converted to lists as well; any other top-level array is returned
    untouched as a numpy array.

    Parameters
    ----------
    filename : str
        Path of the MAT file, passed on to spio.loadmat.

    Returns
    -------
    dict
        The dictionary produced by spio.loadmat, with all mat_struct
        entries replaced by dictionaries/lists.
    '''
    def _holds_struct(ndarray):
        '''
        Tells whether an object array contains a mat_struct at any depth.
        Numeric arrays cannot hold structs, so they are ruled out at once.
        '''
        if ndarray.dtype != object:
            return False
        for item in ndarray.flat:
            if isinstance(item, spio.matlab.mat_struct):
                return True
            if isinstance(item, np.ndarray) and _holds_struct(item):
                return True
        return False

    def _check_keys(d):
        '''
        Checks if entries in dictionary are mat-objects. If yes todict is
        called to change them to nested dictionaries. Arrays that hold
        mat-objects (cell or struct arrays) are changed to lists so that no
        mat-object is left behind at the top level.
        '''
        for key in d:
            if isinstance(d[key], spio.matlab.mat_struct):
                d[key] = _todict(d[key])
            elif isinstance(d[key], np.ndarray) and _holds_struct(d[key]):
                d[key] = _tolist(d[key])
        return d

    def _todict(matobj):
        '''
        A recursive function which constructs nested dictionaries from
        matobjects. Array fields are turned into lists by tolist.
        '''
        d = {}
        for strg in matobj._fieldnames:
            elem = matobj.__dict__[strg]
            if isinstance(elem, spio.matlab.mat_struct):
                d[strg] = _todict(elem)
            elif isinstance(elem, np.ndarray):
                d[strg] = _tolist(elem)
            else:
                d[strg] = elem
        return d

    def _tolist(ndarray):
        '''
        A recursive function which constructs lists from cellarrays
        (which are loaded as numpy ndarrays), recursing into the elements
        if they contain matobjects. Multi-dimensional arrays come out as
        lists of lists.
        '''
        elem_list = []
        for sub_elem in ndarray:
            if isinstance(sub_elem, spio.matlab.mat_struct):
                elem_list.append(_todict(sub_elem))
            elif isinstance(sub_elem, np.ndarray):
                elem_list.append(_tolist(sub_elem))
            else:
                elem_list.append(sub_elem)
        return elem_list

    # struct_as_record=False yields mat_struct objects (handled above);
    # squeeze_me=True drops the singleton dimensions MATLAB adds everywhere.
    data = spio.loadmat(filename, struct_as_record=False, squeeze_me=True)
    return _check_keys(data)

### Import mat file data

In [8]:
# MAT file to read, located in the data folder
fname    = os.path.join(pathname, '20120821T104617.mat') 
# Parse it with the loadmat helper so nested MATLAB structs come back as dicts
data = loadmat(fname)

### Create pandas DataFrame from dictionary

In [34]:
# Marker labels of the static trial, in the order they are stored
mkr_S_labels = list(data['out']['full_static'])

In [44]:
# Build the static-trial array with one row per frame and three consecutive
# columns (X, Y, Z) per marker, following the order of mkr_S_labels. The number
# of frames comes from the data itself instead of being fixed at 200, so files
# with a different trial length load without a shape error.
mkr_S_data = np.hstack([np.asarray(data['out']['full_static'][marker], dtype=float)
                        for marker in mkr_S_labels])

In [48]:
# Coordinate label of every data column: X, Y, Z repeated once per marker
direction = list('XYZ') * len(mkr_S_labels)

In [49]:
    # NOTE(review): this is an indented fragment of a larger function; `df`,
    # `df_multi` and `xyz` are defined outside the visible code -- confirm.
    if df_multi:  # dataframe with multiple labels
        # Drop the frame counter and index the rows by time
        df.drop(labels='Frame#', axis=1, inplace=True)
        df.set_index('Time', inplace=True)
        df.index.name = 'Time'
        # Swap dots for underscores as plain text (regex=False keeps '.' from
        # ever being read as the "any character" pattern, whatever the pandas
        # default is), then drop the last character of each column label.
        cols = [s[:-1] for s in df.columns.str.replace(r'.', r'_', regex=False)]
        # Three-level column index: marker label, X/Y/Z letter, and `xyz`
        df.columns = [cols, list('XYZ')*int(df.shape[1]/3), xyz]
        df.columns.set_names(names=['Marker', 'Coordinate', 'XYZ'],
                             level=[0, 1, 2], inplace=True)

183

In [50]:
# Sanity check of the array size: rows x columns (three columns per marker)
mkr_S_data.shape

(200, 183)

In [31]:
# Table with one column per marker; every cell keeps that row's [x, y, z] list
df_s = pd.DataFrame(data['out']['full_static'])
# Preview the first rows
df_s.head()

Unnamed: 0,RIC,LIC,RASI,LASI,RPSI,LPSI,VSAC,RGTR,RTTL,RTTM,...,MAI,IJ,RA,RELB,RW,LA,LELB,LW,RBAK,RARM
0,"[690.303, -24.144964, 1186.502]","[358.82016, -45.394676, 1193.25]","[651.3727, 58.36694, 1110.8032]","[382.158, 48.91054, 1115.131]","[572.2703, -130.8362, 1147.7698]","[494.23367, -131.95474, 1154.3748]","[524.8812, -153.71997, 1100.819]","[712.0781, -29.690912, 994.40625]","[705.3605, -34.873222, 764.90765]","[654.45135, -76.3512, 754.5543]",...,"[522.44165, -171.05545, 1382.6163]","[521.7265, 42.657265, 1535.5942]","[717.5611, -85.00025, 1559.632]","[910.7251, -79.293625, 1280.2725]","[865.3957, 182.5797, 1322.3882]","[345.49744, -99.965614, 1571.3601]","[136.04614, -59.753326, 1292.336]","[145.00455, 217.81528, 1287.8462]","[651.6967, -161.04485, 1530.5139]","[813.9317, -37.80553, 1399.3903]"
1,"[690.3032, -24.149342, 1186.498]","[358.8694, -45.3493, 1193.2429]","[651.4329, 58.410744, 1110.8114]","[382.10538, 48.848274, 1115.1531]","[572.25543, -130.84793, 1147.7628]","[494.22153, -131.93053, 1154.3461]","[524.86206, -153.71922, 1100.798]","[712.1179, -29.707058, 994.40027]","[705.3727, -34.863182, 764.91595]","[654.43805, -76.34176, 754.53723]",...,"[522.4347, -171.03117, 1382.6244]","[521.8142, 42.689983, 1535.6272]","[717.5314, -84.93972, 1559.6387]","[910.72437, -79.29521, 1280.2563]","[865.3111, 182.62885, 1322.4008]","[345.49744, -99.965614, 1571.3601]","[136.03296, -59.752625, 1292.3809]","[144.96864, 217.84282, 1287.7993]","[651.6928, -160.97816, 1530.5469]","[813.94604, -37.799965, 1399.3844]"
2,"[690.30334, -24.149654, 1186.4978]","[358.77875, -45.391197, 1193.2559]","[651.41583, 58.387333, 1110.798]","[382.088, 48.830948, 1115.152]","[572.2519, -130.84161, 1147.7474]","[494.22818, -131.92348, 1154.3685]","[524.8558, -153.7159, 1100.8489]","[712.07684, -29.686523, 994.38983]","[705.36194, -34.872658, 764.9084]","[654.4372, -76.34137, 754.5367]",...,"[522.4444, -171.05562, 1382.6584]","[521.8185, 42.703773, 1535.5785]","[717.56866, -84.98046, 1559.6777]","[910.76373, -79.24408, 1280.2782]","[865.30853, 182.63152, 1322.4338]","[345.49744, -99.965614, 1571.3601]","[135.97481, -59.690987, 1292.3872]","[144.96014, 217.84444, 1287.8359]","[651.6934, -161.02051, 1530.5673]","[813.94824, -37.797764, 1399.3878]"
3,"[690.3731, -24.186714, 1186.4689]","[358.83917, -45.360054, 1193.2523]","[651.4025, 58.374546, 1110.7954]","[382.09662, 48.84198, 1115.1544]","[572.2523, -130.84087, 1147.7468]","[494.22968, -131.9238, 1154.3702]","[524.87933, -153.71962, 1100.8209]","[712.0302, -29.661835, 994.37476]","[705.32715, -34.838192, 764.8942]","[654.4447, -76.346664, 754.5351]",...,"[522.3926, -171.0053, 1382.6237]","[521.74164, 42.666523, 1535.6366]","[717.5749, -85.003456, 1559.6595]","[910.7852, -79.24269, 1280.2686]","[865.2585, 182.6789, 1322.4326]","[345.49744, -99.965614, 1571.3601]","[136.00629, -59.67788, 1292.364]","[145.00027, 217.88835, 1287.8676]","[651.7441, -160.98076, 1530.5286]","[813.9141, -37.733063, 1399.3605]"
4,"[690.34424, -24.152397, 1186.4698]","[358.84586, -45.32006, 1193.2183]","[651.38763, 58.393387, 1110.8086]","[382.1403, 48.893497, 1115.1293]","[572.25653, -130.84499, 1147.7278]","[494.2428, -131.91296, 1154.3756]","[524.8999, -153.68208, 1100.7881]","[712.0312, -29.672976, 994.3855]","[705.38226, -34.86162, 764.909]","[654.42255, -76.32516, 754.53143]",...,"[522.3879, -171.00252, 1382.6223]","[521.7825, 42.65298, 1535.606]","[717.57434, -84.96423, 1559.6986]","[910.74524, -79.2099, 1280.3094]","[865.30707, 182.71387, 1322.43]","[345.59042, -99.86807, 1571.3287]","[136.02382, -59.6663, 1292.3708]","[144.96443, 217.89464, 1287.8561]","[651.74884, -160.95631, 1530.5133]","[813.9044, -37.73279, 1399.4192]"


In [30]:
# Display the static-trial marker dictionary: marker label -> list of [x, y, z] rows
data['out']['full_static']

{'RIC': [[690.303, -24.144964, 1186.502],
  [690.3032, -24.149342, 1186.498],
  [690.30334, -24.149654, 1186.4978],
  [690.3731, -24.186714, 1186.4689],
  [690.34424, -24.152397, 1186.4698],
  [690.34, -24.088327, 1186.4729],
  [690.30975, -24.072437, 1186.4886],
  [690.2586, -24.063133, 1186.4884],
  [690.3269, -24.080727, 1186.474],
  [690.2595, -24.081783, 1186.4774],
  [690.1976, -24.008486, 1186.488],
  [690.18555, -23.999575, 1186.4863],
  [690.27405, -24.062126, 1186.4766],
  [690.283, -24.013586, 1186.491],
  [690.21045, -23.944777, 1186.4408],
  [690.1476, -23.897049, 1186.4249],
  [690.1409, -23.893291, 1186.4258],
  [690.1769, -23.904472, 1186.4208],
  [690.19775, -23.850851, 1186.4181],
  [690.1404, -23.784199, 1186.4703],
  [690.0823, -23.763117, 1186.4349],
  [690.1544, -23.812277, 1186.4395],
  [690.1802, -23.827532, 1186.4402],
  [690.1888, -23.766487, 1186.4446],
  [690.11884, -23.710304, 1186.4442],
  [690.0042, -23.616055, 1186.461],
  [690.084, -23.67468, 1186.4491]

In [23]:
# List the fields available in the 'out' structure
print(data['out'].keys())

dict_keys(['study_description', 'session_description', 'datestring', 'subject_type', 'IDnumber', 'demo', 'staticfilepath', 'walkfilepath', 'runfilepath', 'speed_w', 'dv_w', 'neutral', 'joints', 'full_static', 'full_walk', 'walking', 'hz_w', 'speed_r', 'dv_r', 'full_run', 'running', 'hz_r', 'location', 'strengthdata', 'flexdata', 'aligndata', 'endurancedata', 'rawneutral', 'Inj'])


In [21]:
# Entries stored under the 'neutral' field
# NOTE(review): the recorded output (30) is a count rather than a keys view, so
# this cell was presumably last run wrapped in len(...) -- confirm.
data['out']['neutral'].keys()

30

In [22]:
# Marker labels stored under the 'full_static' field
# NOTE(review): the recorded output (61) is a count rather than a keys view, so
# this cell was presumably last run wrapped in len(...) -- confirm.
data['out']['full_static'].keys()

61

In [None]:
# NOTE(review): the loadmat() helper returns 'out' as a dict keyed by field
# name, so positional indexing with [0] raises KeyError. This looks like a
# leftover from reading the file with plain spio.loadmat -- confirm, then
# remove or update.
data['out'][0][0]

In [None]:
# Show the header entry of the loaded MAT file
data['__header__']

### Data stored in RBA directory

In [None]:
# Read the RBDS_google_forms.csv table from the data folder, using its 'ID'
# column as the row index, and preview the first rows
fname_q = os.path.join(pathname, 'RBDS_google_forms.csv')
data_q = pd.read_csv(fname_q, index_col='ID')
data_q.head()

In [None]:
# Keep only the height ('Altura (cm)') and mass ('Massa (kg)') columns
df_rba = data_q[['Altura (cm)','Massa (kg)']]
df_rba

In [None]:
# Subject, height and mass columns of the `info` table
# NOTE(review): `info` is not defined in the visible cells -- presumably the
# Figshare RBDSinfo.txt table; confirm it is loaded before this cell runs.
df_figshare = info[['Subject','Height','Mass']]
# Display only: the result is not assigned, so df_figshare keeps 'Subject' as a
# regular column
df_figshare.set_index('Subject')

In [None]:
# Trial run on a single case: rows of df_rba whose height equals the height at
# position 5 of df_figshare, then the IDs (index values) of those rows
df_out = df_rba.loc[df_rba['Altura (cm)']==df_figshare['Height'].values[5]]
df_out.index.tolist()

In [None]:
# For every df_figshare subject, collect the df_rba IDs whose height and mass
# both match exactly; subjects without any match are reported and skipped.
ids = []
figshare_rows = zip(df_figshare['Subject'].values,
                    df_figshare['Height'].values,
                    df_figshare['Mass'].values)
for subject, height, mass in figshare_rows:
    same_height = df_rba['Altura (cm)'] == height
    same_mass = df_rba['Massa (kg)'] == mass
    df_out = df_rba.loc[same_height & same_mass]
    if not df_out.empty:
        ids.append(df_out.index.tolist())
    else:
        print('Subject '+ str(subject) + ' not found!')

In [None]:
# Show the matched IDs: one list per subject for which a match was found
ids

# PENDING
* Find who is who: match each subject in the Figshare RBDSinfo.txt file to the corresponding ID in the RBA spreadsheet.