## Deep Learning for Human Activity Recognition - Basic Data Analysis

In [2]:
# Suppress warnings 
import warnings
warnings.filterwarnings("ignore", category=DeprecationWarning)
warnings.filterwarnings("ignore", category=UserWarning)
warnings.filterwarnings("ignore", category=FutureWarning)

### 1. Imports

In [3]:
import numpy as np
import pandas as pd
# Widen NumPy's printed line width and let pandas show up to 100 rows,
# 100 columns and 100 characters per cell before truncating the display.
np.set_printoptions(linewidth=200)
pd.set_option("display.max_columns", 100)
pd.set_option("display.max_rows", 100)
pd.set_option("display.max_colwidth", 100)

# matplotlib and seaborn for plotting
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline
# Apply seaborn's theme with the "darkgrid" axes style to the figures drawn below.
sns.set(style="darkgrid")

# import other libraries
import os, pickle, json
from collections import Counter 
from operator import itemgetter

### 2. Read in Data

In [4]:
# Dataset location (relative to the notebook) and a quick look at what it
# contains: the top-level folder, then the Train and Test sub-folders.
root = '../data/hapt_data_set/'
for folder in (root, root + 'Train', root + 'Test'):
    print(os.listdir(folder))

['Test', 'features.txt', 'activity_labels.txt', 'features_info.txt', 'Train', 'README.txt', 'RawData']
['X_train.txt', 'subject_id_train.txt', 'y_train.txt']
['X_test.txt', 'y_test.txt', 'subject_id_test.txt']


In [5]:
# Feature names from features.txt, flattened to a 1-D array with trailing
# whitespace stripped from every name.
features = np.array([
    name.rstrip()
    for name in pd.read_table(root + 'features.txt', header=None).values.flatten()
])

In [6]:
%%time
# Every file is space-separated and has no header row.
read_opts = dict(sep=' ', header=None)

# Training split: feature matrix (columns named after `features`), labels, subject ids.
X_train = pd.read_table(root + 'Train/X_train.txt', names=features, **read_opts)
y_train = pd.read_table(root + 'Train/y_train.txt', **read_opts)
subject_id_train = pd.read_table(root + 'Train/subject_id_train.txt', **read_opts)

# Test split, loaded the same way.
X_test = pd.read_table(root + 'Test/X_test.txt', names=features, **read_opts)
y_test = pd.read_table(root + 'Test/y_test.txt', **read_opts)
subject_id_test = pd.read_table(root + 'Test/subject_id_test.txt', **read_opts)

CPU times: user 1.37 s, sys: 138 ms, total: 1.51 s
Wall time: 1.73 s


### 3. Glimpse of Data


In [7]:
# Shape of the training features, then the per-column dtypes laid out as a
# single row, then the first three samples.
print('Size of train data', X_train.shape)
display(
    X_train.dtypes.to_frame(name='dtype').T,
    X_train.head(3),
)

Size of train data (7767, 561)


Unnamed: 0,tBodyAcc-Mean-1,tBodyAcc-Mean-2,tBodyAcc-Mean-3,tBodyAcc-STD-1,tBodyAcc-STD-2,tBodyAcc-STD-3,tBodyAcc-Mad-1,tBodyAcc-Mad-2,tBodyAcc-Mad-3,tBodyAcc-Max-1,tBodyAcc-Max-2,tBodyAcc-Max-3,tBodyAcc-Min-1,tBodyAcc-Min-2,tBodyAcc-Min-3,tBodyAcc-SMA-1,tBodyAcc-Energy-1,tBodyAcc-Energy-2,tBodyAcc-Energy-3,tBodyAcc-IQR-1,tBodyAcc-IQR-2,tBodyAcc-IQR-3,tBodyAcc-ropy-1,tBodyAcc-ropy-2,tBodyAcc-ropy-3,tBodyAcc-ARCoeff-1,tBodyAcc-ARCoeff-2,tBodyAcc-ARCoeff-3,tBodyAcc-ARCoeff-4,tBodyAcc-ARCoeff-5,tBodyAcc-ARCoeff-6,tBodyAcc-ARCoeff-7,tBodyAcc-ARCoeff-8,tBodyAcc-ARCoeff-9,tBodyAcc-ARCoeff-10,tBodyAcc-ARCoeff-11,tBodyAcc-ARCoeff-12,tBodyAcc-Correlation-1,tBodyAcc-Correlation-2,tBodyAcc-Correlation-3,tGravityAcc-Mean-1,tGravityAcc-Mean-2,tGravityAcc-Mean-3,tGravityAcc-STD-1,tGravityAcc-STD-2,tGravityAcc-STD-3,tGravityAcc-Mad-1,tGravityAcc-Mad-2,tGravityAcc-Mad-3,tGravityAcc-Max-1,...,fBodyAccMag-MaxInds-1,fBodyAccMag-MeanFreq-1,fBodyAccMag-Skewness-1,fBodyAccMag-Kurtosis-1,fBodyAccJerkMag-Mean-1,fBodyAccJerkMag-STD-1,fBodyAccJerkMag-Mad-1,fBodyAccJerkMag-Max-1,fBodyAccJerkMag-Min-1,fBodyAccJerkMag-SMA-1,fBodyAccJerkMag-Energy-1,fBodyAccJerkMag-IQR-1,fBodyAccJerkMag-ropy-1,fBodyAccJerkMag-MaxInds-1,fBodyAccJerkMag-MeanFreq-1,fBodyAccJerkMag-Skewness-1,fBodyAccJerkMag-Kurtosis-1,fBodyGyroMag-Mean-1,fBodyGyroMag-STD-1,fBodyGyroMag-Mad-1,fBodyGyroMag-Max-1,fBodyGyroMag-Min-1,fBodyGyroMag-SMA-1,fBodyGyroMag-Energy-1,fBodyGyroMag-IQR-1,fBodyGyroMag-ropy-1,fBodyGyroMag-MaxInds-1,fBodyGyroMag-MeanFreq-1,fBodyGyroMag-Skewness-1,fBodyGyroMag-Kurtosis-1,fBodyGyroJerkMag-Mean-1,fBodyGyroJerkMag-STD-1,fBodyGyroJerkMag-Mad-1,fBodyGyroJerkMag-Max-1,fBodyGyroJerkMag-Min-1,fBodyGyroJerkMag-SMA-1,fBodyGyroJerkMag-Energy-1,fBodyGyroJerkMag-IQR-1,fBodyGyroJerkMag-ropy-1,fBodyGyroJerkMag-MaxInds-1,fBodyGyroJerkMag-MeanFreq-1,fBodyGyroJerkMag-Skewness-1,fBodyGyroJerkMag-Kurtosis-1,tBodyAcc-AngleWRTGravity-1,tBodyAccJerk-AngleWRTGravity-1,tBodyGyro-AngleWRTGravity-1,tBodyGyroJerk-AngleWRTGravity-1
,tXAxisAcc-AngleWRTGravity-1,tYAxisAcc-AngleWRTGravity-1,tZAxisAcc-AngleWRTGravity-1
dtype,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,...,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64


Unnamed: 0,tBodyAcc-Mean-1,tBodyAcc-Mean-2,tBodyAcc-Mean-3,tBodyAcc-STD-1,tBodyAcc-STD-2,tBodyAcc-STD-3,tBodyAcc-Mad-1,tBodyAcc-Mad-2,tBodyAcc-Mad-3,tBodyAcc-Max-1,tBodyAcc-Max-2,tBodyAcc-Max-3,tBodyAcc-Min-1,tBodyAcc-Min-2,tBodyAcc-Min-3,tBodyAcc-SMA-1,tBodyAcc-Energy-1,tBodyAcc-Energy-2,tBodyAcc-Energy-3,tBodyAcc-IQR-1,tBodyAcc-IQR-2,tBodyAcc-IQR-3,tBodyAcc-ropy-1,tBodyAcc-ropy-2,tBodyAcc-ropy-3,tBodyAcc-ARCoeff-1,tBodyAcc-ARCoeff-2,tBodyAcc-ARCoeff-3,tBodyAcc-ARCoeff-4,tBodyAcc-ARCoeff-5,tBodyAcc-ARCoeff-6,tBodyAcc-ARCoeff-7,tBodyAcc-ARCoeff-8,tBodyAcc-ARCoeff-9,tBodyAcc-ARCoeff-10,tBodyAcc-ARCoeff-11,tBodyAcc-ARCoeff-12,tBodyAcc-Correlation-1,tBodyAcc-Correlation-2,tBodyAcc-Correlation-3,tGravityAcc-Mean-1,tGravityAcc-Mean-2,tGravityAcc-Mean-3,tGravityAcc-STD-1,tGravityAcc-STD-2,tGravityAcc-STD-3,tGravityAcc-Mad-1,tGravityAcc-Mad-2,tGravityAcc-Mad-3,tGravityAcc-Max-1,...,fBodyAccMag-MaxInds-1,fBodyAccMag-MeanFreq-1,fBodyAccMag-Skewness-1,fBodyAccMag-Kurtosis-1,fBodyAccJerkMag-Mean-1,fBodyAccJerkMag-STD-1,fBodyAccJerkMag-Mad-1,fBodyAccJerkMag-Max-1,fBodyAccJerkMag-Min-1,fBodyAccJerkMag-SMA-1,fBodyAccJerkMag-Energy-1,fBodyAccJerkMag-IQR-1,fBodyAccJerkMag-ropy-1,fBodyAccJerkMag-MaxInds-1,fBodyAccJerkMag-MeanFreq-1,fBodyAccJerkMag-Skewness-1,fBodyAccJerkMag-Kurtosis-1,fBodyGyroMag-Mean-1,fBodyGyroMag-STD-1,fBodyGyroMag-Mad-1,fBodyGyroMag-Max-1,fBodyGyroMag-Min-1,fBodyGyroMag-SMA-1,fBodyGyroMag-Energy-1,fBodyGyroMag-IQR-1,fBodyGyroMag-ropy-1,fBodyGyroMag-MaxInds-1,fBodyGyroMag-MeanFreq-1,fBodyGyroMag-Skewness-1,fBodyGyroMag-Kurtosis-1,fBodyGyroJerkMag-Mean-1,fBodyGyroJerkMag-STD-1,fBodyGyroJerkMag-Mad-1,fBodyGyroJerkMag-Max-1,fBodyGyroJerkMag-Min-1,fBodyGyroJerkMag-SMA-1,fBodyGyroJerkMag-Energy-1,fBodyGyroJerkMag-IQR-1,fBodyGyroJerkMag-ropy-1,fBodyGyroJerkMag-MaxInds-1,fBodyGyroJerkMag-MeanFreq-1,fBodyGyroJerkMag-Skewness-1,fBodyGyroJerkMag-Kurtosis-1,tBodyAcc-AngleWRTGravity-1,tBodyAccJerk-AngleWRTGravity-1,tBodyGyro-AngleWRTGravity-1,tBodyGyroJerk-AngleWRTGravity-1
,tXAxisAcc-AngleWRTGravity-1,tYAxisAcc-AngleWRTGravity-1,tZAxisAcc-AngleWRTGravity-1
0,0.04358,-0.00597,-0.035054,-0.995381,-0.988366,-0.937382,-0.995007,-0.988816,-0.953325,-0.794796,-0.744893,-0.648447,0.841796,0.70844,0.651716,-0.975752,-0.99995,-0.999888,-0.998014,-0.993999,-0.99198,-0.97097,-0.547095,-0.700974,-0.622697,0.921884,-0.719483,0.342168,-0.161318,0.266049,-0.274351,0.267205,-0.020958,0.38261,-0.501748,0.512463,-0.206337,0.376778,0.435172,0.660199,0.960051,-0.135939,0.115556,-0.988134,-0.982693,-0.919723,-0.988362,-0.985523,-0.931834,0.892055,...,-0.842105,-0.061629,-0.44612,-0.797046,-0.99361,-0.994226,-0.992839,-0.993778,-0.988172,-0.99361,-0.999918,-0.991736,-1.0,-0.936508,0.34926,-0.517127,-0.801006,-0.980135,-0.961301,-0.974129,-0.956013,-0.989894,-0.980135,-0.99924,-0.992673,-0.701291,-1.0,-0.13248,0.565697,0.363478,-0.991994,-0.990877,-0.990169,-0.992521,-0.991044,-0.991994,-0.999937,-0.990537,-0.871306,-1.0,-0.012236,-0.314848,-0.713308,-0.112754,0.0304,-0.464761,-0.018446,-0.841559,0.179913,-0.051718
1,0.03948,-0.002131,-0.029067,-0.998348,-0.982945,-0.971273,-0.998702,-0.983315,-0.974,-0.802537,-0.736338,-0.712415,0.838758,0.70844,0.65934,-0.987427,-0.999993,-0.999826,-0.999411,-0.998918,-0.985482,-0.973481,-0.781973,-0.534604,-0.593165,0.607435,-0.266783,0.275882,0.200417,0.131266,-0.149017,0.292436,-0.192986,0.217496,-0.089175,0.059909,-0.236609,-0.012696,-0.072711,0.578649,0.963215,-0.136648,0.109558,-0.997918,-0.990006,-0.95516,-0.998358,-0.990346,-0.956796,0.89206,...,-1.0,-0.01827,-0.128777,-0.448744,-0.99022,-0.992431,-0.990594,-0.994902,-0.989545,-0.99022,-0.999867,-0.991506,-1.0,-0.84127,0.533688,-0.625993,-0.898311,-0.988296,-0.983313,-0.982951,-0.987406,-0.992134,-0.988296,-0.999811,-0.993996,-0.720683,-0.948718,-0.268979,-0.364219,-0.723724,-0.995857,-0.99658,-0.995671,-0.996939,-0.994436,-0.995857,-0.999981,-0.994623,-1.0,-1.0,0.202804,-0.603199,-0.860677,0.053477,-0.007435,-0.732626,0.703511,-0.845092,0.180261,-0.047436
2,0.039978,-0.005153,-0.022651,-0.995482,-0.977314,-0.98476,-0.996415,-0.975835,-0.985973,-0.798477,-0.736338,-0.712415,0.834002,0.705008,0.674551,-0.988528,-0.999972,-0.999719,-0.999803,-0.996898,-0.976781,-0.986754,-0.688176,-0.520514,-0.593165,0.272262,-0.056424,0.322283,-0.273292,0.03718,-0.133612,0.332487,-0.240491,0.348733,-0.195409,0.229436,-0.316816,-0.123889,-0.181137,0.608219,0.963532,-0.137105,0.102062,-0.999657,-0.993236,-0.995364,-0.999717,-0.993122,-0.995437,0.892401,...,-0.894737,0.277458,-0.630062,-0.880125,-0.989165,-0.991337,-0.988135,-0.993592,-0.999886,-0.989165,-0.999845,-0.987029,-1.0,-0.904762,0.661975,-0.725887,-0.926663,-0.989255,-0.986019,-0.984533,-0.991701,-0.995857,-0.989255,-0.999854,-0.993256,-0.736521,-0.794872,-0.212429,-0.564868,-0.874594,-0.995034,-0.995308,-0.994868,-0.996133,-0.995863,-0.995034,-0.999973,-0.993834,-1.0,-0.555556,0.440079,-0.404427,-0.761847,-0.118559,0.177899,0.100699,0.808529,-0.84923,0.18061,-0.042271


In [8]:
# Shape of the test features, then the per-column dtypes laid out as a
# single row, then the first three samples.
print('Size of test data', X_test.shape)
display(
    X_test.dtypes.to_frame(name='dtype').T,
    X_test.head(3),
)

Size of test data (3162, 561)


Unnamed: 0,tBodyAcc-Mean-1,tBodyAcc-Mean-2,tBodyAcc-Mean-3,tBodyAcc-STD-1,tBodyAcc-STD-2,tBodyAcc-STD-3,tBodyAcc-Mad-1,tBodyAcc-Mad-2,tBodyAcc-Mad-3,tBodyAcc-Max-1,tBodyAcc-Max-2,tBodyAcc-Max-3,tBodyAcc-Min-1,tBodyAcc-Min-2,tBodyAcc-Min-3,tBodyAcc-SMA-1,tBodyAcc-Energy-1,tBodyAcc-Energy-2,tBodyAcc-Energy-3,tBodyAcc-IQR-1,tBodyAcc-IQR-2,tBodyAcc-IQR-3,tBodyAcc-ropy-1,tBodyAcc-ropy-2,tBodyAcc-ropy-3,tBodyAcc-ARCoeff-1,tBodyAcc-ARCoeff-2,tBodyAcc-ARCoeff-3,tBodyAcc-ARCoeff-4,tBodyAcc-ARCoeff-5,tBodyAcc-ARCoeff-6,tBodyAcc-ARCoeff-7,tBodyAcc-ARCoeff-8,tBodyAcc-ARCoeff-9,tBodyAcc-ARCoeff-10,tBodyAcc-ARCoeff-11,tBodyAcc-ARCoeff-12,tBodyAcc-Correlation-1,tBodyAcc-Correlation-2,tBodyAcc-Correlation-3,tGravityAcc-Mean-1,tGravityAcc-Mean-2,tGravityAcc-Mean-3,tGravityAcc-STD-1,tGravityAcc-STD-2,tGravityAcc-STD-3,tGravityAcc-Mad-1,tGravityAcc-Mad-2,tGravityAcc-Mad-3,tGravityAcc-Max-1,...,fBodyAccMag-MaxInds-1,fBodyAccMag-MeanFreq-1,fBodyAccMag-Skewness-1,fBodyAccMag-Kurtosis-1,fBodyAccJerkMag-Mean-1,fBodyAccJerkMag-STD-1,fBodyAccJerkMag-Mad-1,fBodyAccJerkMag-Max-1,fBodyAccJerkMag-Min-1,fBodyAccJerkMag-SMA-1,fBodyAccJerkMag-Energy-1,fBodyAccJerkMag-IQR-1,fBodyAccJerkMag-ropy-1,fBodyAccJerkMag-MaxInds-1,fBodyAccJerkMag-MeanFreq-1,fBodyAccJerkMag-Skewness-1,fBodyAccJerkMag-Kurtosis-1,fBodyGyroMag-Mean-1,fBodyGyroMag-STD-1,fBodyGyroMag-Mad-1,fBodyGyroMag-Max-1,fBodyGyroMag-Min-1,fBodyGyroMag-SMA-1,fBodyGyroMag-Energy-1,fBodyGyroMag-IQR-1,fBodyGyroMag-ropy-1,fBodyGyroMag-MaxInds-1,fBodyGyroMag-MeanFreq-1,fBodyGyroMag-Skewness-1,fBodyGyroMag-Kurtosis-1,fBodyGyroJerkMag-Mean-1,fBodyGyroJerkMag-STD-1,fBodyGyroJerkMag-Mad-1,fBodyGyroJerkMag-Max-1,fBodyGyroJerkMag-Min-1,fBodyGyroJerkMag-SMA-1,fBodyGyroJerkMag-Energy-1,fBodyGyroJerkMag-IQR-1,fBodyGyroJerkMag-ropy-1,fBodyGyroJerkMag-MaxInds-1,fBodyGyroJerkMag-MeanFreq-1,fBodyGyroJerkMag-Skewness-1,fBodyGyroJerkMag-Kurtosis-1,tBodyAcc-AngleWRTGravity-1,tBodyAccJerk-AngleWRTGravity-1,tBodyGyro-AngleWRTGravity-1,tBodyGyroJerk-AngleWRTGravity-1
,tXAxisAcc-AngleWRTGravity-1,tYAxisAcc-AngleWRTGravity-1,tZAxisAcc-AngleWRTGravity-1
dtype,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,...,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64,float64


Unnamed: 0,tBodyAcc-Mean-1,tBodyAcc-Mean-2,tBodyAcc-Mean-3,tBodyAcc-STD-1,tBodyAcc-STD-2,tBodyAcc-STD-3,tBodyAcc-Mad-1,tBodyAcc-Mad-2,tBodyAcc-Mad-3,tBodyAcc-Max-1,tBodyAcc-Max-2,tBodyAcc-Max-3,tBodyAcc-Min-1,tBodyAcc-Min-2,tBodyAcc-Min-3,tBodyAcc-SMA-1,tBodyAcc-Energy-1,tBodyAcc-Energy-2,tBodyAcc-Energy-3,tBodyAcc-IQR-1,tBodyAcc-IQR-2,tBodyAcc-IQR-3,tBodyAcc-ropy-1,tBodyAcc-ropy-2,tBodyAcc-ropy-3,tBodyAcc-ARCoeff-1,tBodyAcc-ARCoeff-2,tBodyAcc-ARCoeff-3,tBodyAcc-ARCoeff-4,tBodyAcc-ARCoeff-5,tBodyAcc-ARCoeff-6,tBodyAcc-ARCoeff-7,tBodyAcc-ARCoeff-8,tBodyAcc-ARCoeff-9,tBodyAcc-ARCoeff-10,tBodyAcc-ARCoeff-11,tBodyAcc-ARCoeff-12,tBodyAcc-Correlation-1,tBodyAcc-Correlation-2,tBodyAcc-Correlation-3,tGravityAcc-Mean-1,tGravityAcc-Mean-2,tGravityAcc-Mean-3,tGravityAcc-STD-1,tGravityAcc-STD-2,tGravityAcc-STD-3,tGravityAcc-Mad-1,tGravityAcc-Mad-2,tGravityAcc-Mad-3,tGravityAcc-Max-1,...,fBodyAccMag-MaxInds-1,fBodyAccMag-MeanFreq-1,fBodyAccMag-Skewness-1,fBodyAccMag-Kurtosis-1,fBodyAccJerkMag-Mean-1,fBodyAccJerkMag-STD-1,fBodyAccJerkMag-Mad-1,fBodyAccJerkMag-Max-1,fBodyAccJerkMag-Min-1,fBodyAccJerkMag-SMA-1,fBodyAccJerkMag-Energy-1,fBodyAccJerkMag-IQR-1,fBodyAccJerkMag-ropy-1,fBodyAccJerkMag-MaxInds-1,fBodyAccJerkMag-MeanFreq-1,fBodyAccJerkMag-Skewness-1,fBodyAccJerkMag-Kurtosis-1,fBodyGyroMag-Mean-1,fBodyGyroMag-STD-1,fBodyGyroMag-Mad-1,fBodyGyroMag-Max-1,fBodyGyroMag-Min-1,fBodyGyroMag-SMA-1,fBodyGyroMag-Energy-1,fBodyGyroMag-IQR-1,fBodyGyroMag-ropy-1,fBodyGyroMag-MaxInds-1,fBodyGyroMag-MeanFreq-1,fBodyGyroMag-Skewness-1,fBodyGyroMag-Kurtosis-1,fBodyGyroJerkMag-Mean-1,fBodyGyroJerkMag-STD-1,fBodyGyroJerkMag-Mad-1,fBodyGyroJerkMag-Max-1,fBodyGyroJerkMag-Min-1,fBodyGyroJerkMag-SMA-1,fBodyGyroJerkMag-Energy-1,fBodyGyroJerkMag-IQR-1,fBodyGyroJerkMag-ropy-1,fBodyGyroJerkMag-MaxInds-1,fBodyGyroJerkMag-MeanFreq-1,fBodyGyroJerkMag-Skewness-1,fBodyGyroJerkMag-Kurtosis-1,tBodyAcc-AngleWRTGravity-1,tBodyAccJerk-AngleWRTGravity-1,tBodyGyro-AngleWRTGravity-1,tBodyGyroJerk-AngleWRTGravity-1
,tXAxisAcc-AngleWRTGravity-1,tYAxisAcc-AngleWRTGravity-1,tZAxisAcc-AngleWRTGravity-1
0,0.030914,-0.008927,0.040382,-0.938504,-0.944626,-0.759334,-0.952398,-0.950281,-0.802483,-0.757099,-0.733398,-0.40796,0.728511,0.658266,0.629169,-0.913306,-0.997966,-0.998683,-0.975818,-0.97544,-0.966793,-0.914396,-0.363822,-0.420897,0.181772,0.517928,-0.403636,0.449325,-0.147545,0.22315,-0.190143,0.155899,0.054035,0.053156,-3.7e-05,-0.077888,0.028585,0.077659,-0.490616,-0.711964,0.933151,-0.27736,0.115469,-0.940012,-0.94046,-0.714148,-0.945699,-0.942284,-0.7447,0.906083,...,-1.0,-0.448379,0.005537,-0.383555,-0.894952,-0.896808,-0.889015,-0.928866,-0.898096,-0.894952,-0.993471,-0.921836,-0.484619,-1.0,-0.031754,-0.255114,-0.698671,-0.77061,-0.797105,-0.769223,-0.834266,-0.940359,-0.77061,-0.970958,-0.798403,0.179435,-1.0,-0.054576,-0.49682,-0.764755,-0.890169,-0.90748,-0.895518,-0.917953,-0.909825,-0.890169,-0.994105,-0.898097,-0.234815,-1.0,0.12283,-0.345684,-0.709087,0.006462,0.16292,-0.825886,0.271151,-0.720559,0.276779,-0.051074
1,0.042548,0.001079,-0.026236,-0.975516,-0.977502,-0.960146,-0.986694,-0.978983,-0.96682,-0.757099,-0.733398,-0.701699,0.770927,0.706301,0.635732,-0.978295,-0.999618,-0.999708,-0.999158,-0.993775,-0.982664,-0.974733,-0.466563,-0.392219,-0.435565,0.504355,-0.117122,0.062621,0.188184,0.209414,-0.245994,0.390254,-0.2478,0.210276,-0.146806,0.106145,-0.022423,-0.104187,-0.429196,0.398133,0.924068,-0.283835,0.152755,-0.991197,-0.984752,-0.976904,-0.991464,-0.984357,-0.977489,0.856176,...,-0.894737,0.224164,-0.214108,-0.599074,-0.945325,-0.934609,-0.930151,-0.950377,-0.967702,-0.945325,-0.99761,-0.957543,-0.723642,-1.0,-0.486025,-0.216243,-0.664383,-0.924461,-0.916766,-0.920964,-0.924413,-0.991454,-0.924461,-0.995727,-0.933145,-0.21886,-1.0,-0.039379,-0.11658,-0.46726,-0.951981,-0.938387,-0.93823,-0.949994,-0.986899,-0.951981,-0.998272,-0.951332,-0.431053,-1.0,-0.314688,-0.142804,-0.600867,-0.083495,0.0175,-0.434375,0.920593,-0.698684,0.281322,-0.076825
2,0.038297,-0.01166,-0.025643,-0.993922,-0.979215,-0.97303,-0.994298,-0.980535,-0.977508,-0.799005,-0.745911,-0.695737,0.837921,0.69052,0.659163,-0.983764,-0.999959,-0.999645,-0.999527,-0.993224,-0.983084,-0.981887,-0.707815,-0.716036,-0.560652,0.241698,-0.081234,0.055641,0.103205,0.009404,-0.12318,0.439879,-0.402218,0.305289,-0.284243,0.637201,-0.572356,0.306166,-0.323897,0.278536,0.926579,-0.282139,0.146271,-0.996731,-0.988875,-0.987926,-0.996877,-0.989432,-0.98723,0.856269,...,-1.0,0.360245,-0.790164,-0.946104,-0.970955,-0.970773,-0.969403,-0.975865,-0.976354,-0.970955,-0.999269,-0.978591,-0.898,-1.0,0.143718,-0.206895,-0.638213,-0.975209,-0.97399,-0.967707,-0.984206,-0.997741,-0.975209,-0.999504,-0.968278,-0.561266,-0.897436,-0.170494,-0.692859,-0.927681,-0.985692,-0.983452,-0.983649,-0.98693,-0.989605,-0.985692,-0.999831,-0.986227,-0.809976,-0.936508,0.11473,-0.209525,-0.6455,-0.034956,0.202302,0.064103,0.145068,-0.703355,0.280062,-0.072302


In [9]:
# Parse activity_labels.txt: every row is split on whitespace into a
# (label id, activity name) pair.
activity_labels = np.array([
    row.rstrip().split()
    for row in pd.read_table(root + 'activity_labels.txt', header=None).values.flatten()
])

# Lookup tables in both directions: integer id -> name and name -> integer id.
label2activity_dict = {int(label_id): name for label_id, name in activity_labels}
activity2label_dict = {name: int(label_id) for label_id, name in activity_labels}

In [23]:
# Activities to keep, given by name, and their integer label ids looked up
# in activity2label_dict.
classe_names_inc = [
    'WALKING',
    'WALKING_UPSTAIRS',
    'WALKING_DOWNSTAIRS',
    'SITTING',
    'STANDING',
    'LAYING',
]
classe_ids_inc = [activity2label_dict[name] for name in classe_names_inc]

In [33]:
# Row labels of the training samples whose activity id is one of the selected classes.
y_train.loc[y_train[0].isin(classe_ids_inc)].index

Int64Index([   0,    1,    2,    3,    4,    5,    6,    7,    8,    9,
            ...
            7757, 7758, 7759, 7760, 7761, 7762, 7763, 7764, 7765, 7766],
           dtype='int64', length=7415)

In [37]:
# Keep only the training samples whose label is one of the selected classes.
# The boolean mask is applied positionally (row i of X_train pairs with row i
# of y_train). The previous version passed y_train's index *labels* to .iloc,
# which expects positions and is only correct while the index is exactly 0..n-1.
# reset_index() keeps the original row label in an 'index' column, as before.
X_train.loc[y_train[0].isin(classe_ids_inc).to_numpy()].reset_index()

Unnamed: 0,index,tBodyAcc-Mean-1,tBodyAcc-Mean-2,tBodyAcc-Mean-3,tBodyAcc-STD-1,tBodyAcc-STD-2,tBodyAcc-STD-3,tBodyAcc-Mad-1,tBodyAcc-Mad-2,tBodyAcc-Mad-3,tBodyAcc-Max-1,tBodyAcc-Max-2,tBodyAcc-Max-3,tBodyAcc-Min-1,tBodyAcc-Min-2,tBodyAcc-Min-3,tBodyAcc-SMA-1,tBodyAcc-Energy-1,tBodyAcc-Energy-2,tBodyAcc-Energy-3,tBodyAcc-IQR-1,tBodyAcc-IQR-2,tBodyAcc-IQR-3,tBodyAcc-ropy-1,tBodyAcc-ropy-2,tBodyAcc-ropy-3,tBodyAcc-ARCoeff-1,tBodyAcc-ARCoeff-2,tBodyAcc-ARCoeff-3,tBodyAcc-ARCoeff-4,tBodyAcc-ARCoeff-5,tBodyAcc-ARCoeff-6,tBodyAcc-ARCoeff-7,tBodyAcc-ARCoeff-8,tBodyAcc-ARCoeff-9,tBodyAcc-ARCoeff-10,tBodyAcc-ARCoeff-11,tBodyAcc-ARCoeff-12,tBodyAcc-Correlation-1,tBodyAcc-Correlation-2,tBodyAcc-Correlation-3,tGravityAcc-Mean-1,tGravityAcc-Mean-2,tGravityAcc-Mean-3,tGravityAcc-STD-1,tGravityAcc-STD-2,tGravityAcc-STD-3,tGravityAcc-Mad-1,tGravityAcc-Mad-2,tGravityAcc-Mad-3,...,fBodyAccMag-MaxInds-1,fBodyAccMag-MeanFreq-1,fBodyAccMag-Skewness-1,fBodyAccMag-Kurtosis-1,fBodyAccJerkMag-Mean-1,fBodyAccJerkMag-STD-1,fBodyAccJerkMag-Mad-1,fBodyAccJerkMag-Max-1,fBodyAccJerkMag-Min-1,fBodyAccJerkMag-SMA-1,fBodyAccJerkMag-Energy-1,fBodyAccJerkMag-IQR-1,fBodyAccJerkMag-ropy-1,fBodyAccJerkMag-MaxInds-1,fBodyAccJerkMag-MeanFreq-1,fBodyAccJerkMag-Skewness-1,fBodyAccJerkMag-Kurtosis-1,fBodyGyroMag-Mean-1,fBodyGyroMag-STD-1,fBodyGyroMag-Mad-1,fBodyGyroMag-Max-1,fBodyGyroMag-Min-1,fBodyGyroMag-SMA-1,fBodyGyroMag-Energy-1,fBodyGyroMag-IQR-1,fBodyGyroMag-ropy-1,fBodyGyroMag-MaxInds-1,fBodyGyroMag-MeanFreq-1,fBodyGyroMag-Skewness-1,fBodyGyroMag-Kurtosis-1,fBodyGyroJerkMag-Mean-1,fBodyGyroJerkMag-STD-1,fBodyGyroJerkMag-Mad-1,fBodyGyroJerkMag-Max-1,fBodyGyroJerkMag-Min-1,fBodyGyroJerkMag-SMA-1,fBodyGyroJerkMag-Energy-1,fBodyGyroJerkMag-IQR-1,fBodyGyroJerkMag-ropy-1,fBodyGyroJerkMag-MaxInds-1,fBodyGyroJerkMag-MeanFreq-1,fBodyGyroJerkMag-Skewness-1,fBodyGyroJerkMag-Kurtosis-1,tBodyAcc-AngleWRTGravity-1,tBodyAccJerk-AngleWRTGravity-1,tBodyGyro-AngleWRTGravity-1,tBodyGyroJerk-AngleWRTGravity-1,tXAxisAcc-A
ngleWRTGravity-1,tYAxisAcc-AngleWRTGravity-1,tZAxisAcc-AngleWRTGravity-1
0,0,0.043580,-0.005970,-0.035054,-0.995381,-0.988366,-0.937382,-0.995007,-0.988816,-0.953325,-0.794796,-0.744893,-0.648447,0.841796,0.708440,0.651716,-0.975752,-0.999950,-0.999888,-0.998014,-0.993999,-0.991980,-0.970970,-0.547095,-0.700974,-0.622697,0.921884,-0.719483,0.342168,-0.161318,0.266049,-0.274351,0.267205,-0.020958,0.382610,-0.501748,0.512463,-0.206337,0.376778,0.435172,0.660199,0.960051,-0.135939,0.115556,-0.988134,-0.982693,-0.919723,-0.988362,-0.985523,-0.931834,...,-0.842105,-0.061629,-0.446120,-0.797046,-0.993610,-0.994226,-0.992839,-0.993778,-0.988172,-0.993610,-0.999918,-0.991736,-1.000000,-0.936508,0.349260,-0.517127,-0.801006,-0.980135,-0.961301,-0.974129,-0.956013,-0.989894,-0.980135,-0.999240,-0.992673,-0.701291,-1.000000,-0.132480,0.565697,0.363478,-0.991994,-0.990877,-0.990169,-0.992521,-0.991044,-0.991994,-0.999937,-0.990537,-0.871306,-1.000000,-0.012236,-0.314848,-0.713308,-0.112754,0.030400,-0.464761,-0.018446,-0.841559,0.179913,-0.051718
1,1,0.039480,-0.002131,-0.029067,-0.998348,-0.982945,-0.971273,-0.998702,-0.983315,-0.974000,-0.802537,-0.736338,-0.712415,0.838758,0.708440,0.659340,-0.987427,-0.999993,-0.999826,-0.999411,-0.998918,-0.985482,-0.973481,-0.781973,-0.534604,-0.593165,0.607435,-0.266783,0.275882,0.200417,0.131266,-0.149017,0.292436,-0.192986,0.217496,-0.089175,0.059909,-0.236609,-0.012696,-0.072711,0.578649,0.963215,-0.136648,0.109558,-0.997918,-0.990006,-0.955160,-0.998358,-0.990346,-0.956796,...,-1.000000,-0.018270,-0.128777,-0.448744,-0.990220,-0.992431,-0.990594,-0.994902,-0.989545,-0.990220,-0.999867,-0.991506,-1.000000,-0.841270,0.533688,-0.625993,-0.898311,-0.988296,-0.983313,-0.982951,-0.987406,-0.992134,-0.988296,-0.999811,-0.993996,-0.720683,-0.948718,-0.268979,-0.364219,-0.723724,-0.995857,-0.996580,-0.995671,-0.996939,-0.994436,-0.995857,-0.999981,-0.994623,-1.000000,-1.000000,0.202804,-0.603199,-0.860677,0.053477,-0.007435,-0.732626,0.703511,-0.845092,0.180261,-0.047436
2,2,0.039978,-0.005153,-0.022651,-0.995482,-0.977314,-0.984760,-0.996415,-0.975835,-0.985973,-0.798477,-0.736338,-0.712415,0.834002,0.705008,0.674551,-0.988528,-0.999972,-0.999719,-0.999803,-0.996898,-0.976781,-0.986754,-0.688176,-0.520514,-0.593165,0.272262,-0.056424,0.322283,-0.273292,0.037180,-0.133612,0.332487,-0.240491,0.348733,-0.195409,0.229436,-0.316816,-0.123889,-0.181137,0.608219,0.963532,-0.137105,0.102062,-0.999657,-0.993236,-0.995364,-0.999717,-0.993122,-0.995437,...,-0.894737,0.277458,-0.630062,-0.880125,-0.989165,-0.991337,-0.988135,-0.993592,-0.999886,-0.989165,-0.999845,-0.987029,-1.000000,-0.904762,0.661975,-0.725887,-0.926663,-0.989255,-0.986019,-0.984533,-0.991701,-0.995857,-0.989255,-0.999854,-0.993256,-0.736521,-0.794872,-0.212429,-0.564868,-0.874594,-0.995034,-0.995308,-0.994868,-0.996133,-0.995863,-0.995034,-0.999973,-0.993834,-1.000000,-0.555556,0.440079,-0.404427,-0.761847,-0.118559,0.177899,0.100699,0.808529,-0.849230,0.180610,-0.042271
3,3,0.039785,-0.011809,-0.028916,-0.996194,-0.988569,-0.993256,-0.996994,-0.988526,-0.993135,-0.798477,-0.752778,-0.722186,0.834002,0.705008,0.673208,-0.990389,-0.999978,-0.999783,-0.999815,-0.996949,-0.989437,-0.992440,-0.715103,-0.860988,-0.916429,0.062816,0.082940,0.200566,-0.378262,0.090063,-0.209264,0.316530,-0.090862,0.396383,-0.353643,0.503754,-0.490389,-0.304759,-0.362708,0.506602,0.964269,-0.139065,0.100028,-0.997302,-0.982395,-0.985890,-0.997251,-0.982317,-0.986065,...,-1.000000,0.096998,-0.478367,-0.756585,-0.992654,-0.992170,-0.989917,-0.994868,-0.995559,-0.992654,-0.999894,-0.988427,-1.000000,1.000000,0.680038,-0.702305,-0.907781,-0.989413,-0.987827,-0.987057,-0.987801,-0.996334,-0.989413,-0.999876,-0.989153,-0.720891,-1.000000,-0.043398,-0.257142,-0.516341,-0.995224,-0.995417,-0.995951,-0.995346,-0.995728,-0.995224,-0.999974,-0.995305,-0.955696,-0.936508,0.430891,-0.138373,-0.491604,-0.036788,-0.012892,0.640011,-0.485366,-0.848947,0.181907,-0.040826
4,4,0.038758,-0.002289,-0.023863,-0.998241,-0.986774,-0.993115,-0.998216,-0.986479,-0.993825,-0.801982,-0.746505,-0.717858,0.838581,0.705854,0.673208,-0.995057,-0.999992,-0.999882,-0.999908,-0.997772,-0.987726,-0.995109,-0.836774,-0.589200,-0.773771,0.312105,-0.095254,0.194399,-0.007998,0.266740,-0.318965,0.409731,-0.224589,0.520354,-0.319167,0.234376,-0.102650,-0.154974,-0.189796,0.598515,0.964878,-0.143824,0.094663,-0.998736,-0.988731,-0.986066,-0.998767,-0.989455,-0.986376,...,-1.000000,0.411015,-0.119313,-0.481119,-0.995407,-0.994860,-0.994169,-0.995898,-0.982174,-0.995407,-0.999941,-0.994542,-1.000000,-1.000000,0.560592,-0.529957,-0.857124,-0.991433,-0.989051,-0.987932,-0.992145,-0.998404,-0.991433,-0.999902,-0.989339,-0.763372,-0.897436,-0.270529,-0.539596,-0.833661,-0.995096,-0.995645,-0.995508,-0.995683,-0.997414,-0.995096,-0.999974,-0.995566,-1.000000,-0.936508,0.137735,-0.366214,-0.702490,0.123320,0.122542,0.693578,-0.615971,-0.848164,0.185124,-0.037080
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
7410,7762,0.048048,-0.042445,-0.065884,-0.195448,-0.278326,-0.219954,-0.282233,-0.305861,-0.357803,0.267874,-0.209017,-0.071229,0.358185,0.210893,0.153409,-0.288219,-0.703984,-0.823789,-0.806079,-0.500917,-0.444521,-0.480595,-0.085674,0.063228,-0.129545,-0.553916,0.387004,-0.041522,-0.159446,-0.069030,0.028946,-0.053502,0.338292,-0.220301,0.181078,-0.107963,0.132397,-0.210953,-0.251623,-0.285560,0.919814,-0.216841,-0.039336,-0.955305,-0.865364,-0.913023,-0.960526,-0.861557,-0.922330,...,-0.842105,-0.185470,-0.416105,-0.658815,-0.271440,-0.287857,-0.221972,-0.352139,-0.937298,-0.271440,-0.732994,-0.303834,0.354983,-0.904762,-0.062939,-0.077457,-0.425200,-0.332753,-0.129722,-0.146246,-0.309831,-0.995294,-0.332753,-0.605727,-0.292613,0.577573,-0.897436,-0.368534,-0.197418,-0.556747,-0.681100,-0.724107,-0.647607,-0.799516,-0.925237,-0.681100,-0.951092,-0.599138,0.310836,-0.904762,-0.008381,-0.596760,-0.879026,-0.190437,0.829718,0.206972,-0.425619,-0.792292,0.238580,0.056020
7411,7763,0.037639,0.006430,-0.044345,-0.235372,-0.302680,-0.232843,-0.322483,-0.354464,-0.345592,0.181271,-0.209017,-0.032557,0.365442,0.227092,0.153409,-0.318111,-0.732559,-0.837484,-0.814302,-0.519880,-0.520277,-0.484334,-0.099061,0.206285,-0.100579,-0.355994,0.147814,0.208128,-0.262731,0.052048,-0.117448,0.075208,0.289009,-0.168158,0.044478,0.242653,-0.223244,-0.197696,-0.225904,-0.276714,0.915010,-0.236826,-0.039707,-0.962673,-0.933049,-0.914388,-0.968759,-0.943068,-0.921418,...,-0.842105,0.029700,-0.260459,-0.556568,-0.352958,-0.323685,-0.258791,-0.411116,-0.805083,-0.352958,-0.775856,-0.374212,0.361739,-0.904762,-0.189792,-0.152674,-0.507979,-0.357992,-0.187109,-0.226351,-0.199654,-0.919361,-0.357992,-0.649987,-0.427590,0.620646,-0.846154,-0.292100,-0.005408,-0.283893,-0.682759,-0.771343,-0.727237,-0.779415,-0.761876,-0.682759,-0.957032,-0.670128,0.207930,-0.904762,0.209452,-0.404418,-0.684496,0.064907,0.875679,-0.879033,0.400219,-0.772288,0.252653,0.056252
7412,7764,0.037451,-0.002724,0.021009,-0.218281,-0.378082,-0.076950,-0.304446,-0.400661,-0.193071,0.113141,-0.334533,0.042977,0.349585,0.227092,0.151363,-0.282999,-0.720539,-0.870521,-0.731586,-0.488447,-0.500856,-0.329875,-0.102890,0.189941,0.092430,-0.370954,0.191859,0.082682,-0.117559,0.016680,-0.085444,0.146797,0.141790,-0.215770,0.115667,0.044672,0.004797,-0.225947,-0.184732,-0.200530,0.916476,-0.231739,-0.026648,-0.982661,-0.981651,-0.845274,-0.983958,-0.982724,-0.847288,...,-0.842105,-0.204612,-0.036186,-0.381034,-0.424827,-0.326615,-0.347943,-0.316819,-0.786819,-0.424827,-0.801702,-0.490072,0.189903,-0.904762,0.010553,0.330996,0.084875,-0.351948,-0.032286,-0.209511,0.076073,-0.973172,-0.351948,-0.545002,-0.241801,0.584816,-0.846154,-0.315084,0.468934,0.302568,-0.685855,-0.726528,-0.725174,-0.709332,-0.692579,-0.685855,-0.952309,-0.696440,0.158936,-0.904762,0.237003,0.000207,-0.317314,0.052806,-0.266724,0.864404,0.701169,-0.779566,0.249121,0.047071
7413,7765,0.044011,-0.004536,-0.051242,-0.219202,-0.383350,-0.081035,-0.310419,-0.380233,-0.201007,0.166671,-0.369637,0.042977,0.325946,0.261879,0.151363,-0.274477,-0.721170,-0.872676,-0.734725,-0.488072,-0.464520,-0.377506,-0.112676,0.162452,-0.031156,-0.468350,0.274676,0.035400,-0.140051,-0.244395,0.124330,0.131594,-0.033104,-0.231405,0.165104,-0.133763,0.224279,-0.256875,-0.231141,-0.191979,0.918989,-0.228031,-0.004823,-0.979175,-0.973888,-0.903971,-0.980324,-0.976087,-0.912846,...,-0.842105,-0.202955,-0.099957,-0.462660,-0.455099,-0.378403,-0.337459,-0.424125,-0.694834,-0.455099,-0.826288,-0.560079,0.240644,-0.904762,-0.106041,0.037511,-0.304283,-0.415004,0.039203,-0.187961,0.028693,-0.960898,-0.415004,-0.510548,-0.513218,0.445207,-0.846154,-0.402999,0.285400,-0.050802,-0.712134,-0.689573,-0.702416,-0.694869,-0.886150,-0.712134,-0.951972,-0.760114,0.210070,-0.904762,0.069366,0.037919,-0.356579,-0.101360,0.700740,0.936674,-0.589479,-0.785603,0.246409,0.031700


In [35]:
# Labels restricted to the selected classes. Filtering with the boolean mask
# directly avoids feeding index *labels* into .iloc (which expects positions)
# and the redundant round trip through .index.
y_train[y_train[0].isin(classe_ids_inc)]

Unnamed: 0,0
0,5
1,5
2,5
3,5
4,5
...,...
7762,2
7763,2
7764,2
7765,2


In [18]:
# Iterating a dict yields its keys, i.e. the activity names in insertion order.
print(list(activity2label_dict))

['WALKING', 'WALKING_UPSTAIRS', 'WALKING_DOWNSTAIRS', 'SITTING', 'STANDING', 'LAYING', 'STAND_TO_SIT', 'SIT_TO_STAND', 'SIT_TO_LIE', 'LIE_TO_SIT', 'STAND_TO_LIE', 'LIE_TO_STAND']


In [10]:
# Class balance of the training labels: sample count and share per activity.
print('Size of train label', y_train.shape)
c = Counter(y_train.values.flatten())
# Iterate over the known label ids instead of range(1, len(c) + 1): the range
# assumes every id 1..K occurs in this split, so a single absent class would
# shift the reported ids and drop the highest ones. A Counter returns 0 for
# missing keys, so absent classes are now listed with 0 samples.
for label in sorted(label2activity_dict):
    print(f'label {label} ({label2activity_dict[label]}) has {c[label]} samples ({c[label] / len(y_train) * 100:.04}% of train data)')

Size of train label (7767, 1)
label 1 (WALKING) has 1226 samples (15.78% of train data)
label 2 (WALKING_UPSTAIRS) has 1073 samples (13.81% of train data)
label 3 (WALKING_DOWNSTAIRS) has 987 samples (12.71% of train data)
label 4 (SITTING) has 1293 samples (16.65% of train data)
label 5 (STANDING) has 1423 samples (18.32% of train data)
label 6 (LAYING) has 1413 samples (18.19% of train data)
label 7 (STAND_TO_SIT) has 47 samples (0.6051% of train data)
label 8 (SIT_TO_STAND) has 23 samples (0.2961% of train data)
label 9 (SIT_TO_LIE) has 75 samples (0.9656% of train data)
label 10 (LIE_TO_SIT) has 60 samples (0.7725% of train data)
label 11 (STAND_TO_LIE) has 90 samples (1.159% of train data)
label 12 (LIE_TO_STAND) has 57 samples (0.7339% of train data)


In [11]:
# Class balance of the test labels: sample count and share per activity.
print('Size of test label', y_test.shape)
c = Counter(y_test.values.flatten())
# Iterate over the known label ids instead of range(1, len(c) + 1): the range
# assumes every id 1..K occurs in this split, so a single absent class would
# shift the reported ids and drop the highest ones. A Counter returns 0 for
# missing keys, so absent classes are now listed with 0 samples.
for label in sorted(label2activity_dict):
    print(f'label {label} ({label2activity_dict[label]}) has {c[label]} samples ({c[label] / len(y_test) * 100:.04}% of test data)')

Size of test label (3162, 1)
label 1 (WALKING) has 496 samples (15.69% of test data)
label 2 (WALKING_UPSTAIRS) has 471 samples (14.9% of test data)
label 3 (WALKING_DOWNSTAIRS) has 420 samples (13.28% of test data)
label 4 (SITTING) has 508 samples (16.07% of test data)
label 5 (STANDING) has 556 samples (17.58% of test data)
label 6 (LAYING) has 545 samples (17.24% of test data)
label 7 (STAND_TO_SIT) has 23 samples (0.7274% of test data)
label 8 (SIT_TO_STAND) has 10 samples (0.3163% of test data)
label 9 (SIT_TO_LIE) has 32 samples (1.012% of test data)
label 10 (LIE_TO_SIT) has 25 samples (0.7906% of test data)
label 11 (STAND_TO_LIE) has 49 samples (1.55% of test data)
label 12 (LIE_TO_STAND) has 27 samples (0.8539% of test data)


In [12]:
# Subject id of every sample, flattened to a 1-D array per split.
subject_id_train = pd.read_table(root + 'Train/subject_id_train.txt', header=None).values.flatten()
subject_id_test = pd.read_table(root + 'Test/subject_id_test.txt', header=None).values.flatten()

# .tolist() turns the NumPy scalars into plain Python ints, so the sets print
# as {1, 3, ...} on every NumPy version (NumPy >= 2 would otherwise show
# np.int64(1), np.int64(3), ...).
print('subjects in train are: ', set(subject_id_train.tolist()))
print('subjects in test are: ', set(subject_id_test.tolist()))

subjects in train are:  {1, 3, 5, 6, 7, 8, 11, 14, 15, 16, 17, 19, 21, 22, 23, 25, 26, 27, 28, 29, 30}
subjects in test are:  {2, 4, 9, 10, 12, 13, 18, 20, 24}
