In [4]:
%matplotlib inline
import pandas as pd
import numpy as np
import matplotlib.pylab as plt
import seaborn as sns
from tsfresh.examples.robot_execution_failures import download_robot_execution_failures, load_robot_execution_failures
from tsfresh import extract_features, extract_relevant_features, select_features
from tsfresh.utilities.dataframe_functions import impute
from tsfresh.feature_extraction import ComprehensiveFCParameters
from sklearn.tree import DecisionTreeClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report

In [2]:
# Raise the logging threshold to ERROR so that lower-severity messages are hidden.
# This is not recommended for normal use, as you may overlook important warning messages.
# NOTE(review): logging.basicConfig() does nothing if the root logger already has
# handlers configured, so in some environments this call may have no effect — confirm.
import logging
logging.basicConfig(level=logging.ERROR)

In [6]:
# Load the interim field-data table; the first CSV column is used as the row index.
FIELD_DATA_CSV = '../data/interim/field_data.csv'
field_data = pd.read_csv(FIELD_DATA_CSV, index_col=0)

# Show the first rows as a quick sanity check of the loaded columns.
field_data.head()

Unnamed: 0,ts,AARD,AARG,AAVD,AAVG,AM,Fc,Speed,direction,span,id,classes
0,0.0,-6.569074,-10.717356,-9.113529,-7.193623,-8.398395,59.851273,160.173004,descente,Span1,run12_Span1,splicer
1,1.0,-6.883555,-9.547513,-6.912798,-4.47368,-6.954387,69.203842,160.173004,descente,Span1,run12_Span1,splicer
2,2.0,-6.022359,-6.864442,-8.345452,-4.4351,-6.416838,82.019447,160.173004,descente,Span1,run12_Span1,splicer
3,3.0,-6.869041,-6.433753,-8.650504,-5.939749,-6.973262,96.665985,160.173004,descente,Span1,run12_Span1,splicer
4,4.0,-4.662831,-5.525816,-9.712738,-9.759242,-7.415157,111.383583,160.173004,descente,Span1,run12_Span1,splicer


# Extract Features

In [12]:
# Columns that are not passed on to feature extraction. What remains in `df` is
# the series identifier (`id`), the sort key (`ts`) and the measured channels.
excluded_columns = ['Speed', 'direction', 'span', 'classes']
df = field_data.drop(columns=excluded_columns)

In [13]:
# Feature-calculator settings, later passed to extract_features as
# `default_fc_parameters`.
# NOTE(review): ComprehensiveFCParameters presumably enables the complete set of
# tsfresh feature calculators — confirm against the tsfresh documentation.
extraction_settings = ComprehensiveFCParameters()

In [14]:
# Build the feature matrix from the long-format frame `df`:
#   * rows of `df` are grouped into individual series by the `id` column,
#   * each series is ordered by the `ts` column,
#   * the calculators to run are taken from `extraction_settings`.
# The recorded run of this cell took roughly two minutes.
# NOTE(review): `impute` is presumably applied to the resulting matrix to replace
# NaN / infinite feature values — confirm against the tsfresh documentation.
X = extract_features(
    df,
    column_id='id',
    column_sort='ts',
    default_fc_parameters=extraction_settings,
    impute_function=impute,
)

Feature Extraction: 100%|██████████| 20/20 [01:53<00:00,  5.69s/it]


In [15]:
# Preview the first rows of the extracted feature matrix (one row per `id`).
X.head()

variable,AARD__abs_energy,AARD__absolute_sum_of_changes,"AARD__agg_autocorrelation__f_agg_""mean""__maxlag_40","AARD__agg_autocorrelation__f_agg_""median""__maxlag_40","AARD__agg_autocorrelation__f_agg_""var""__maxlag_40","AARD__agg_linear_trend__f_agg_""max""__chunk_len_10__attr_""intercept""","AARD__agg_linear_trend__f_agg_""max""__chunk_len_10__attr_""rvalue""","AARD__agg_linear_trend__f_agg_""max""__chunk_len_10__attr_""slope""","AARD__agg_linear_trend__f_agg_""max""__chunk_len_10__attr_""stderr""","AARD__agg_linear_trend__f_agg_""max""__chunk_len_50__attr_""intercept""",...,Fc__symmetry_looking__r_0.9,Fc__symmetry_looking__r_0.9500000000000001,Fc__time_reversal_asymmetry_statistic__lag_1,Fc__time_reversal_asymmetry_statistic__lag_2,Fc__time_reversal_asymmetry_statistic__lag_3,Fc__value_count__value_-1,Fc__value_count__value_0,Fc__value_count__value_1,Fc__variance,Fc__variance_larger_than_standard_deviation
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
run10_Span1,22869.505976,426.083997,-0.015499,-0.050271,0.089691,-3.501116,-0.242578,-0.059449,0.042701,-1.142191,...,1.0,1.0,500.35568,683.87769,914.524966,0.0,0.0,0.0,1015.993225,1.0
run10_Span10,20751.738963,389.018701,0.00297,-0.070024,0.037087,-5.70034,0.115396,0.017883,0.027647,-4.552589,...,1.0,1.0,1212.113893,2919.910774,4203.131412,0.0,0.0,0.0,948.927174,1.0
run10_Span11,23038.622067,488.985176,0.014179,0.011728,0.037133,-4.983168,0.168974,0.032318,0.033858,-3.242825,...,1.0,1.0,-3097.734683,-5178.645859,-5524.571441,0.0,0.0,0.0,1131.809279,1.0
run10_Span12,20680.832175,407.510224,0.006087,-0.001767,0.040271,-4.288704,-0.295094,-0.044697,0.025993,-2.528502,...,1.0,1.0,2105.924676,6306.048466,11493.374167,0.0,0.0,0.0,810.06973,1.0
run10_Span2,21384.694195,605.091819,-0.001021,-0.004073,0.034065,-3.218167,-0.293647,-0.053328,0.031695,-1.773919,...,1.0,1.0,4094.196209,7466.705061,12297.64704,0.0,0.0,0.0,1116.405135,1.0
