In [1]:
import warnings
warnings.filterwarnings(action="ignore")
import os
import ast
import pandas as pd
import numpy as np
from matplotlib import pyplot
import matplotlib.patches as mpatches
import seaborn as sn
from tqdm.std import tqdm
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler

pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)
pd.set_option('display.width', None)
pd.set_option('display.max_colwidth', None)

In [2]:
class Config:
    data_dir = '../data/'
    working_dir = '../src/'
    models_dir = '../models/'
    submissions_dir = '../submissions'

In [3]:
from google.colab import files
  
  
uploaded = files.upload()
import pandas as pd
import io

  
train = pd.read_csv(io.BytesIO(uploaded['Train.csv']))

Saving Train.csv to Train (2).csv


In [4]:
uploaded = files.upload()
metadata = pd.read_csv(io.BytesIO(uploaded['metadata.csv']))

Saving metadata.csv to metadata (2).csv


In [5]:
uploaded = files.upload()
test = pd.read_csv(io.BytesIO(uploaded['Test.csv']))

Saving Test.csv to Test (2).csv


In [6]:
uploaded = files.upload()
ss = pd.read_csv(io.BytesIO(uploaded['SampleSubmission.csv']))

Saving SampleSubmission.csv to SampleSubmission (2).csv


train = pd.read_csv(filepath_or_buffer=os.path.join(Config.data_dir, "Train.csv"))
metadata = pd.read_csv(filepath_or_buffer=os.path.join(Config.data_dir, "metadata.csv"))
test = pd.read_csv(filepath_or_buffer=os.path.join(Config.data_dir, "Test.csv"))
ss = pd.read_csv(filepath_or_buffer=os.path.join(Config.data_dir, "SampleSubmission.csv"))



In [7]:
print(metadata.isna().sum())

ID                         0
RegistrationDate           0
Deposit                    0
UpsellDate             36370
AccessoryRate              0
PaymentMethod              0
rateTypeEntity             0
RatePerUnit                0
DaysOnDeposit              0
MainApplicantGender        0
Age                     6939
Region                  1934
Town                       0
Occupation                 0
SupplierName               0
Term                       0
TotalContractValue         0
ExpectedTermDate           0
FirstPaymentDate           0
LastPaymentDate            0
dtype: int64


In [8]:
metadata[metadata.isna().Region].head(5)

Unnamed: 0,ID,RegistrationDate,Deposit,UpsellDate,AccessoryRate,PaymentMethod,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,SupplierName,Term,TotalContractValue,ExpectedTermDate,FirstPaymentDate,LastPaymentDate
3,ID_HXBJFHB,11/25/2015 0:00,2000,,0,FINANCED,DAILY,35,7,Female,43.0,,UNKNOWN,Teacher,d_light,364,14740,11/23/2016 0:00,11/25/2015 13:25,5/22/2017 16:46
17,ID_AYIBQUP,12/12/2015 0:00,2000,,0,FINANCED,DAILY,35,7,Male,44.0,,UNKNOWN,Other,d_light,364,14740,12/10/2016 0:00,12/12/2015 7:00,9/2/2020 20:30
51,ID_35MNQL1,12/6/2015 0:00,2000,,0,FINANCED,DAILY,35,7,Male,42.0,,UNKNOWN,Farmer,d_light,364,14740,12/4/2016 0:00,12/7/2015 6:21,11/18/2017 11:07
84,ID_RWA0Q3U,7/12/2017 14:44,2000,,0,FINANCED,DAILY,40,7,Female,52.0,,UNKNOWN,Government Employee,d_light,364,16560,7/11/2018 14:44,7/12/2017 14:45,9/2/2020 20:31
85,ID_QWI7WWN,11/24/2015 0:00,2000,,0,FINANCED,DAILY,35,7,Male,40.0,,UNKNOWN,Other,d_light,364,14740,11/22/2016 0:00,11/24/2015 14:02,11/25/2016 14:58


In [9]:
metadata.Region.value_counts()

Nyanza                6998
North Rift            5344
Nairobi Region        5056
South Rift            4759
Coast Region          4671
Western               4508
Mount Kenya Region    4073
Name: Region, dtype: int64

In [10]:
pd.merge(left=metadata[metadata.isna().Region], right=test, on="ID").head(2)
#test data also contains empty values in region therefore we need to treat as a category.

Unnamed: 0,ID,RegistrationDate,Deposit,UpsellDate,AccessoryRate,PaymentMethod,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,SupplierName,Term,TotalContractValue,ExpectedTermDate,FirstPaymentDate,LastPaymentDate,TransactionDates,PaymentsHistory
0,ID_UOT1MF3,7/13/2017 8:56,2000,,0,FINANCED,DAILY,40,7,Male,54.0,,UNKNOWN,Business,d_light,364,16560,7/12/2018 8:56,7/13/2017 8:56,9/2/2020 20:31,"['07-2017', '08-2017', '09-2017', '10-2017', '11-2017', '12-2017', '01-2018', '02-2018', '03-2018', '04-2018', '05-2018', '06-2018', '07-2018', '08-2018', '10-2018', '11-2018', '12-2018', '01-2019', '02-2019', '03-2019', '04-2019', '07-2019']","[2720.0, 1080.0, 1200.0, 1000.0, 960.0, 1160.0, 1120.0, 600.0, 1040.0, 840.0, 680.0, 640.0, 680.0, 520.0, 80.0, 80.0, 40.0, 40.0, 240.0, 40.0, 80.0, 40.0]"
1,ID_290EB8N,7/5/2017 9:06,2000,,0,FINANCED,DAILY,40,7,Male,31.0,,UNKNOWN,Labourer,d_light,364,16560,7/4/2018 9:06,7/5/2017 8:54,9/2/2020 20:35,"['07-2017', '08-2017', '12-2017', '01-2018', '02-2018', '03-2018', '04-2018', '05-2018', '06-2018', '07-2018', '08-2018', '09-2018', '10-2018']","[2710.0, 120.0, 200.0, 300.0, 50.0, 250.0, 550.0, 100.0, 500.0, 350.0, 350.0, 950.0, 200.0]"


In [11]:
metadata.Region.fillna(value="Other", inplace=True)

In [12]:
metadata.UpsellDate.fillna(value=0, inplace=True)

In [13]:
pd.merge(left=metadata[metadata.isna().Age], right=test, on="ID").head(2)
##now just using mean here to remove 0 in metadata.


Unnamed: 0,ID,RegistrationDate,Deposit,UpsellDate,AccessoryRate,PaymentMethod,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,SupplierName,Term,TotalContractValue,ExpectedTermDate,FirstPaymentDate,LastPaymentDate,TransactionDates,PaymentsHistory
0,ID_VJ80SX2,12/14/2015 0:00,2000,0,0,FINANCED,DAILY,35,7,Female,,Mount Kenya Region,Embu,Business,d_light,364,14740,12/12/2016 0:00,12/14/2015 14:20,12/12/2016 11:59,"['12-2015', '01-2016', '02-2016', '03-2016', '04-2016', '05-2016', '06-2016']","[3000.0, 850.0, 750.0, 1500.0, 650.0, 1250.0, 1000.0]"
1,ID_ZLW8XIB,12/5/2015 0:00,2000,0,0,FINANCED,DAILY,35,7,Male,,Mount Kenya Region,Embu,Farmer,d_light,364,14740,12/3/2016 0:00,12/5/2015 15:28,4/1/2017 19:19,"['12-2015', '01-2016', '02-2016', '03-2016', '04-2016', '05-2016', '06-2016', '07-2016', '08-2016', '09-2016', '10-2016']","[3200.0, 735.0, 1320.0, 1000.0, 1170.0, 866.0, 730.0, 100.0, 100.0, 450.0, 700.0]"


In [14]:
metadata.Age.fillna(value=round(metadata.Age.mean()), inplace=True)

In [15]:
merged = pd.merge(left=metadata, right=pd.concat(objs=[train, test]).fillna(value=0), on="ID")
merged.head(5)

Unnamed: 0,ID,RegistrationDate,Deposit,UpsellDate,AccessoryRate,PaymentMethod,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,SupplierName,Term,TotalContractValue,ExpectedTermDate,FirstPaymentDate,LastPaymentDate,TransactionDates,PaymentsHistory,m1,m2,m3,m4,m5,m6
0,ID_K00S4N4,12/10/2015 0:00,2000,0,0,FINANCED,DAILY,35,7,Male,41.0,Mount Kenya Region,Embu,Other,d_light,364,14740,12/8/2016 0:00,12/10/2015 9:52,10/23/2016 4:52,"['12-2015', '01-2016', '02-2016', '03-2016', '04-2016']","[3050.0, 1050.0, 910.0, 1050.0, 1050.0]",1225.0,1050.0,1190.0,525.0,1750.0,1890.0
1,ID_6L67PAA,12/9/2015 0:00,2000,0,0,FINANCED,DAILY,35,7,Male,33.0,Coast Region,Kilifi,Other,d_light,364,14740,12/7/2016 0:00,12/9/2015 13:14,5/24/2020 15:32,"['12-2015', '01-2016', '02-2016', '03-2016', '05-2016', '07-2016']","[4000.0, 1050.0, 1050.0, 1050.0, 1050.0, 400.0]",0.0,0.0,0.0,0.0,0.0,0.0
2,ID_102CV85,12/18/2015 0:00,2000,3/29/2018 10:14,35,FINANCED,DAILY,35,7,Female,48.0,Nairobi Region,Makueni,Business,d_light,392,29480,1/13/2017 0:00,12/18/2015 6:22,2/1/2017 15:23,"['12-2015', '01-2016', '02-2016', '03-2016', '04-2016', '05-2016', '06-2016', '07-2016', '08-2016']","[4245.0, 980.0, 735.0, 735.0, 1470.0, 735.0, 980.0, 915.0, 735.0]",980.0,980.0,1225.0,980.0,935.0,355.0
3,ID_HXBJFHB,11/25/2015 0:00,2000,0,0,FINANCED,DAILY,35,7,Female,43.0,Other,UNKNOWN,Teacher,d_light,364,14740,11/23/2016 0:00,11/25/2015 13:25,5/22/2017 16:46,"['11-2015', '12-2015', '01-2016', '02-2016', '03-2016', '04-2016', '05-2016', '06-2016', '07-2016', '08-2016', '10-2016']","[2245.0, 980.0, 980.0, 1225.0, 980.0, 980.0, 980.0, 1225.0, 735.0, 490.0, 250.0]",250.0,1000.0,250.0,500.0,560.0,1150.0
4,ID_3K9VZ5J,12/2/2015 0:00,2000,0,0,FINANCED,DAILY,35,7,Female,56.0,Mount Kenya Region,Kirinyaga,Other,d_light,364,14740,11/30/2016 0:00,12/5/2015 10:34,5/12/2017 16:50,"['12-2015', '01-2016', '02-2016', '03-2016', '04-2016', '05-2016', '06-2016', '07-2016', '08-2016', '09-2016', '10-2016', '11-2016']","[2750.0, 1000.0, 750.0, 1000.0, 955.0, 880.0, 280.0, 665.0, 770.0, 420.0, 525.0, 735.0]",630.0,805.0,700.0,855.0,245.0,775.0


In [16]:
merged.drop(["FirstPaymentDate"],axis=1,inplace=True)

In [17]:
def diff(a,b):
    start=b.split('/')
    end=a.split('/')
    return int(end[1])-int(start[1])+12*(int(end[0])-int(start[0]))

In [18]:
#merged['month']=merged['RegistrationDate']
#merged['year']=merged['RegistrationDate']
merged['time']=merged['RegistrationDate']
merged['PaidAmount']=merged['TotalContractValue']
merged['PeriodDiff']=merged['TotalContractValue']
for i in tqdm(range(0,merged.shape[0]),desc='Row'):
    year=int(merged.RegistrationDate.iloc[i].split('/')[0])
    month=int(merged.RegistrationDate.iloc[i].split('/')[1])
    time=np.ceil(merged.loc[i,'Term']/30)
    merged.loc[i,'time']=time
    if merged.UpsellDate.iloc[i]!=0:
        merged.loc[i,'UpsellDate']=diff(merged.UpsellDate.iloc[i],merged.RegistrationDate.iloc[i])/time
    merged.loc[i,'LastPaymentDate']=diff(merged.LastPaymentDate.iloc[i],merged.RegistrationDate.iloc[i])/time
    merged.loc[i,'ExpectedTermDate']=diff(merged.ExpectedTermDate.iloc[i],merged.RegistrationDate.iloc[i])/time
    merged.loc[i,'m1']=merged.loc[i,'m1']/merged.loc[i,'TotalContractValue']
    merged.loc[i,'m2']=merged.loc[i,'m2']/merged.loc[i,'TotalContractValue']
    merged.loc[i,'m3']=merged.loc[i,'m3']/merged.loc[i,'TotalContractValue']
    merged.loc[i,'m4']=merged.loc[i,'m4']/merged.loc[i,'TotalContractValue']
    merged.loc[i,'m5']=merged.loc[i,'m5']/merged.loc[i,'TotalContractValue']
    merged.loc[i,'m6']=merged.loc[i,'m6']/merged.loc[i,'TotalContractValue']
    dates=[]
    for j in merged.loc[i,'TransactionDates'].split("'"):
        if '-' in j:
            date=j.split('-')
            dates.append((int(date[0])-month+12*(int(date[1])-year))/time)
    merged.at[i,'TransactionDates']=dates
    history=[]
    for j in merged.loc[i,'PaymentsHistory'].split("[")[1].split("]")[0].split(","):
        if '.' in j:
            history.append(float(j)/merged.loc[i,'TotalContractValue'])
    merged.at[i,'PaymentsHistory']=history
    merged.loc[i,'PaidAmount']=sum(history)
    merged.loc[i,'PeriodDiff']=merged.loc[i,'LastPaymentDate']-dates[-1]
merged.drop(["RegistrationDate","Term"],axis=1,inplace=True)

Row: 100%|██████████| 37343/37343 [05:29<00:00, 113.17it/s]


In [19]:
merged.tail(2)

Unnamed: 0,ID,Deposit,UpsellDate,AccessoryRate,PaymentMethod,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,SupplierName,TotalContractValue,ExpectedTermDate,LastPaymentDate,TransactionDates,PaymentsHistory,m1,m2,m3,m4,m5,m6,time,PaidAmount,PeriodDiff
37341,ID_GHHAQ9D,2400,0,0,FINANCED,DAILY,50,3,Male,27.0,Other,UNKNOWN,Labourer,d_light,14400,11.625,3.5,"[3024.75, 3024.875, 3025.0, 3025.125, 3025.25, 3025.375, 3025.5, 3025.625, 3025.75]","[0.18194444444444444, 0.09027777777777778, 0.08333333333333333, 0.07291666666666667, 0.0763888888888889, 0.04513888888888889, 0.010416666666666666, 0.0038194444444444443, 0.021875]",0.034722,0.059028,0.045139,0.048611,0.041667,0.048611,8,0.586111,-3022.25
37342,ID_PAI1FJK,2400,0,0,FINANCED,DAILY,50,3,Male,36.0,Coast Region,Mombasa,Farmer,d_light,14400,11.625,5.25,"[3024.75, 3024.875, 3025.125, 3025.25, 3025.375, 3025.5, 3025.625, 3025.75, 3025.875]","[0.1701388888888889, 0.003472222222222222, 0.003472222222222222, 0.09375, 0.03125, 0.07291666666666667, 0.04861111111111111, 0.0798611111111111, 0.05277777777777778]",0.100694,0.055556,0.017361,0.003472,0.010417,0.045139,8,0.55625,-3020.625


In [20]:
from sklearn.preprocessing import LabelEncoder
lb_make = LabelEncoder()
category_list=['PaymentMethod','rateTypeEntity','MainApplicantGender','Region','Town','Occupation','SupplierName']
for s in category_list:
    merged[s] = lb_make.fit_transform(merged[s])
    print(lb_make.transform(lb_make.classes_))
    print(lb_make.classes_)
merged.head(2)

[0]
['FINANCED']
[0 1 2]
['DAILY' 'MONTHLY' 'WEEKLY']
[0 1]
['Female' 'Male']
[0 1 2 3 4 5 6 7]
['Coast Region' 'Mount Kenya Region' 'Nairobi Region' 'North Rift'
 'Nyanza' 'Other' 'South Rift' 'Western']
[ 0  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20 21 22 23
 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47]
['Baringo' 'Bomet' 'Bungoma' 'Busia' 'Elgeyo/Marakwet' 'Embu' 'Garissa'
 'Homa Bay' 'Isiolo' 'Kajiado' 'Kakamega' 'Kericho' 'Kiambu' 'Kilifi'
 'Kirinyaga' 'Kisii' 'Kisumu' 'Kitui' 'Kwale' 'Laikipia' 'Lamu' 'Machakos'
 'Makueni' 'Mandera' 'Marsabit' 'Meru' 'Migori' 'Mombasa' 'Muranga'
 'Nairobi City' 'Nakuru' 'Nandi' 'Narok' 'Nyamira' 'Nyandarua' 'Nyeri'
 'Samburu' 'Siaya' 'Taita/Taveta' 'Tana River' 'Tharaka-Nithi'
 'Trans Nzoia' 'Turkana' 'UNKNOWN' 'Uasin Gishu' 'Vihiga' 'Wajir'
 'West Pokot']
[0 1 2 3 4 5 6]
['Business' 'Driver/Motorbike Rider' 'Farmer' 'Government Employee'
 'Labourer' 'Other' 'Teacher']
[0]
['d_light']


Unnamed: 0,ID,Deposit,UpsellDate,AccessoryRate,PaymentMethod,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,SupplierName,TotalContractValue,ExpectedTermDate,LastPaymentDate,TransactionDates,PaymentsHistory,m1,m2,m3,m4,m5,m6,time,PaidAmount,PeriodDiff
0,ID_K00S4N4,2000,0,0,0,0,35,7,1,41.0,1,5,5,0,14740,-0.153846,-0.846154,"[1849.076923076923, 1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155]","[0.20691994572591588, 0.07123473541383989, 0.06173677069199457, 0.07123473541383989, 0.07123473541383989]",0.083107,0.071235,0.080733,0.035617,0.118725,0.128223,13,0.482361,-1850.230769
1,ID_6L67PAA,2000,0,0,0,0,35,7,1,33.0,0,13,5,0,14740,-0.153846,-5.30769,"[1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155, 1849.5384615384614, 1849.6923076923076]","[0.27137042062415195, 0.07123473541383989, 0.07123473541383989, 0.07123473541383989, 0.07123473541383989, 0.027137042062415198]",0.0,0.0,0.0,0.0,0.0,0.0,13,0.583446,-1855.0


In [21]:
## As these two variable has only one class.
merged.drop(['PaymentMethod','SupplierName'],axis=1,inplace=True)

In [22]:
merged.head(5)

Unnamed: 0,ID,Deposit,UpsellDate,AccessoryRate,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,TotalContractValue,ExpectedTermDate,LastPaymentDate,TransactionDates,PaymentsHistory,m1,m2,m3,m4,m5,m6,time,PaidAmount,PeriodDiff
0,ID_K00S4N4,2000,0.0,0,0,35,7,1,41.0,1,5,5,14740,-0.153846,-0.846154,"[1849.076923076923, 1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155]","[0.20691994572591588, 0.07123473541383989, 0.06173677069199457, 0.07123473541383989, 0.07123473541383989]",0.083107,0.071235,0.080733,0.035617,0.118725,0.128223,13,0.482361,-1850.230769
1,ID_6L67PAA,2000,0.0,0,0,35,7,1,33.0,0,13,5,14740,-0.153846,-5.30769,"[1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155, 1849.5384615384614, 1849.6923076923076]","[0.27137042062415195, 0.07123473541383989, 0.07123473541383989, 0.07123473541383989, 0.07123473541383989, 0.027137042062415198]",0.0,0.0,0.0,0.0,0.0,0.0,13,0.583446,-1855.0
2,ID_102CV85,2000,-6.92857,35,0,35,7,0,48.0,2,22,0,29480,-9.78571,-9.78571,"[1716.4285714285713, 1716.5, 1716.5714285714287, 1716.642857142857, 1716.7142857142858, 1716.7857142857142, 1716.857142857143, 1716.9285714285713, 1717.0]","[0.14399592944369063, 0.03324287652645862, 0.024932157394843963, 0.024932157394843963, 0.049864314789687926, 0.024932157394843963, 0.03324287652645862, 0.031037991858887382, 0.024932157394843963]",0.033243,0.033243,0.041554,0.033243,0.031716,0.012042,14,0.391113,-1726.785714
3,ID_HXBJFHB,2000,0.0,0,0,35,7,0,43.0,5,43,6,14740,-0.153846,-5.76923,"[1848.7692307692307, 1848.8461538461538, 1848.923076923077, 1849.0, 1849.076923076923, 1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155, 1849.4615384615386, 1849.6153846153845]","[0.1523066485753053, 0.06648575305291723, 0.06648575305291723, 0.08310719131614654, 0.06648575305291723, 0.06648575305291723, 0.06648575305291723, 0.08310719131614654, 0.049864314789687926, 0.03324287652645862, 0.016960651289009497]",0.016961,0.067843,0.016961,0.033921,0.037992,0.078019,13,0.751018,-1855.384615
4,ID_3K9VZ5J,2000,0.0,0,0,35,7,0,56.0,1,14,5,14740,1.23077,-5.69231,"[1849.6923076923076, 1849.7692307692307, 1849.8461538461538, 1849.923076923077, 1850.0, 1850.076923076923, 1850.1538461538462, 1850.2307692307693, 1850.3076923076924, 1850.3846153846155, 1850.4615384615386, 1850.5384615384614]","[0.1865671641791045, 0.06784260515603799, 0.05088195386702849, 0.06784260515603799, 0.06478968792401628, 0.05970149253731343, 0.018995929443690638, 0.04511533242876527, 0.05223880597014925, 0.028493894165535955, 0.03561736770691994, 0.049864314789687926]",0.042741,0.054613,0.04749,0.058005,0.016621,0.052578,13,0.727951,-1856.230769


In [23]:
merged.to_csv("Final.csv",index=False)

##Advance:: Can use clustering/estimation to get age.
##Advance:: Care for Days on deposit(Some finance has to be read)
##Advance:: Care for deposit in paid amount.

In [24]:

from tsfresh import extract_features
df=pd.DataFrame(columns=["time","money","id"])
for k in tqdm(range(0,merged.shape[0])):
    df_temp=pd.DataFrame({"time":merged.loc[k,"TransactionDates"],"money":merged.loc[k,"PaymentsHistory"]})
    df_temp['id']=merged.loc[k,"ID"]
    df=pd.concat([df, df_temp], ignore_index=True)
print(df.shape)

100%|██████████| 37343/37343 [02:35<00:00, 240.25it/s]

(607851, 3)





In [25]:
df_final=df.copy()

In [26]:
df_final=extract_features(df_final,column_id='id',column_sort="time").dropna(axis=1)

Feature Extraction: 100%|██████████| 5/5 [36:16<00:00, 435.34s/it]


In [27]:
print(df_final.shape)


(37343, 268)


In [28]:
df_final.head(5)

Unnamed: 0,money__variance_larger_than_standard_deviation,money__has_duplicate_max,money__has_duplicate_min,money__has_duplicate,money__sum_values,money__abs_energy,money__mean_abs_change,money__mean_change,money__mean_second_derivative_central,money__median,money__mean,money__length,money__standard_deviation,money__variation_coefficient,money__variance,money__skewness,money__kurtosis,money__root_mean_square,money__absolute_sum_of_changes,money__longest_strike_below_mean,money__longest_strike_above_mean,money__count_above_mean,money__count_below_mean,money__last_location_of_maximum,money__first_location_of_maximum,money__last_location_of_minimum,money__first_location_of_minimum,money__percentage_of_reoccurring_values_to_all_values,money__percentage_of_reoccurring_datapoints_to_all_datapoints,money__sum_of_reoccurring_values,money__sum_of_reoccurring_data_points,money__ratio_value_number_to_time_series_length,money__maximum,money__minimum,money__time_reversal_asymmetry_statistic__lag_1,money__time_reversal_asymmetry_statistic__lag_2,money__time_reversal_asymmetry_statistic__lag_3,money__c3__lag_1,money__c3__lag_2,money__c3__lag_3,money__cid_ce__normalize_True,money__cid_ce__normalize_False,money__symmetry_looking__r_0.0,money__symmetry_looking__r_0.05,money__symmetry_looking__r_0.1,money__symmetry_looking__r_0.15000000000000002,money__symmetry_looking__r_0.2,money__symmetry_looking__r_0.25,money__symmetry_looking__r_0.30000000000000004,money__symmetry_looking__r_0.35000000000000003,money__symmetry_looking__r_0.4,money__symmetry_looking__r_0.45,money__symmetry_looking__r_0.5,money__symmetry_looking__r_0.55,money__symmetry_looking__r_0.6000000000000001,money__symmetry_looking__r_0.65,money__symmetry_looking__r_0.7000000000000001,money__symmetry_looking__r_0.75,money__symmetry_looking__r_0.8,money__symmetry_looking__r_0.8500000000000001,money__symmetry_looking__r_0.9,money__symmetry_looking__r_0.9500000000000001,money__large_standard_deviation__r_0.05,money__large_standard_deviation__r_0.1,money__large_standard_deviation__r_0.15000000000000002,money__large_standard_deviation__r_0.2,money__large_standard_deviation__r_0.25,money__large_standard_deviation__r_0.30000000000000004,money__large_standard_deviation__r_0.35000000000000003,money__large_standard_deviation__r_0.4,money__large_standard_deviation__r_0.45,money__large_standard_deviation__r_0.5,money__large_standard_deviation__r_0.55,money__large_standard_deviation__r_0.6000000000000001,money__large_standard_deviation__r_0.65,money__large_standard_deviation__r_0.7000000000000001,money__large_standard_deviation__r_0.75,money__large_standard_deviation__r_0.8,money__large_standard_deviation__r_0.8500000000000001,money__large_standard_deviation__r_0.9,money__large_standard_deviation__r_0.9500000000000001,money__quantile__q_0.1,money__quantile__q_0.2,money__quantile__q_0.3,money__quantile__q_0.4,money__quantile__q_0.6,money__quantile__q_0.7,money__quantile__q_0.8,money__quantile__q_0.9,money__autocorrelation__lag_0,money__autocorrelation__lag_1,money__autocorrelation__lag_2,money__autocorrelation__lag_3,money__autocorrelation__lag_4,"money__agg_autocorrelation__f_agg_""mean""__maxlag_40","money__agg_autocorrelation__f_agg_""median""__maxlag_40","money__agg_autocorrelation__f_agg_""var""__maxlag_40",money__partial_autocorrelation__lag_0,money__partial_autocorrelation__lag_1,money__number_cwt_peaks__n_1,money__number_cwt_peaks__n_5,money__number_peaks__n_1,money__number_peaks__n_3,money__number_peaks__n_5,money__number_peaks__n_10,money__number_peaks__n_50,money__binned_entropy__max_bins_10,money__index_mass_quantile__q_0.1,money__index_mass_quantile__q_0.2,money__index_mass_quantile__q_0.3,money__index_mass_quantile__q_0.4,money__index_mass_quantile__q_0.6,money__index_mass_quantile__q_0.7,money__index_mass_quantile__q_0.8,money__index_mass_quantile__q_0.9,"money__cwt_coefficients__coeff_0__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_20__widths_(2, 5, 10, 20)",money__spkt_welch_density__coeff_2,money__ar_coefficient__coeff_10__k_10,"money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.8","money__fft_coefficient__attr_""real""__coeff_0","money__fft_coefficient__attr_""real""__coeff_1","money__fft_coefficient__attr_""real""__coeff_2","money__fft_coefficient__attr_""imag""__coeff_0","money__fft_coefficient__attr_""imag""__coeff_1","money__fft_coefficient__attr_""imag""__coeff_2","money__fft_coefficient__attr_""abs""__coeff_0","money__fft_coefficient__attr_""abs""__coeff_1","money__fft_coefficient__attr_""abs""__coeff_2","money__fft_coefficient__attr_""angle""__coeff_0","money__fft_coefficient__attr_""angle""__coeff_1","money__fft_coefficient__attr_""angle""__coeff_2","money__fft_aggregated__aggtype_""centroid""","money__fft_aggregated__aggtype_""variance""",money__value_count__value_0,money__value_count__value_1,money__value_count__value_-1,money__range_count__max_1__min_-1,money__range_count__max_0__min_1000000000000.0,money__range_count__max_1000000000000.0__min_0,money__approximate_entropy__m_2__r_0.1,money__approximate_entropy__m_2__r_0.3,money__approximate_entropy__m_2__r_0.5,money__approximate_entropy__m_2__r_0.7,money__approximate_entropy__m_2__r_0.9,"money__linear_trend__attr_""pvalue""","money__linear_trend__attr_""rvalue""","money__linear_trend__attr_""intercept""","money__linear_trend__attr_""slope""","money__linear_trend__attr_""stderr""","money__augmented_dickey_fuller__attr_""teststat""__autolag_""AIC""","money__augmented_dickey_fuller__attr_""pvalue""__autolag_""AIC""","money__augmented_dickey_fuller__attr_""usedlag""__autolag_""AIC""",money__number_crossing_m__m_0,money__number_crossing_m__m_-1,money__number_crossing_m__m_1,money__energy_ratio_by_chunks__num_segments_10__segment_focus_0,money__energy_ratio_by_chunks__num_segments_10__segment_focus_1,money__energy_ratio_by_chunks__num_segments_10__segment_focus_2,money__energy_ratio_by_chunks__num_segments_10__segment_focus_3,money__energy_ratio_by_chunks__num_segments_10__segment_focus_4,money__energy_ratio_by_chunks__num_segments_10__segment_focus_5,money__energy_ratio_by_chunks__num_segments_10__segment_focus_6,money__energy_ratio_by_chunks__num_segments_10__segment_focus_7,money__energy_ratio_by_chunks__num_segments_10__segment_focus_8,money__energy_ratio_by_chunks__num_segments_10__segment_focus_9,money__ratio_beyond_r_sigma__r_0.5,money__ratio_beyond_r_sigma__r_1,money__ratio_beyond_r_sigma__r_1.5,money__ratio_beyond_r_sigma__r_2,money__ratio_beyond_r_sigma__r_2.5,money__ratio_beyond_r_sigma__r_3,money__ratio_beyond_r_sigma__r_5,money__ratio_beyond_r_sigma__r_6,money__ratio_beyond_r_sigma__r_7,money__ratio_beyond_r_sigma__r_10,money__count_above__t_0,money__count_below__t_0,money__lempel_ziv_complexity__bins_2,money__lempel_ziv_complexity__bins_3,money__lempel_ziv_complexity__bins_5,money__lempel_ziv_complexity__bins_10,money__lempel_ziv_complexity__bins_100,money__fourier_entropy__bins_2,money__fourier_entropy__bins_3,money__fourier_entropy__bins_5,money__fourier_entropy__bins_10,money__fourier_entropy__bins_100,money__permutation_entropy__dimension_3__tau_1,money__permutation_entropy__dimension_4__tau_1,money__permutation_entropy__dimension_5__tau_1
ID_000RHRU,0.0,0.0,0.0,1.0,0.696256,0.048213,0.016304,-0.007631,0.003537,0.02657,0.030272,23.0,0.034349,1.13467,0.00118,3.753485,16.341787,0.045785,0.358696,5.0,3.0,9.0,14.0,0.043478,0.0,0.826087,0.782609,0.3125,0.521739,0.115942,0.251208,0.695652,0.179952,0.002415,-5.6e-05,-5.7e-05,-2.5e-05,2.5e-05,1.8e-05,1.9e-05,4.602107,0.158077,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.007246,0.009179,0.012077,0.023671,0.029469,0.033816,0.036232,0.041546,1.0,0.126157,0.062879,-0.060761,-0.11994,-0.250838,-0.027451,0.393677,1.0,0.126157,4.0,3.0,5.0,2.0,1.0,0.0,0.0,1.122093,0.043478,0.043478,0.086957,0.26087,0.478261,0.608696,0.695652,0.782609,0.092434,0.076629,0.085747,0.079185,0.112238,0.080009,0.091412,0.084054,0.059618,0.074683,0.095626,0.08867,-0.010128,0.059697,0.097715,0.095247,-0.04119,0.042206,0.099434,0.099778,0.00053,0.000459,0.00161,1e-06,0.00161,1e-06,0.001932,3e-06,0.001932,3e-06,0.000738,7e-05,0.005166,4.4e-05,0.0,0.000124,0.00785,6.2e-05,-0.007631,0.001078,0.016304,0.00087,0.0,0.0,0.0,0.0,-0.000805,1e-06,0.000805,1e-06,-0.000906,0.000134,0.008152,6.9e-05,-0.009138,0.001435,0.018317,0.001183,0.0,0.0,0.0,0.0,-0.003744,2.5e-05,0.00471,1.7e-05,-0.014674,0.001946,0.021679,0.001692,-3.469447e-18,6e-06,0.002415,1.203706e-35,-0.035024,0.003943,0.038043,0.003723,-0.070048,0.005427,0.073671,0.004907,0.696256,0.074338,0.185278,0.0,-5.8e-05,-0.105271,0.696256,0.074338,0.213096,0.0,-0.044473,-29.604289,4.305501,14.025674,0.0,0.0,0.0,23.0,0.0,23.0,0.06343,0.656787,0.417397,0.272425,0.120298,0.042054,-0.427167,0.054604,-0.002212,0.001022,-11.155049,2.8798269999999996e-20,0.0,0.0,0.0,0.0,0.7226,0.033279,0.025904,0.030253,0.038361,0.058328,0.048405,0.037181,0.001573,0.004114,0.391304,0.043478,0.043478,0.043478,0.043478,0.043478,0.0,0.0,0.0,0.0,1.0,0.0,0.26087,0.304348,0.304348,0.434783,0.782609,0.450561,0.721464,1.118743,1.357978,2.253858,1.632783,2.579844,2.871476
ID_001AMM9,0.0,0.0,0.0,1.0,0.629831,0.050183,0.024532,-0.007171,0.006341,0.066425,0.069981,9.0,0.026049,0.372224,0.000679,1.367185,3.813512,0.074672,0.196256,4.0,1.0,3.0,6.0,0.111111,0.0,0.333333,0.222222,0.125,0.222222,0.066425,0.13285,0.888889,0.13285,0.030193,-7.8e-05,-2.3e-05,-0.000209,0.000239,0.000258,0.000363,3.776845,0.098382,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.048551,0.055676,0.06099,0.066425,0.068841,0.073068,0.076691,0.089372,1.0,-0.133391,-0.540478,0.254512,-0.011685,-0.058555,-0.114044,0.089836,1.0,-0.133391,1.0,2.0,2.0,0.0,0.0,0.0,0.0,1.522955,0.111111,0.111111,0.333333,0.444444,0.666667,0.777778,0.888889,1.0,0.066969,0.10302,0.091445,0.068639,0.067957,0.123323,0.106936,0.079726,0.040384,0.138632,0.123735,0.092788,0.020477,0.147633,0.138551,0.105048,0.014257,0.15124,0.153479,0.118602,0.000221,0.0,-0.022947,0.0,0.022947,0.0,-0.016002,4.8e-05,0.016002,4.8e-05,-0.016002,4.8e-05,0.016002,4.8e-05,-0.002778,0.000161,0.011232,4.3e-05,-0.007171,0.001158,0.024532,0.000608,-0.009058,0.0,0.009058,0.0,-0.009058,0.0,0.009058,0.0,0.002264,7.5e-05,0.008303,1.1e-05,-0.000604,9.3e-05,0.009058,1.1e-05,0.0,0.0,0.0,0.0,0.003019,3.6e-05,0.006039,9e-06,-0.002013,7.5e-05,0.008052,1.4e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.629831,0.057859,0.085251,0.0,0.039101,0.048062,0.629831,0.069832,0.097866,0.0,34.050703,29.413265,0.781291,1.532661,0.0,0.0,0.0,9.0,0.0,9.0,0.133531,0.133531,0.149843,0.106608,0.080199,0.572252,-0.218475,0.078798,-0.002204,0.003721,-0.026049,0.9563241,2.0,0.0,0.0,0.0,0.351696,0.056271,0.018166,0.122803,0.087924,0.06558,0.096099,0.087924,0.113538,0.0,0.333333,0.222222,0.222222,0.111111,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.444444,0.555556,0.666667,0.777778,0.888889,0.500402,1.05492,0.950271,0.950271,1.609438,1.078992,1.329661,1.332179
ID_001QJLW,0.0,0.0,0.0,1.0,0.420139,0.068105,0.036806,-0.025386,0.012522,0.013889,0.042014,10.0,0.07103,1.690635,0.005045,2.874354,8.538625,0.082525,0.33125,8.0,2.0,2.0,8.0,0.1,0.0,0.5,0.4,0.111111,0.2,0.010417,0.020833,0.9,0.249306,0.003819,-0.000489,-8.2e-05,-0.000273,1.6e-05,9e-06,1.3e-05,2.803509,0.199134,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.006632,0.007222,0.009479,0.010417,0.01875,0.023958,0.0375,0.081181,1.0,0.196366,-0.070772,-0.070405,-0.15515,-0.270194,-0.15515,0.111495,1.0,0.196366,2.0,2.0,2.0,1.0,0.0,0.0,0.0,0.940448,0.1,0.1,0.1,0.1,0.2,0.2,0.4,0.7,0.144986,0.121005,0.091106,0.06554,0.165185,0.128064,0.098409,0.071356,0.081492,0.122849,0.099754,0.073117,-0.022249,0.105817,0.09856,0.074406,-0.064472,0.080273,0.094321,0.074656,0.000217,0.0,0.0,0.0,0.0,0.0,-0.001562,2e-06,0.001562,2e-06,-0.001562,7.3e-05,0.006771,3e-05,0.001984,0.000235,0.012698,7.8e-05,-0.025386,0.003762,0.036806,0.003051,-0.001562,2e-06,0.001562,2e-06,-0.001562,2e-06,0.001562,2e-06,-0.002604,0.00015,0.009375,6.9e-05,-0.039444,0.005549,0.044861,0.005092,0.0,0.0,0.0,0.0,-0.010417,0.000109,0.010417,0.000109,-0.069213,0.006986,0.069213,0.006986,0.0,0.0,0.0,0.0,-0.186806,0.0,0.186806,0.0,-0.186806,0.0,0.186806,0.0,0.420139,0.269772,0.276716,0.0,-0.026888,-0.041616,0.420139,0.271108,0.279828,0.0,-5.691763,-8.552699,1.960605,2.769557,0.0,0.0,0.0,10.0,0.0,10.0,0.306183,0.179246,0.037824,0.027761,0.027938,0.070915,-0.592777,0.10798,-0.014659,0.007041,-4.118909,0.0009011214,3.0,0.0,0.0,0.0,0.912616,0.057357,0.000708,0.004426,0.000214,0.014339,0.001593,0.001593,0.000781,0.006373,0.2,0.1,0.1,0.1,0.1,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.4,0.5,0.5,0.6,0.9,0.450561,0.867563,0.867563,0.867563,1.56071,1.559581,1.549826,1.56071
ID_003DANQ,0.0,0.0,0.0,1.0,0.682367,0.053404,0.025664,-0.009561,0.002196,0.050725,0.05249,13.0,0.036781,0.700724,0.001353,1.365214,2.899115,0.064094,0.307971,5.0,5.0,6.0,7.0,0.076923,0.0,0.538462,0.461538,0.083333,0.153846,0.054348,0.108696,0.923077,0.150966,0.002415,-0.000199,-0.000187,-0.000284,0.00015,9.8e-05,4.4e-05,2.881145,0.105971,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.015459,0.022222,0.032367,0.045894,0.054348,0.059179,0.06715,0.08599,1.0,0.430635,0.138502,0.207732,0.066432,-0.25506,-0.318998,0.184423,1.0,0.430635,4.0,2.0,3.0,0.0,0.0,0.0,0.0,1.818483,0.076923,0.076923,0.153846,0.230769,0.384615,0.692308,0.846154,0.923077,0.092091,0.128394,0.115315,0.087047,0.114313,0.145564,0.12181,0.090324,0.085033,0.145674,0.130664,0.099171,0.040241,0.13719,0.133131,0.102428,-0.00284,0.114971,0.137767,0.111008,0.00244,0.088637,0.012077,0.0,0.012077,0.0,-0.006039,0.000328,0.018116,3.6e-05,0.00138,0.000632,0.022429,0.000131,0.002717,0.000565,0.021135,0.000126,-0.009561,0.000844,0.025664,0.000277,0.0,0.0,0.0,0.0,-0.009058,9e-06,0.009058,9e-06,-0.002013,0.000105,0.010064,8e-06,-0.020359,0.000582,0.024155,0.000413,-0.006039,0.0,0.006039,0.0,0.003019,8.2e-05,0.009058,9e-06,-0.017874,0.000709,0.023188,0.000491,0.01207729,0.0,0.012077,0.0,-0.020833,0.000843,0.027476,0.000522,-0.060386,0.0,0.060386,0.0,0.682367,0.231018,0.028538,0.0,-0.068478,-0.05082,0.682367,0.240953,0.058284,0.0,-16.510765,-60.683934,1.574334,3.802899,0.0,0.0,0.0,13.0,0.0,13.0,0.087011,0.028513,0.510242,0.797331,0.691429,0.027631,-0.607551,0.088324,-0.005972,0.002354,-3.79903,0.002917257,0.0,0.0,0.0,0.0,0.580395,0.137929,0.098872,0.000109,0.003933,0.04818,0.006992,0.055308,0.0437,0.024581,0.461538,0.307692,0.076923,0.076923,0.076923,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.384615,0.461538,0.615385,0.769231,0.923077,0.59827,0.9557,1.277034,1.747868,1.94591,1.720193,2.163956,2.197225
ID_0047BAA,0.0,0.0,0.0,0.0,0.548958,0.063388,0.038472,-0.0275,0.01263,0.076389,0.091493,6.0,0.046838,0.511925,0.002194,2.129676,4.78841,0.102785,0.192361,5.0,1.0,1.0,5.0,0.166667,0.0,1.0,0.833333,0.0,0.0,0.0,0.0,1.0,0.193056,0.055556,-0.000455,-0.00105,0.0,0.000516,0.000726,0.0,2.943249,0.137855,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.057813,0.060069,0.064757,0.069444,0.083333,0.085417,0.0875,0.140278,1.0,-0.195338,-0.18252,0.013542,0.164955,-0.372625,-0.18252,0.434547,1.0,-0.195338,2.0,3.0,1.0,0.0,0.0,0.0,0.0,1.329661,0.166667,0.166667,0.166667,0.333333,0.666667,0.666667,0.833333,1.0,0.108782,0.111862,0.085983,0.062112,0.141962,0.141543,0.108343,0.078185,0.114333,0.165213,0.130467,0.094821,0.075761,0.171995,0.142825,0.105073,0.11103,0.122874,0.094788,0.068517,0.000233,0.0,0.0,0.0,0.0,0.0,0.009375,0.0,0.009375,0.0,0.011632,5e-06,0.011632,5e-06,-0.001128,0.000328,0.014844,0.000109,-0.0275,0.003045,0.038472,0.002321,0.009375,0.0,0.009375,0.0,0.011632,5e-06,0.011632,5e-06,0.009144,1.6e-05,0.009144,1.6e-05,-0.026389,0.003799,0.040104,0.002888,0.013889,0.0,0.013889,0.0,0.009028,2.4e-05,0.009028,2.4e-05,0.009028,2.4e-05,0.009028,2.4e-05,0.004166667,0.0,0.004167,0.0,0.004167,0.0,0.004167,0.0,0.0,0.0,0.0,0.0,0.548958,0.089063,0.140104,0.0,0.011727,-0.019546,0.548958,0.089831,0.141461,0.0,7.501345,-7.941985,0.886809,1.377284,0.0,0.0,0.0,6.0,0.0,6.0,0.223144,0.072736,0.08945,0.061933,0.061933,0.192843,-0.616032,0.13373,-0.016895,0.010802,-1.574565,0.4963565,1.0,0.0,0.0,0.0,0.587969,0.056924,0.076079,0.109554,0.120783,0.048691,0.0,0.0,0.0,0.0,0.5,0.166667,0.166667,0.166667,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.5,0.666667,0.666667,0.833333,1.0,0.562335,0.562335,1.039721,1.386294,1.386294,1.039721,1.098612,0.693147


In [29]:
df.sort_values(by='id',inplace=True)

In [30]:
df.head(5)

Unnamed: 0,time,money,id
68925,1856.153846,0.028986,ID_000RHRU
68927,1856.307692,0.042271,ID_000RHRU
68926,1856.230769,0.038647,ID_000RHRU
68930,1856.846154,0.007246,ID_000RHRU
68924,1856.076923,0.045894,ID_000RHRU


In [31]:
ids=df['id']

In [32]:
ids.drop_duplicates(inplace=True)

In [33]:
ids.shape

(37343,)

In [34]:
df_final['ID']=ids.values

In [35]:
df_final.head(5)

Unnamed: 0,money__variance_larger_than_standard_deviation,money__has_duplicate_max,money__has_duplicate_min,money__has_duplicate,money__sum_values,money__abs_energy,money__mean_abs_change,money__mean_change,money__mean_second_derivative_central,money__median,money__mean,money__length,money__standard_deviation,money__variation_coefficient,money__variance,money__skewness,money__kurtosis,money__root_mean_square,money__absolute_sum_of_changes,money__longest_strike_below_mean,money__longest_strike_above_mean,money__count_above_mean,money__count_below_mean,money__last_location_of_maximum,money__first_location_of_maximum,money__last_location_of_minimum,money__first_location_of_minimum,money__percentage_of_reoccurring_values_to_all_values,money__percentage_of_reoccurring_datapoints_to_all_datapoints,money__sum_of_reoccurring_values,money__sum_of_reoccurring_data_points,money__ratio_value_number_to_time_series_length,money__maximum,money__minimum,money__time_reversal_asymmetry_statistic__lag_1,money__time_reversal_asymmetry_statistic__lag_2,money__time_reversal_asymmetry_statistic__lag_3,money__c3__lag_1,money__c3__lag_2,money__c3__lag_3,money__cid_ce__normalize_True,money__cid_ce__normalize_False,money__symmetry_looking__r_0.0,money__symmetry_looking__r_0.05,money__symmetry_looking__r_0.1,money__symmetry_looking__r_0.15000000000000002,money__symmetry_looking__r_0.2,money__symmetry_looking__r_0.25,money__symmetry_looking__r_0.30000000000000004,money__symmetry_looking__r_0.35000000000000003,money__symmetry_looking__r_0.4,money__symmetry_looking__r_0.45,money__symmetry_looking__r_0.5,money__symmetry_looking__r_0.55,money__symmetry_looking__r_0.6000000000000001,money__symmetry_looking__r_0.65,money__symmetry_looking__r_0.7000000000000001,money__symmetry_looking__r_0.75,money__symmetry_looking__r_0.8,money__symmetry_looking__r_0.8500000000000001,money__symmetry_looking__r_0.9,money__symmetry_looking__r_0.9500000000000001,money__large_standard_deviation__r_0.05,money__large_standard_deviation__r_0.1,money__large_standard_deviation__r_0.15000000000000002,money__large_standard_deviation__r_0.2,money__large_standard_deviation__r_0.25,money__large_standard_deviation__r_0.30000000000000004,money__large_standard_deviation__r_0.35000000000000003,money__large_standard_deviation__r_0.4,money__large_standard_deviation__r_0.45,money__large_standard_deviation__r_0.5,money__large_standard_deviation__r_0.55,money__large_standard_deviation__r_0.6000000000000001,money__large_standard_deviation__r_0.65,money__large_standard_deviation__r_0.7000000000000001,money__large_standard_deviation__r_0.75,money__large_standard_deviation__r_0.8,money__large_standard_deviation__r_0.8500000000000001,money__large_standard_deviation__r_0.9,money__large_standard_deviation__r_0.9500000000000001,money__quantile__q_0.1,money__quantile__q_0.2,money__quantile__q_0.3,money__quantile__q_0.4,money__quantile__q_0.6,money__quantile__q_0.7,money__quantile__q_0.8,money__quantile__q_0.9,money__autocorrelation__lag_0,money__autocorrelation__lag_1,money__autocorrelation__lag_2,money__autocorrelation__lag_3,money__autocorrelation__lag_4,"money__agg_autocorrelation__f_agg_""mean""__maxlag_40","money__agg_autocorrelation__f_agg_""median""__maxlag_40","money__agg_autocorrelation__f_agg_""var""__maxlag_40",money__partial_autocorrelation__lag_0,money__partial_autocorrelation__lag_1,money__number_cwt_peaks__n_1,money__number_cwt_peaks__n_5,money__number_peaks__n_1,money__number_peaks__n_3,money__number_peaks__n_5,money__number_peaks__n_10,money__number_peaks__n_50,money__binned_entropy__max_bins_10,money__index_mass_quantile__q_0.1,money__index_mass_quantile__q_0.2,money__index_mass_quantile__q_0.3,money__index_mass_quantile__q_0.4,money__index_mass_quantile__q_0.6,money__index_mass_quantile__q_0.7,money__index_mass_quantile__q_0.8,money__index_mass_quantile__q_0.9,"money__cwt_coefficients__coeff_0__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_20__widths_(2, 5, 10, 20)",money__spkt_welch_density__coeff_2,money__ar_coefficient__coeff_10__k_10,"money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.8","money__fft_coefficient__attr_""real""__coeff_0","money__fft_coefficient__attr_""real""__coeff_1","money__fft_coefficient__attr_""real""__coeff_2","money__fft_coefficient__attr_""imag""__coeff_0","money__fft_coefficient__attr_""imag""__coeff_1","money__fft_coefficient__attr_""imag""__coeff_2","money__fft_coefficient__attr_""abs""__coeff_0","money__fft_coefficient__attr_""abs""__coeff_1","money__fft_coefficient__attr_""abs""__coeff_2","money__fft_coefficient__attr_""angle""__coeff_0","money__fft_coefficient__attr_""angle""__coeff_1","money__fft_coefficient__attr_""angle""__coeff_2","money__fft_aggregated__aggtype_""centroid""","money__fft_aggregated__aggtype_""variance""",money__value_count__value_0,money__value_count__value_1,money__value_count__value_-1,money__range_count__max_1__min_-1,money__range_count__max_0__min_1000000000000.0,money__range_count__max_1000000000000.0__min_0,money__approximate_entropy__m_2__r_0.1,money__approximate_entropy__m_2__r_0.3,money__approximate_entropy__m_2__r_0.5,money__approximate_entropy__m_2__r_0.7,money__approximate_entropy__m_2__r_0.9,"money__linear_trend__attr_""pvalue""","money__linear_trend__attr_""rvalue""","money__linear_trend__attr_""intercept""","money__linear_trend__attr_""slope""","money__linear_trend__attr_""stderr""","money__augmented_dickey_fuller__attr_""teststat""__autolag_""AIC""","money__augmented_dickey_fuller__attr_""pvalue""__autolag_""AIC""","money__augmented_dickey_fuller__attr_""usedlag""__autolag_""AIC""",money__number_crossing_m__m_0,money__number_crossing_m__m_-1,money__number_crossing_m__m_1,money__energy_ratio_by_chunks__num_segments_10__segment_focus_0,money__energy_ratio_by_chunks__num_segments_10__segment_focus_1,money__energy_ratio_by_chunks__num_segments_10__segment_focus_2,money__energy_ratio_by_chunks__num_segments_10__segment_focus_3,money__energy_ratio_by_chunks__num_segments_10__segment_focus_4,money__energy_ratio_by_chunks__num_segments_10__segment_focus_5,money__energy_ratio_by_chunks__num_segments_10__segment_focus_6,money__energy_ratio_by_chunks__num_segments_10__segment_focus_7,money__energy_ratio_by_chunks__num_segments_10__segment_focus_8,money__energy_ratio_by_chunks__num_segments_10__segment_focus_9,money__ratio_beyond_r_sigma__r_0.5,money__ratio_beyond_r_sigma__r_1,money__ratio_beyond_r_sigma__r_1.5,money__ratio_beyond_r_sigma__r_2,money__ratio_beyond_r_sigma__r_2.5,money__ratio_beyond_r_sigma__r_3,money__ratio_beyond_r_sigma__r_5,money__ratio_beyond_r_sigma__r_6,money__ratio_beyond_r_sigma__r_7,money__ratio_beyond_r_sigma__r_10,money__count_above__t_0,money__count_below__t_0,money__lempel_ziv_complexity__bins_2,money__lempel_ziv_complexity__bins_3,money__lempel_ziv_complexity__bins_5,money__lempel_ziv_complexity__bins_10,money__lempel_ziv_complexity__bins_100,money__fourier_entropy__bins_2,money__fourier_entropy__bins_3,money__fourier_entropy__bins_5,money__fourier_entropy__bins_10,money__fourier_entropy__bins_100,money__permutation_entropy__dimension_3__tau_1,money__permutation_entropy__dimension_4__tau_1,money__permutation_entropy__dimension_5__tau_1,ID
ID_000RHRU,0.0,0.0,0.0,1.0,0.696256,0.048213,0.016304,-0.007631,0.003537,0.02657,0.030272,23.0,0.034349,1.13467,0.00118,3.753485,16.341787,0.045785,0.358696,5.0,3.0,9.0,14.0,0.043478,0.0,0.826087,0.782609,0.3125,0.521739,0.115942,0.251208,0.695652,0.179952,0.002415,-5.6e-05,-5.7e-05,-2.5e-05,2.5e-05,1.8e-05,1.9e-05,4.602107,0.158077,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.007246,0.009179,0.012077,0.023671,0.029469,0.033816,0.036232,0.041546,1.0,0.126157,0.062879,-0.060761,-0.11994,-0.250838,-0.027451,0.393677,1.0,0.126157,4.0,3.0,5.0,2.0,1.0,0.0,0.0,1.122093,0.043478,0.043478,0.086957,0.26087,0.478261,0.608696,0.695652,0.782609,0.092434,0.076629,0.085747,0.079185,0.112238,0.080009,0.091412,0.084054,0.059618,0.074683,0.095626,0.08867,-0.010128,0.059697,0.097715,0.095247,-0.04119,0.042206,0.099434,0.099778,0.00053,0.000459,0.00161,1e-06,0.00161,1e-06,0.001932,3e-06,0.001932,3e-06,0.000738,7e-05,0.005166,4.4e-05,0.0,0.000124,0.00785,6.2e-05,-0.007631,0.001078,0.016304,0.00087,0.0,0.0,0.0,0.0,-0.000805,1e-06,0.000805,1e-06,-0.000906,0.000134,0.008152,6.9e-05,-0.009138,0.001435,0.018317,0.001183,0.0,0.0,0.0,0.0,-0.003744,2.5e-05,0.00471,1.7e-05,-0.014674,0.001946,0.021679,0.001692,-3.469447e-18,6e-06,0.002415,1.203706e-35,-0.035024,0.003943,0.038043,0.003723,-0.070048,0.005427,0.073671,0.004907,0.696256,0.074338,0.185278,0.0,-5.8e-05,-0.105271,0.696256,0.074338,0.213096,0.0,-0.044473,-29.604289,4.305501,14.025674,0.0,0.0,0.0,23.0,0.0,23.0,0.06343,0.656787,0.417397,0.272425,0.120298,0.042054,-0.427167,0.054604,-0.002212,0.001022,-11.155049,2.8798269999999996e-20,0.0,0.0,0.0,0.0,0.7226,0.033279,0.025904,0.030253,0.038361,0.058328,0.048405,0.037181,0.001573,0.004114,0.391304,0.043478,0.043478,0.043478,0.043478,0.043478,0.0,0.0,0.0,0.0,1.0,0.0,0.26087,0.304348,0.304348,0.434783,0.782609,0.450561,0.721464,1.118743,1.357978,2.253858,1.632783,2.579844,2.871476,ID_000RHRU
ID_001AMM9,0.0,0.0,0.0,1.0,0.629831,0.050183,0.024532,-0.007171,0.006341,0.066425,0.069981,9.0,0.026049,0.372224,0.000679,1.367185,3.813512,0.074672,0.196256,4.0,1.0,3.0,6.0,0.111111,0.0,0.333333,0.222222,0.125,0.222222,0.066425,0.13285,0.888889,0.13285,0.030193,-7.8e-05,-2.3e-05,-0.000209,0.000239,0.000258,0.000363,3.776845,0.098382,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.048551,0.055676,0.06099,0.066425,0.068841,0.073068,0.076691,0.089372,1.0,-0.133391,-0.540478,0.254512,-0.011685,-0.058555,-0.114044,0.089836,1.0,-0.133391,1.0,2.0,2.0,0.0,0.0,0.0,0.0,1.522955,0.111111,0.111111,0.333333,0.444444,0.666667,0.777778,0.888889,1.0,0.066969,0.10302,0.091445,0.068639,0.067957,0.123323,0.106936,0.079726,0.040384,0.138632,0.123735,0.092788,0.020477,0.147633,0.138551,0.105048,0.014257,0.15124,0.153479,0.118602,0.000221,0.0,-0.022947,0.0,0.022947,0.0,-0.016002,4.8e-05,0.016002,4.8e-05,-0.016002,4.8e-05,0.016002,4.8e-05,-0.002778,0.000161,0.011232,4.3e-05,-0.007171,0.001158,0.024532,0.000608,-0.009058,0.0,0.009058,0.0,-0.009058,0.0,0.009058,0.0,0.002264,7.5e-05,0.008303,1.1e-05,-0.000604,9.3e-05,0.009058,1.1e-05,0.0,0.0,0.0,0.0,0.003019,3.6e-05,0.006039,9e-06,-0.002013,7.5e-05,0.008052,1.4e-05,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.629831,0.057859,0.085251,0.0,0.039101,0.048062,0.629831,0.069832,0.097866,0.0,34.050703,29.413265,0.781291,1.532661,0.0,0.0,0.0,9.0,0.0,9.0,0.133531,0.133531,0.149843,0.106608,0.080199,0.572252,-0.218475,0.078798,-0.002204,0.003721,-0.026049,0.9563241,2.0,0.0,0.0,0.0,0.351696,0.056271,0.018166,0.122803,0.087924,0.06558,0.096099,0.087924,0.113538,0.0,0.333333,0.222222,0.222222,0.111111,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.444444,0.555556,0.666667,0.777778,0.888889,0.500402,1.05492,0.950271,0.950271,1.609438,1.078992,1.329661,1.332179,ID_001AMM9
ID_001QJLW,0.0,0.0,0.0,1.0,0.420139,0.068105,0.036806,-0.025386,0.012522,0.013889,0.042014,10.0,0.07103,1.690635,0.005045,2.874354,8.538625,0.082525,0.33125,8.0,2.0,2.0,8.0,0.1,0.0,0.5,0.4,0.111111,0.2,0.010417,0.020833,0.9,0.249306,0.003819,-0.000489,-8.2e-05,-0.000273,1.6e-05,9e-06,1.3e-05,2.803509,0.199134,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.006632,0.007222,0.009479,0.010417,0.01875,0.023958,0.0375,0.081181,1.0,0.196366,-0.070772,-0.070405,-0.15515,-0.270194,-0.15515,0.111495,1.0,0.196366,2.0,2.0,2.0,1.0,0.0,0.0,0.0,0.940448,0.1,0.1,0.1,0.1,0.2,0.2,0.4,0.7,0.144986,0.121005,0.091106,0.06554,0.165185,0.128064,0.098409,0.071356,0.081492,0.122849,0.099754,0.073117,-0.022249,0.105817,0.09856,0.074406,-0.064472,0.080273,0.094321,0.074656,0.000217,0.0,0.0,0.0,0.0,0.0,-0.001562,2e-06,0.001562,2e-06,-0.001562,7.3e-05,0.006771,3e-05,0.001984,0.000235,0.012698,7.8e-05,-0.025386,0.003762,0.036806,0.003051,-0.001562,2e-06,0.001562,2e-06,-0.001562,2e-06,0.001562,2e-06,-0.002604,0.00015,0.009375,6.9e-05,-0.039444,0.005549,0.044861,0.005092,0.0,0.0,0.0,0.0,-0.010417,0.000109,0.010417,0.000109,-0.069213,0.006986,0.069213,0.006986,0.0,0.0,0.0,0.0,-0.186806,0.0,0.186806,0.0,-0.186806,0.0,0.186806,0.0,0.420139,0.269772,0.276716,0.0,-0.026888,-0.041616,0.420139,0.271108,0.279828,0.0,-5.691763,-8.552699,1.960605,2.769557,0.0,0.0,0.0,10.0,0.0,10.0,0.306183,0.179246,0.037824,0.027761,0.027938,0.070915,-0.592777,0.10798,-0.014659,0.007041,-4.118909,0.0009011214,3.0,0.0,0.0,0.0,0.912616,0.057357,0.000708,0.004426,0.000214,0.014339,0.001593,0.001593,0.000781,0.006373,0.2,0.1,0.1,0.1,0.1,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.4,0.5,0.5,0.6,0.9,0.450561,0.867563,0.867563,0.867563,1.56071,1.559581,1.549826,1.56071,ID_001QJLW
ID_003DANQ,0.0,0.0,0.0,1.0,0.682367,0.053404,0.025664,-0.009561,0.002196,0.050725,0.05249,13.0,0.036781,0.700724,0.001353,1.365214,2.899115,0.064094,0.307971,5.0,5.0,6.0,7.0,0.076923,0.0,0.538462,0.461538,0.083333,0.153846,0.054348,0.108696,0.923077,0.150966,0.002415,-0.000199,-0.000187,-0.000284,0.00015,9.8e-05,4.4e-05,2.881145,0.105971,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.015459,0.022222,0.032367,0.045894,0.054348,0.059179,0.06715,0.08599,1.0,0.430635,0.138502,0.207732,0.066432,-0.25506,-0.318998,0.184423,1.0,0.430635,4.0,2.0,3.0,0.0,0.0,0.0,0.0,1.818483,0.076923,0.076923,0.153846,0.230769,0.384615,0.692308,0.846154,0.923077,0.092091,0.128394,0.115315,0.087047,0.114313,0.145564,0.12181,0.090324,0.085033,0.145674,0.130664,0.099171,0.040241,0.13719,0.133131,0.102428,-0.00284,0.114971,0.137767,0.111008,0.00244,0.088637,0.012077,0.0,0.012077,0.0,-0.006039,0.000328,0.018116,3.6e-05,0.00138,0.000632,0.022429,0.000131,0.002717,0.000565,0.021135,0.000126,-0.009561,0.000844,0.025664,0.000277,0.0,0.0,0.0,0.0,-0.009058,9e-06,0.009058,9e-06,-0.002013,0.000105,0.010064,8e-06,-0.020359,0.000582,0.024155,0.000413,-0.006039,0.0,0.006039,0.0,0.003019,8.2e-05,0.009058,9e-06,-0.017874,0.000709,0.023188,0.000491,0.01207729,0.0,0.012077,0.0,-0.020833,0.000843,0.027476,0.000522,-0.060386,0.0,0.060386,0.0,0.682367,0.231018,0.028538,0.0,-0.068478,-0.05082,0.682367,0.240953,0.058284,0.0,-16.510765,-60.683934,1.574334,3.802899,0.0,0.0,0.0,13.0,0.0,13.0,0.087011,0.028513,0.510242,0.797331,0.691429,0.027631,-0.607551,0.088324,-0.005972,0.002354,-3.79903,0.002917257,0.0,0.0,0.0,0.0,0.580395,0.137929,0.098872,0.000109,0.003933,0.04818,0.006992,0.055308,0.0437,0.024581,0.461538,0.307692,0.076923,0.076923,0.076923,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.384615,0.461538,0.615385,0.769231,0.923077,0.59827,0.9557,1.277034,1.747868,1.94591,1.720193,2.163956,2.197225,ID_003DANQ
ID_0047BAA,0.0,0.0,0.0,0.0,0.548958,0.063388,0.038472,-0.0275,0.01263,0.076389,0.091493,6.0,0.046838,0.511925,0.002194,2.129676,4.78841,0.102785,0.192361,5.0,1.0,1.0,5.0,0.166667,0.0,1.0,0.833333,0.0,0.0,0.0,0.0,1.0,0.193056,0.055556,-0.000455,-0.00105,0.0,0.000516,0.000726,0.0,2.943249,0.137855,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.057813,0.060069,0.064757,0.069444,0.083333,0.085417,0.0875,0.140278,1.0,-0.195338,-0.18252,0.013542,0.164955,-0.372625,-0.18252,0.434547,1.0,-0.195338,2.0,3.0,1.0,0.0,0.0,0.0,0.0,1.329661,0.166667,0.166667,0.166667,0.333333,0.666667,0.666667,0.833333,1.0,0.108782,0.111862,0.085983,0.062112,0.141962,0.141543,0.108343,0.078185,0.114333,0.165213,0.130467,0.094821,0.075761,0.171995,0.142825,0.105073,0.11103,0.122874,0.094788,0.068517,0.000233,0.0,0.0,0.0,0.0,0.0,0.009375,0.0,0.009375,0.0,0.011632,5e-06,0.011632,5e-06,-0.001128,0.000328,0.014844,0.000109,-0.0275,0.003045,0.038472,0.002321,0.009375,0.0,0.009375,0.0,0.011632,5e-06,0.011632,5e-06,0.009144,1.6e-05,0.009144,1.6e-05,-0.026389,0.003799,0.040104,0.002888,0.013889,0.0,0.013889,0.0,0.009028,2.4e-05,0.009028,2.4e-05,0.009028,2.4e-05,0.009028,2.4e-05,0.004166667,0.0,0.004167,0.0,0.004167,0.0,0.004167,0.0,0.0,0.0,0.0,0.0,0.548958,0.089063,0.140104,0.0,0.011727,-0.019546,0.548958,0.089831,0.141461,0.0,7.501345,-7.941985,0.886809,1.377284,0.0,0.0,0.0,6.0,0.0,6.0,0.223144,0.072736,0.08945,0.061933,0.061933,0.192843,-0.616032,0.13373,-0.016895,0.010802,-1.574565,0.4963565,1.0,0.0,0.0,0.0,0.587969,0.056924,0.076079,0.109554,0.120783,0.048691,0.0,0.0,0.0,0.0,0.5,0.166667,0.166667,0.166667,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.5,0.666667,0.666667,0.833333,1.0,0.562335,0.562335,1.039721,1.386294,1.386294,1.039721,1.098612,0.693147,ID_0047BAA


In [36]:
merged1= pd.merge(left=merged, right=df_final.fillna(value=0),on='ID')

In [37]:
merged1.shape

(37343, 294)

In [38]:
merged1.head()

Unnamed: 0,ID,Deposit,UpsellDate,AccessoryRate,rateTypeEntity,RatePerUnit,DaysOnDeposit,MainApplicantGender,Age,Region,Town,Occupation,TotalContractValue,ExpectedTermDate,LastPaymentDate,TransactionDates,PaymentsHistory,m1,m2,m3,m4,m5,m6,time,PaidAmount,PeriodDiff,money__variance_larger_than_standard_deviation,money__has_duplicate_max,money__has_duplicate_min,money__has_duplicate,money__sum_values,money__abs_energy,money__mean_abs_change,money__mean_change,money__mean_second_derivative_central,money__median,money__mean,money__length,money__standard_deviation,money__variation_coefficient,money__variance,money__skewness,money__kurtosis,money__root_mean_square,money__absolute_sum_of_changes,money__longest_strike_below_mean,money__longest_strike_above_mean,money__count_above_mean,money__count_below_mean,money__last_location_of_maximum,money__first_location_of_maximum,money__last_location_of_minimum,money__first_location_of_minimum,money__percentage_of_reoccurring_values_to_all_values,money__percentage_of_reoccurring_datapoints_to_all_datapoints,money__sum_of_reoccurring_values,money__sum_of_reoccurring_data_points,money__ratio_value_number_to_time_series_length,money__maximum,money__minimum,money__time_reversal_asymmetry_statistic__lag_1,money__time_reversal_asymmetry_statistic__lag_2,money__time_reversal_asymmetry_statistic__lag_3,money__c3__lag_1,money__c3__lag_2,money__c3__lag_3,money__cid_ce__normalize_True,money__cid_ce__normalize_False,money__symmetry_looking__r_0.0,money__symmetry_looking__r_0.05,money__symmetry_looking__r_0.1,money__symmetry_looking__r_0.15000000000000002,money__symmetry_looking__r_0.2,money__symmetry_looking__r_0.25,money__symmetry_looking__r_0.30000000000000004,money__symmetry_looking__r_0.35000000000000003,money__symmetry_looking__r_0.4,money__symmetry_looking__r_0.45,money__symmetry_looking__r_0.5,money__symmetry_looking__r_0.55,money__symmetry_looking__r_0.6000000000000001,money__symmetry_looking__r_0.65,money__symmetry_looking__r_0.7000000000000001,money__symmetry_looking__r_0.75,money__symmetry_looking__r_0.8,money__symmetry_looking__r_0.8500000000000001,money__symmetry_looking__r_0.9,money__symmetry_looking__r_0.9500000000000001,money__large_standard_deviation__r_0.05,money__large_standard_deviation__r_0.1,money__large_standard_deviation__r_0.15000000000000002,money__large_standard_deviation__r_0.2,money__large_standard_deviation__r_0.25,money__large_standard_deviation__r_0.30000000000000004,money__large_standard_deviation__r_0.35000000000000003,money__large_standard_deviation__r_0.4,money__large_standard_deviation__r_0.45,money__large_standard_deviation__r_0.5,money__large_standard_deviation__r_0.55,money__large_standard_deviation__r_0.6000000000000001,money__large_standard_deviation__r_0.65,money__large_standard_deviation__r_0.7000000000000001,money__large_standard_deviation__r_0.75,money__large_standard_deviation__r_0.8,money__large_standard_deviation__r_0.8500000000000001,money__large_standard_deviation__r_0.9,money__large_standard_deviation__r_0.9500000000000001,money__quantile__q_0.1,money__quantile__q_0.2,money__quantile__q_0.3,money__quantile__q_0.4,money__quantile__q_0.6,money__quantile__q_0.7,money__quantile__q_0.8,money__quantile__q_0.9,money__autocorrelation__lag_0,money__autocorrelation__lag_1,money__autocorrelation__lag_2,money__autocorrelation__lag_3,money__autocorrelation__lag_4,"money__agg_autocorrelation__f_agg_""mean""__maxlag_40","money__agg_autocorrelation__f_agg_""median""__maxlag_40","money__agg_autocorrelation__f_agg_""var""__maxlag_40",money__partial_autocorrelation__lag_0,money__partial_autocorrelation__lag_1,money__number_cwt_peaks__n_1,money__number_cwt_peaks__n_5,money__number_peaks__n_1,money__number_peaks__n_3,money__number_peaks__n_5,money__number_peaks__n_10,money__number_peaks__n_50,money__binned_entropy__max_bins_10,money__index_mass_quantile__q_0.1,money__index_mass_quantile__q_0.2,money__index_mass_quantile__q_0.3,money__index_mass_quantile__q_0.4,money__index_mass_quantile__q_0.6,money__index_mass_quantile__q_0.7,money__index_mass_quantile__q_0.8,money__index_mass_quantile__q_0.9,"money__cwt_coefficients__coeff_0__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_0__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_1__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_2__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_3__w_20__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_2__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_5__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_10__widths_(2, 5, 10, 20)","money__cwt_coefficients__coeff_4__w_20__widths_(2, 5, 10, 20)",money__spkt_welch_density__coeff_2,money__ar_coefficient__coeff_10__k_10,"money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.2__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.4__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.0","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.4__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.2","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.6__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.4","money__change_quantiles__f_agg_""mean""__isabs_False__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_False__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_True__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_True__qh_0.8__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.6","money__change_quantiles__f_agg_""mean""__isabs_False__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""var""__isabs_False__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""mean""__isabs_True__qh_1.0__ql_0.8","money__change_quantiles__f_agg_""var""__isabs_True__qh_1.0__ql_0.8","money__fft_coefficient__attr_""real""__coeff_0","money__fft_coefficient__attr_""real""__coeff_1","money__fft_coefficient__attr_""real""__coeff_2","money__fft_coefficient__attr_""imag""__coeff_0","money__fft_coefficient__attr_""imag""__coeff_1","money__fft_coefficient__attr_""imag""__coeff_2","money__fft_coefficient__attr_""abs""__coeff_0","money__fft_coefficient__attr_""abs""__coeff_1","money__fft_coefficient__attr_""abs""__coeff_2","money__fft_coefficient__attr_""angle""__coeff_0","money__fft_coefficient__attr_""angle""__coeff_1","money__fft_coefficient__attr_""angle""__coeff_2","money__fft_aggregated__aggtype_""centroid""","money__fft_aggregated__aggtype_""variance""",money__value_count__value_0,money__value_count__value_1,money__value_count__value_-1,money__range_count__max_1__min_-1,money__range_count__max_0__min_1000000000000.0,money__range_count__max_1000000000000.0__min_0,money__approximate_entropy__m_2__r_0.1,money__approximate_entropy__m_2__r_0.3,money__approximate_entropy__m_2__r_0.5,money__approximate_entropy__m_2__r_0.7,money__approximate_entropy__m_2__r_0.9,"money__linear_trend__attr_""pvalue""","money__linear_trend__attr_""rvalue""","money__linear_trend__attr_""intercept""","money__linear_trend__attr_""slope""","money__linear_trend__attr_""stderr""","money__augmented_dickey_fuller__attr_""teststat""__autolag_""AIC""","money__augmented_dickey_fuller__attr_""pvalue""__autolag_""AIC""","money__augmented_dickey_fuller__attr_""usedlag""__autolag_""AIC""",money__number_crossing_m__m_0,money__number_crossing_m__m_-1,money__number_crossing_m__m_1,money__energy_ratio_by_chunks__num_segments_10__segment_focus_0,money__energy_ratio_by_chunks__num_segments_10__segment_focus_1,money__energy_ratio_by_chunks__num_segments_10__segment_focus_2,money__energy_ratio_by_chunks__num_segments_10__segment_focus_3,money__energy_ratio_by_chunks__num_segments_10__segment_focus_4,money__energy_ratio_by_chunks__num_segments_10__segment_focus_5,money__energy_ratio_by_chunks__num_segments_10__segment_focus_6,money__energy_ratio_by_chunks__num_segments_10__segment_focus_7,money__energy_ratio_by_chunks__num_segments_10__segment_focus_8,money__energy_ratio_by_chunks__num_segments_10__segment_focus_9,money__ratio_beyond_r_sigma__r_0.5,money__ratio_beyond_r_sigma__r_1,money__ratio_beyond_r_sigma__r_1.5,money__ratio_beyond_r_sigma__r_2,money__ratio_beyond_r_sigma__r_2.5,money__ratio_beyond_r_sigma__r_3,money__ratio_beyond_r_sigma__r_5,money__ratio_beyond_r_sigma__r_6,money__ratio_beyond_r_sigma__r_7,money__ratio_beyond_r_sigma__r_10,money__count_above__t_0,money__count_below__t_0,money__lempel_ziv_complexity__bins_2,money__lempel_ziv_complexity__bins_3,money__lempel_ziv_complexity__bins_5,money__lempel_ziv_complexity__bins_10,money__lempel_ziv_complexity__bins_100,money__fourier_entropy__bins_2,money__fourier_entropy__bins_3,money__fourier_entropy__bins_5,money__fourier_entropy__bins_10,money__fourier_entropy__bins_100,money__permutation_entropy__dimension_3__tau_1,money__permutation_entropy__dimension_4__tau_1,money__permutation_entropy__dimension_5__tau_1
0,ID_K00S4N4,2000,0.0,0,0,35,7,1,41.0,1,5,5,14740,-0.153846,-0.846154,"[1849.076923076923, 1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155]","[0.20691994572591588, 0.07123473541383989, 0.06173677069199457, 0.07123473541383989, 0.07123473541383989]",0.083107,0.071235,0.080733,0.035617,0.118725,0.128223,13,0.482361,-1850.230769,0.0,0.0,0.0,1.0,0.482361,0.06185,0.03867,-0.033921,0.022614,0.071235,0.096472,5.0,0.055346,0.573702,0.003063,2.210847,4.91504,0.111221,0.154681,4.0,1.0,1.0,4.0,0.2,0.0,0.6,0.4,0.333333,0.6,0.071235,0.213704,0.6,0.20692,0.061737,-0.000896,-0.00233,0.0,0.000512,0.00091,0.0,2.463553,0.136348,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.065536,0.069335,0.071235,0.071235,0.071235,0.071235,0.098372,0.152646,1.0,-0.032419,-0.252773,-0.351019,-0.909967,-0.386545,-0.301896,0.104633,1.0,-0.032419,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.500402,0.2,0.2,0.2,0.2,0.6,0.6,0.8,1.0,0.155818,0.124829,0.091932,0.065688,0.152741,0.147113,0.110507,0.079332,0.095694,0.159607,0.127213,0.09264,0.097664,0.097589,0.073848,0.053116,0.072603,0.072199,0.054717,0.039373,7.9e-05,0.0,0.0,0.0,0.0,0.0,0.0,6e-05,0.006332,2e-05,0.0,6e-05,0.006332,2e-05,0.0,6e-05,0.006332,2e-05,-0.033921,0.003497,0.03867,0.003152,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.067843,0.004603,0.067843,0.004603,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.067843,0.004603,0.067843,0.004603,0.0,0.0,0.0,0.0,-0.067843,0.004603,0.067843,0.004603,0.0,0.0,0.0,0.0,0.482361,0.143369,0.13275,0.0,0.005583,-0.009033,0.482361,0.143478,0.133057,0.0,2.229957,-3.89274,0.539721,0.599082,0.0,0.0,0.0,5.0,0.0,5.0,0.287682,0.074179,0.074179,0.074179,0.074179,0.194141,-0.693409,0.150746,-0.027137,0.016281,-21.28581,0.0,0.0,0.0,0.0,0.0,0.692248,0.082043,0.061623,0.082043,0.082043,0.0,0.0,0.0,0.0,0.0,0.4,0.2,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.6,0.8,0.8,0.8,0.8,0.636514,1.098612,1.098612,1.098612,1.098612,1.098612,0.693147,-0.0
1,ID_6L67PAA,2000,0.0,0,0,35,7,1,33.0,0,13,5,14740,-0.153846,-5.30769,"[1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155, 1849.5384615384614, 1849.6923076923076]","[0.27137042062415195, 0.07123473541383989, 0.07123473541383989, 0.07123473541383989, 0.07123473541383989, 0.027137042062415198]",0.0,0.0,0.0,0.0,0.0,0.0,13,0.583446,-1855.0,0.0,0.0,0.0,1.0,0.583446,0.094676,0.048847,-0.048847,0.019505,0.071235,0.097241,6.0,0.07952,0.817765,0.006323,2.207943,5.242482,0.125616,0.244233,5.0,1.0,1.0,5.0,0.166667,0.0,1.0,0.833333,0.333333,0.666667,0.071235,0.284939,0.5,0.27137,0.027137,-0.001298,-0.002597,0.0,0.000559,0.000757,0.0,2.577156,0.204936,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.049186,0.071235,0.071235,0.071235,0.071235,0.071235,0.071235,0.171303,1.0,-0.021391,-0.053478,-0.106955,-0.21391,-0.465237,-0.106955,0.540984,1.0,-0.021391,2.0,3.0,0.0,0.0,0.0,0.0,0.0,0.867563,0.166667,0.166667,0.166667,0.166667,0.5,0.5,0.666667,0.833333,0.154403,0.146012,0.110788,0.079773,0.194101,0.17323,0.130253,0.093575,0.137533,0.188332,0.147507,0.106984,0.061102,0.179145,0.151092,0.111547,0.088067,0.105918,0.082761,0.060016,0.000108,0.0,-0.011024,0.0003646137,0.011024,0.0003646137,-0.011024,0.000365,0.011024,0.000365,-0.011024,0.000365,0.011024,0.000365,-0.011024,0.000365,0.011024,0.000365,-0.048847,0.006014,0.048847,0.006014,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.050034,0.00751,0.050034,0.00751,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.050034,0.00751,0.050034,0.00751,0.0,0.0,0.0,0.0,-0.050034,0.00751,0.050034,0.00751,-0.050034,0.00751,0.050034,0.00751,0.583446,0.178087,0.222185,0.0,-0.03819,-0.03819,0.583446,0.182136,0.225443,0.0,-12.103449,-9.752865,1.105616,1.434553,0.0,0.0,0.0,6.0,0.0,6.0,0.08945,0.08945,0.08945,0.061933,0.061933,0.086379,-0.749328,0.184467,-0.03489,0.015417,-7.671433,1.589786e-11,0.0,0.0,0.0,0.0,0.777832,0.053597,0.053597,0.053597,0.053597,0.007778,0.0,0.0,0.0,0.0,0.333333,0.166667,0.166667,0.166667,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.5,0.666667,0.666667,0.666667,0.666667,0.562335,0.562335,1.039721,1.039721,1.386294,1.039721,1.098612,0.693147
2,ID_102CV85,2000,-6.92857,35,0,35,7,0,48.0,2,22,0,29480,-9.78571,-9.78571,"[1716.4285714285713, 1716.5, 1716.5714285714287, 1716.642857142857, 1716.7142857142858, 1716.7857142857142, 1716.857142857143, 1716.9285714285713, 1717.0]","[0.14399592944369063, 0.03324287652645862, 0.024932157394843963, 0.024932157394843963, 0.049864314789687926, 0.024932157394843963, 0.03324287652645862, 0.031037991858887382, 0.024932157394843963]",0.033243,0.033243,0.041554,0.033243,0.031716,0.012042,14,0.391113,-1726.785714,0.0,0.0,1.0,1.0,0.391113,0.028881,0.023194,-0.014883,0.007475,0.031038,0.043457,9.0,0.036339,0.836206,0.001321,2.770409,7.892134,0.056648,0.18555,4.0,1.0,2.0,7.0,0.111111,0.0,1.0,0.222222,0.4,0.666667,0.058175,0.166214,0.555556,0.143996,0.024932,-9.6e-05,-9.9e-05,-0.000165,4.2e-05,6e-05,6.2e-05,3.21977,0.117003,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.024932,0.024932,0.024932,0.026153,0.032802,0.033243,0.039891,0.068691,1.0,-0.017588,-0.118454,-0.142864,0.171747,-0.285448,-0.14172,0.204077,1.0,-0.017588,2.0,1.0,2.0,1.0,0.0,0.0,0.0,0.683739,0.111111,0.111111,0.111111,0.222222,0.555556,0.555556,0.777778,0.888889,0.083184,0.085711,0.071464,0.052886,0.070341,0.094918,0.078393,0.057747,0.024422,0.097752,0.085607,0.063851,-0.006188,0.094366,0.090952,0.06929,-0.007239,0.085496,0.093427,0.073297,0.000163,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.003053,9e-06,0.003053,9e-06,-0.001662,3.3e-05,0.004986,1.1e-05,-0.014883,0.00149,0.023194,0.001173,0.0,0.0,0.0,0.0,-0.003053,9e-06,0.003053,9e-06,-0.001662,3.3e-05,0.004986,1.1e-05,-0.014883,0.00149,0.023194,0.001173,0.0,0.0,0.0,0.0,-0.002205,0.0,0.002205,0.0,-0.056479,0.002946,0.056479,0.002946,0.0,0.0,0.0,0.0,-0.110753,0.0,0.110753,0.0,0.0,0.0,0.0,0.0,0.391113,0.098906,0.129713,0.0,-0.000659,0.002733,0.391113,0.098909,0.129742,0.0,-0.381725,1.206863,1.376804,2.25567,0.0,0.0,0.0,9.0,0.0,9.0,0.039755,0.401533,0.314616,0.033346,0.033346,0.123215,-0.552138,0.07454,-0.007771,0.004435,-3.027372,0.03241609,2.0,0.0,0.0,0.0,0.717934,0.038263,0.021523,0.021523,0.086092,0.021523,0.038263,0.033356,0.021523,0.0,0.555556,0.111111,0.111111,0.111111,0.111111,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.444444,0.555556,0.555556,0.666667,0.666667,0.500402,1.05492,1.332179,1.332179,1.609438,1.351784,1.791759,1.609438
3,ID_HXBJFHB,2000,0.0,0,0,35,7,0,43.0,5,43,6,14740,-0.153846,-5.76923,"[1848.7692307692307, 1848.8461538461538, 1848.923076923077, 1849.0, 1849.076923076923, 1849.1538461538462, 1849.2307692307693, 1849.3076923076924, 1849.3846153846155, 1849.4615384615386, 1849.6153846153845]","[0.1523066485753053, 0.06648575305291723, 0.06648575305291723, 0.08310719131614654, 0.06648575305291723, 0.06648575305291723, 0.06648575305291723, 0.08310719131614654, 0.049864314789687926, 0.03324287652645862, 0.016960651289009497]",0.016961,0.067843,0.016961,0.033921,0.037992,0.078019,13,0.751018,-1855.384615,0.0,0.0,0.0,1.0,0.751018,0.062992,0.020183,-0.013535,0.003863,0.066486,0.068274,11.0,0.032637,0.478023,0.001065,1.266365,3.647771,0.075674,0.201832,3.0,1.0,3.0,8.0,0.090909,0.0,1.0,0.909091,0.333333,0.636364,0.149593,0.498643,0.545455,0.152307,0.016961,-0.000178,-0.000266,-0.000451,0.00032,0.000322,0.000341,3.039506,0.099199,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.033243,0.049864,0.066486,0.066486,0.066486,0.066486,0.083107,0.083107,1.0,0.182993,0.024463,0.062695,0.035337,-0.553409,-0.010635,1.537945,1.0,0.182993,3.0,3.0,2.0,1.0,0.0,0.0,0.0,1.540306,0.090909,0.090909,0.272727,0.363636,0.545455,0.636364,0.727273,0.818182,0.073752,0.127314,0.122935,0.094515,0.08708,0.151169,0.14087,0.107358,0.056639,0.166722,0.16021,0.122838,0.022743,0.174556,0.17197,0.132181,0.009224,0.1719,0.177695,0.137996,0.000182,0.0,-0.016452,2.876637e-08,0.016452,2.876637e-08,-0.006581,6.5e-05,0.006581,6.5e-05,-0.006581,6.5e-05,0.006581,6.5e-05,-0.005503,0.000245,0.01289,0.000109,-0.013535,0.000801,0.020183,0.000577,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-0.002374,0.000271,0.011872,0.000135,-0.012805,0.000998,0.021116,0.000717,0.0,0.0,0.0,0.0,0.00277,0.00013,0.008311,6.9e-05,-0.009886,0.001073,0.019384,0.000795,0.00277,0.00013,0.008311,6.9e-05,-0.009886,0.001073,0.019384,0.000795,0.0,0.0,0.0,0.0,0.751018,0.019463,0.084651,0.0,-0.077357,-0.07726,0.751018,0.079768,0.114608,0.0,-75.877226,-42.386049,1.334589,3.157348,0.0,0.0,0.0,11.0,0.0,11.0,0.20882,0.20882,0.20882,0.22199,0.22199,0.00697,-0.757148,0.107346,-0.007814,0.002247,-3.372766,0.01192308,0.0,0.0,0.0,0.0,0.438432,0.070173,0.109646,0.070173,0.070173,0.070173,0.109646,0.039473,0.017543,0.004567,0.363636,0.272727,0.181818,0.090909,0.090909,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.454545,0.454545,0.636364,0.636364,0.636364,0.450561,1.011404,1.329661,1.329661,1.791759,1.522955,1.906155,1.94591
4,ID_3K9VZ5J,2000,0.0,0,0,35,7,0,56.0,1,14,5,14740,1.23077,-5.69231,"[1849.6923076923076, 1849.7692307692307, 1849.8461538461538, 1849.923076923077, 1850.0, 1850.076923076923, 1850.1538461538462, 1850.2307692307693, 1850.3076923076924, 1850.3846153846155, 1850.4615384615386, 1850.5384615384614]","[0.1865671641791045, 0.06784260515603799, 0.05088195386702849, 0.06784260515603799, 0.06478968792401628, 0.05970149253731343, 0.018995929443690638, 0.04511533242876527, 0.05223880597014925, 0.028493894165535955, 0.03561736770691994, 0.049864314789687926]",0.042741,0.054613,0.04749,0.058005,0.016621,0.052578,13,0.727951,-1856.230769,0.0,0.0,0.0,1.0,0.727951,0.064056,0.025441,-0.012428,0.006649,0.05156,0.060663,12.0,0.040719,0.671233,0.001658,2.650186,8.290045,0.073061,0.279851,7.0,2.0,4.0,8.0,0.083333,0.0,0.583333,0.5,0.090909,0.166667,0.067843,0.135685,0.916667,0.186567,0.018996,-0.000234,-0.000252,-0.000459,0.00017,0.000172,0.000149,3.286974,0.133841,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.029206,0.037517,0.04654,0.050271,0.056716,0.063263,0.067232,0.067843,1.0,0.16203,0.001526,0.161405,0.152004,-0.282755,-0.169501,0.17316,1.0,0.16203,3.0,3.0,2.0,0.0,0.0,0.0,0.0,1.286057,0.083333,0.083333,0.166667,0.25,0.416667,0.583333,0.75,0.916667,0.072794,0.118274,0.119627,0.093331,0.110065,0.143914,0.129505,0.097922,0.08322,0.156015,0.140721,0.106453,0.035197,0.156177,0.150786,0.115793,0.006246,0.147458,0.154658,0.120605,0.000536,-0.094693,0.007123,0.0,0.007123,0.0,0.01583,6.1e-05,0.01583,6.1e-05,0.006174,0.000272,0.015672,6.5e-05,-0.002132,0.000457,0.017736,0.000147,-0.012428,0.001474,0.025441,0.000981,0.0,0.0,0.0,0.0,0.007123,0.0,0.007123,0.0,0.001018,3.7e-05,0.006106,1e-06,-0.019957,0.002061,0.027985,0.001676,0.0,0.0,0.0,0.0,-0.005088,0.0,0.005088,0.0,-0.025373,0.002297,0.032157,0.001907,-0.005088,0.0,0.005088,0.0,-0.042289,0.002922,0.042289,0.002922,-0.118725,0.0,0.118725,0.0,0.727951,0.16347,0.118725,0.0,-0.07972,-0.005288,0.727951,0.181873,0.118842,0.0,-25.997251,-2.55018,1.698823,4.03199,0.0,0.0,0.0,12.0,0.0,12.0,0.09531,0.231412,0.365024,0.367687,0.209865,0.027835,-0.630862,0.10159,-0.007441,0.002894,-2.374949,0.1489321,4.0,0.0,0.0,0.0,0.615246,0.112271,0.065532,0.055643,0.005633,0.031775,0.042602,0.012675,0.019805,0.038817,0.333333,0.166667,0.083333,0.083333,0.083333,0.083333,0.0,0.0,0.0,0.0,1.0,0.0,0.416667,0.416667,0.583333,0.666667,0.833333,0.59827,1.078992,1.549826,1.94591,1.94591,1.695743,2.043192,2.079442


In [39]:
df_test=merged1[merged1['m1']==0]
merged1.drop(merged1[merged1['m1']==0].index,inplace=True)

In [40]:
df_test.shape

(9336, 294)

In [41]:
merged1.shape

(28007, 294)

In [42]:
m1=merged1['m1']
m2=merged1['m2']
m3=merged1['m3']
m4=merged1['m4']
m5=merged1['m5']
m6=merged1['m6']

In [43]:
merged1.drop(columns=['m1','m2','m3','m4','m5','m6'],inplace=True)

In [44]:
df_test.drop(columns=['m1','m2','m3','m4','m5','m6'],inplace=True)

In [45]:
df_test.shape

(9336, 288)

In [46]:
merged1.shape

(28007, 288)

In [47]:
X_train=merged1.copy()

In [48]:
X_train.drop(columns=['ID', 'UpsellDate', 'ExpectedTermDate', 'LastPaymentDate', 'TransactionDates', 'PaymentsHistory','time'],inplace=True)

In [49]:
m1=m1*merged1['TotalContractValue']
m2=m2*merged1['TotalContractValue']
m3=m3*merged1['TotalContractValue']
m4=m4*merged1['TotalContractValue']
m5=m5*merged1['TotalContractValue']
m6=m6*merged1['TotalContractValue']

In [50]:

xtrain_m1, xval_m1, ytrain_m1, yval_m1 = train_test_split(
    X_train, 
    m1, 
    test_size=.3, 
    random_state=21, 
    shuffle=True
)
xtrain_m2, xval_m2, ytrain_m2, yval_m2 = train_test_split(
    X_train, 
    m2, 
    test_size=.3, 
    random_state=21, 
    shuffle=True
)
xtrain_m3, xval_m3, ytrain_m3, yval_m3 = train_test_split(
    X_train, 
    m3, 
    test_size=.3, 
    random_state=21, 
    shuffle=True
)
xtrain_m4, xval_m4, ytrain_m4, yval_m4 = train_test_split(
    X_train, 
    m4, 
    test_size=.3, 
    random_state=21, 
    shuffle=True
)
xtrain_m5, xval_m5, ytrain_m5, yval_m5 = train_test_split(
    X_train, 
    m5, 
    test_size=.3, 
    random_state=21, 
    shuffle=True
)
xtrain_m6, xval_m6, ytrain_m6, yval_m6 = train_test_split(
    X_train, 
    m6, 
    test_size=.3, 
    random_state=21, 
    shuffle=True
)

In [51]:
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_squared_error
lgbm1=LGBMRegressor()
lgbm1.fit(xtrain_m1,ytrain_m1)
pred1=lgbm1.predict(xval_m1)
mse1=mean_squared_error(pred1,yval_m1)**0.5
print(mse1)

395.3638392903541


In [52]:
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_squared_error
lgbm2=LGBMRegressor()
lgbm2.fit(xtrain_m2,ytrain_m2)
pred2=lgbm2.predict(xval_m2)
mse2=mean_squared_error(pred2,yval_m2)**0.5
print(mse2)

440.2042989535992


In [53]:
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_squared_error
lgbm3=LGBMRegressor()
lgbm3.fit(xtrain_m3,ytrain_m3)
pred3=lgbm3.predict(xval_m3)
mse3=mean_squared_error(pred3,yval_m3)**0.5
print(mse3)

527.648214135509


In [54]:
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_squared_error
lgbm4=LGBMRegressor()
lgbm4.fit(xtrain_m4,ytrain_m4)
pred4=lgbm4.predict(xval_m4)
mse4=mean_squared_error(pred4,yval_m4)**0.5
print(mse4)

454.11525158646407


In [55]:
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_squared_error
lgbm5=LGBMRegressor()
lgbm5.fit(xtrain_m5,ytrain_m5)
pred5=lgbm5.predict(xval_m5)
mse5=mean_squared_error(pred5,yval_m5)**0.5
print(mse5)

920.6644900205646


In [56]:
from lightgbm import LGBMRegressor
from sklearn.metrics import mean_squared_error
lgbm6=LGBMRegressor()
lgbm6.fit(xtrain_m6,ytrain_m6)
pred6=lgbm6.predict(xval_m6)
mse6=mean_squared_error(pred6,yval_m6)**0.5
print(mse6)

1289.566025197475


In [57]:
subm=df_test[['ID']].copy()

In [58]:
subm.shape

(9336, 1)

In [59]:
subm['ID'].head()

1     ID_6L67PAA
5     ID_VJ80SX2
8     ID_7OU9HLK
9     ID_WVWTPGK
12    ID_04DSDQS
Name: ID, dtype: object

In [60]:
df_test.drop(columns=['ID', 'UpsellDate', 'ExpectedTermDate', 'LastPaymentDate', 'TransactionDates', 'PaymentsHistory','time'],inplace=True)

In [71]:
fin1=lgbm1.predict(df_test)
subm1=subm.copy()
subm1['Target']=fin1
subm1['ID']=subm1['ID']+' x m1'

In [74]:
fin2=lgbm2.predict(df_test)
subm2=subm.copy()
subm2['Target']=fin2
subm2['ID']=subm2['ID']+' x m2'

In [76]:
fin3=lgbm3.predict(df_test)
subm3=subm.copy()
subm3['Target']=fin3
subm3['ID']=subm3['ID']+' x m3'

In [77]:
fin4=lgbm4.predict(df_test)
subm4=subm.copy()
subm4['Target']=fin4
subm4['ID']=subm4['ID']+' x m4'

In [78]:
fin5=lgbm5.predict(df_test)
subm5=subm.copy()
subm5['Target']=fin5
subm5['ID']=subm5['ID']+' x m5'

In [79]:
fin6=lgbm6.predict(df_test)
subm6=subm.copy()
subm6['Target']=fin6
subm6['ID']=subm6['ID']+' x m6'

In [80]:
frames=[subm1,subm2,subm3,subm4,subm5,subm6]
submission=pd.concat(frames)

In [81]:
submission.sort_values(by='ID',inplace=True)

In [82]:
submission.head()

Unnamed: 0,ID,Target
4203,ID_000RHRU x m1,260.015533
4203,ID_000RHRU x m2,375.724108
4203,ID_000RHRU x m3,415.364648
4203,ID_000RHRU x m4,419.662794
4203,ID_000RHRU x m5,567.656847


In [83]:
submission.to_csv('my_submission.csv', index=False)
print("Your submission was successfully saved!")

Your submission was successfully saved!
