# Scripts for loading results

In [2]:
import sys
import os
import glob
import re
import datetime
import math
import random
from pathlib import Path
import importlib
import shutil

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import scipy as sp
import statsmodels.api as sm
import sklearn as sk
from sktime.utils.data_io import load_from_tsfile_to_dataframe
from IPython.display import display, HTML

from experiments.python.aggregating import get_agg_matrix
from experiments.python.loading import load_experiments

%matplotlib inline
pd.set_option("display.max_rows", 100)
pd.set_option("display.max_columns", 100)
pd.set_option('display.width', 2000)
pd.set_option('display.float_format', lambda x: '%.4f' % x)
pd.set_option("display.max_seq_items", 100)

In [3]:
%load_ext autoreload

PROJECT_DIR  = "E:/git/dotnet54/TS-CHIEF-DEV/"
SCRIPTS_DIR = f"{PROJECT_DIR}/experiments/python/"
def load_modules():
    %reload_ext autoreload
    %autoreload 2

    print("loading utility modules...")
    %run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/utils"
    %run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/loading"
    %run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/aggregating"
    # %run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/plotting"

load_modules()

loading utility modules...
utils.py 29-4-2021.1
PROJECT_DIR: E:/git/dotnet54/TS-CHIEF-DEV/
utils.py 29-4-2021.1
PROJECT_DIR: E:/git/dotnet54/TS-CHIEF-DEV/
loading.py 16-5-2021.1
aggregating.py 29-4-2021.1


## Testing

In [37]:
load_modules()


INPUT = f"E:/git/experiments/thesis/out/ch3/"
OUTPUT = f"{INPUT}/.out"
exp = load_experiments(input_dir = INPUT, output_dir = OUTPUT,
                       # include=['k100e1','k100e2','k100e5','k100e10'], exclude=None,
                       include=['k100e1', 'k100e2'], exclude=None,
                       use_cache=True, save_intermediate=False, save=True)

print(exp.keys())
display(exp['k100e1'].head())

loading utility modules...
utils.py 29-4-2021.1
PROJECT_DIR: E:/git/dotnet54/TS-CHIEF-DEV/
loading.py 18-6-2021.1
aggregating.py 18-6-2021.1
load_experiments:: 1. loading k100e1 from cache
load_experiments:: 3. loading k100e2 from cache
dict_keys(['k100e1', 'k100e2'])


Unnamed: 0_level_0,batch_index,exp_name,timestamp,dataset,train_size,test_size,dimensions,length,classes,accuracy,error_rate,correct,errors,total_time_s,total_time_hr,train_time_hr,test_time_hr,total_time_formatted,train_time_formatted,test_time_formatted,train_time_ns,test_time_ns,init_time_ns,rand_seed,threads,cpus,hostname,version,build_date,version_tag,experiment_name,experiment_id,normalize,shuffle,fold_no,repeat_no,train_classes,test_classes,max_memory,total_memory,free_memory,free_memory_after_init,free_memory_after_train,free_memory_after_test,alloc_memory,alloc_memory_after_init,alloc_memory_after_train,alloc_memory_after_test,max_mem_usage,num_trees,...,wddtw_win,lcss_win,twe_win,erp_win,msm_win,ee_time,boss_time,rif_time,cif_time,randf_time,rotf_time,st_time,tsf_time,it_time,rt_time,euc_time,dtwf_time,dtw_time,ddtwf_time,ddtw_time,wdtw_time,wddtw_time,lcss_time,twe_time,erp_time,msm_time,rif_acf_count,rif_pacf_count,rif_arma_count,rif_ps_count,rif_dft_count,rif_acf_win,rif_pacf_win,rif_arma_win,rif_ps_win,rif_dft_win,rif_acf_time,rif_pacf_time,rif_arma_time,rif_ps_time,rif_dft_time,tree_accuracy_mean,tree_accuracy_std,tree_total_time_s_mean,tree_total_time_s_std,args,boss_transform_time,st_transform_time,it_transform_time,rt_transform_time
index,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1
0,0,k100e1,13-06-2021 19:47:24,Adiac,390,391,1,176,37,0.7033,0.2967,275,116,20.1922,0.0056,0.0027,0.0029,0-0:0:20.192,0-0:0:9.593,0-0:0:10.598,9593722423,10598509152,67476,8478120861627832,0,16,m3h005,2.1.1,2021.6.01,chief-refactored-2-thesis,,df6c69df,False,False,0,0,37,37,48000,616,391,391,245,212,225,225,371,404,504.0,100,...,844.0,898.0,927.0,947.0,921.0,122838710603.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,120087959.0,5105351871.0,4764289670.0,7632134594.0,12694762161.0,22644608237.0,20426511564.0,3832804995.0,80774358334.0,11769630043.0,78130618141.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4946,0.1087,2.5842,2.4773,-data=../data/ -archive=Univariate2018_ts -ove...,0.0,0.0,0.0,0.0
1,1,k100e1,13-06-2021 19:42:20,ArrowHead,36,175,1,251,3,0.8514,0.1486,149,26,2.1668,0.0006,0.0001,0.0005,0-0:0:2.166,0-0:0:0.345,0-0:0:1.821,345312838,1821500663,54997,8478120861627832,0,16,m3h005,2.1.1,2021.6.01,chief-refactored-2-thesis,,df6c69df,False,False,0,0,3,3,48000,216,134,134,145,65,82,82,71,151,151.0,100,...,109.0,113.0,111.0,112.0,87.0,4615304805.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7651697.0,776602734.0,625222862.0,1117474886.0,1166233923.0,3655404860.0,5870155762.0,664484971.0,8341606915.0,1590647295.0,5780816322.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.7025,0.0705,0.2998,0.1426,-data=../data/ -archive=Univariate2018_ts -ove...,0.0,0.0,0.0,0.0
2,2,k100e1,13-06-2021 19:42:58,Beef,30,30,1,470,5,0.7,0.3,21,9,2.4181,0.0007,0.0003,0.0004,0-0:0:2.418,0-0:0:1.079,0-0:0:1.338,1079091181,1338968378,83940,8478120861627832,0,16,m3h005,2.1.1,2021.6.01,chief-refactored-2-thesis,,df6c69df,False,False,0,0,5,5,48000,464,315,315,208,238,149,149,256,226,290.0,100,...,122.0,97.0,94.0,124.0,100.0,14337122509.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3042048.0,497005909.0,447446664.0,1197307928.0,1391885264.0,2875543330.0,3211967942.0,484158653.0,7070909153.0,1881115540.0,11033657352.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.5847,0.0918,0.3253,0.2076,-data=../data/ -archive=Univariate2018_ts -ove...,0.0,0.0,0.0,0.0
3,3,k100e1,13-06-2021 19:42:24,BeetleFly,20,20,1,512,2,0.65,0.35,13,7,1.3727,0.0004,0.0002,0.0002,0-0:0:1.372,0-0:0:0.596,0-0:0:0.776,596536920,776138358,117772,8478120861627832,0,16,m3h005,2.1.1,2021.6.01,chief-refactored-2-thesis,,df6c69df,False,False,0,0,2,2,48000,456,213,213,147,271,123,123,189,185,195.0,100,...,123.0,98.0,86.0,95.0,93.0,8454996953.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2227365.0,396059319.0,264020223.0,601003399.0,607146447.0,2214497735.0,4040519282.0,489359118.0,4085041121.0,790970369.0,4963281982.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.6295,0.1299,0.1926,0.0775,-data=../data/ -archive=Univariate2018_ts -ove...,0.0,0.0,0.0,0.0
4,4,k100e1,13-06-2021 19:42:22,BirdChicken,20,20,1,512,2,0.85,0.15,17,3,1.4695,0.0004,0.0002,0.0002,0-0:0:1.469,0-0:0:0.698,0-0:0:0.771,698475429,771009258,74144,8478120861627832,0,16,m3h005,2.1.1,2021.6.01,chief-refactored-2-thesis,,df6c69df,False,False,0,0,2,2,48000,336,146,146,173,202,70,70,163,134,216.0,100,...,76.0,84.0,91.0,84.0,101.0,9560607713.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2192888.0,344598952.0,459372227.0,661494400.0,566249672.0,1736267857.0,2843990724.0,556396867.0,5058859088.0,903223116.0,6308658431.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.6985,0.1113,0.2019,0.0927,-data=../data/ -archive=Univariate2018_ts -ove...,0.0,0.0,0.0,0.0


In [39]:
%run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/aggregating"

exp['k100e1'].head()

get_agg_matrix(exp, ['k100e1', 'k100e2'], 'accuracy')

aggregating.py 18-6-2021.1


Unnamed: 0,dataset,k100e1,k100e2
0,Adiac,0.7136,0.7379
1,ArrowHead,0.84,0.8657
2,Beef,0.6833,0.7167
3,BeetleFly,0.675,0.775
4,BirdChicken,0.825,0.8
5,CBF,0.9828,0.9844
6,Car,0.8167,0.8417
7,ChlorineConcentration,0.628,0.6294
8,CinCECGTorso,0.8949,0.9127
9,Coffee,1.0,1.0


In [26]:
%load_ext autoreload
%autoreload 2

%run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/utils"

# from experiments.python.loading import *

INPUT = f"E:/git/experiments/thesis/out/0105/"
OUTPUT = f"E:/git/dotnet54/TS-CHIEF-DEV/experiments/thesis/data/tmp/"

# tmp =  load_forest_csv("k500e5", input_dir=INPUT, output_dir=OUTPUT, num_folds=1, num_repeats=1,
#                 save_intermediate=True, save=True, verbosity=0)
# tmp.head()

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload
utils.py 29-4-2021.1
PROJECT_DIR: E:/git/dotnet54/TS-CHIEF-DEV/


## Experiments

In [None]:

load_forest_csv("k500e5", input_dir=INPUT, output_dir=OUTPUT, num_folds=1, num_repeats=1,
                save_intermediate=True, save=True, verbosity=0)
load_forest_csv("k500b100", input_dir=INPUT, output_dir=OUTPUT, num_folds=1, num_repeats=1,
                save_intermediate=True, save=True, verbosity=0)
load_forest_csv("k500r100", input_dir=INPUT, output_dir=OUTPUT, num_folds=1, num_repeats=1,
                save_intermediate=True, save=True, verbosity=0)

load_forest_csv("k500b100_bv1", input_dir=INPUT, output_dir=OUTPUT, num_folds=1, num_repeats=1,
                save_intermediate=True, save=True, verbosity=0)
load_forest_csv("k500r100_rv1", input_dir=INPUT, output_dir=OUTPUT, num_folds=1, num_repeats=1,
                save_intermediate=True, save=True, verbosity=0)

## WORK AREA

In [45]:
%run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/plotting"

plotting.py 29-4-2021.1


In [46]:
# tmp = read_csv("k500b100.all_forest", input_dir=OUTPUT)

tmp = read_and_merge_csv("k500b100.all_forest", "k500b100_bv1.all_forest", input_dir=OUTPUT)[0]
tmp.head()

from plotting import scatter 

scatter(tmp['accuracy_x'], tmp['accuracy_y'])


TypeError: 'NoneType' object is not subscriptable

In [None]:
load_modules()

# %run "E:/git/dotnet54/TS-CHIEF-DEV/experiments/python/utils"

INPUT = f"E:/git/experiments/mpf/11-2-2020/0704/topk/"
OUTPUT = f"E:/git/experiments/mpf/11-2-2020/0704/topk/"
exp_topk = load_experiments(input_dir = INPUT, output_dir = OUTPUT)

print(exp_topk.keys())

In [None]:
INPUT = f"{PROJECT_DIR}/out/test/topk/"
OUTPUT = f"{PROJECT_DIR}/out/test/topk/"

df_exp = load_experiments(input_dir=INPUT, output_dir=OUTPUT)