In [1]:
import os
import re
import warnings

import numpy as np
import pandas as pd

# Silence every warning category for the rest of the session.
# NOTE(review): this also hides deprecation warnings from numpy/pandas — confirm that is intended.
warnings.simplefilter('ignore')

# Echo the working directory; the relative "tables/..." paths used below resolve against it.
os.getcwd()

'/Users/seb/repos/ml/automlbenchmark/reports'

In [2]:
# A score cell is a number, optionally followed by " (<digits>)".
# The number may carry an exponent ("7.9e-05"), which is how str() renders small floats,
# and the parenthesised count may have any number of digits ("(10)").
_SCORE_CELL_RE = re.compile(
    r"(?P<value>-?\d+\.?\d*(?:[eE][-+]?\d+)?)( \((?P<imp>\d*)\))?"
)


def parse_value(val):
    """Split one score-table cell into its numeric text and its parenthesised count.

    :param val: cell content as a string, e.g. "0.93", "-1.2 (3)" or "7.9e-05".
    :return: dict with keys 'value' and 'imp'. On a match, 'value' is the numeric
        part as a string and 'imp' is the digits found inside the parentheses
        (None when there are no parentheses). When the whole string does not
        match, 'value' is NaN and 'imp' is None.
        NOTE(review): 'imp' presumably counts imputed results — confirm against
        whatever writes score_summary.csv.
    """
    m = _SCORE_CELL_RE.fullmatch(val)
    if m is None:
        # Anything unparseable (including the text "nan") is reported as missing.
        return dict(value=np.nan, imp=None)
    return m.groupdict()

def get_scores(duration):
    """Load the score summary table for one duration as a float DataFrame.

    Reads "tables/{duration}h/score_summary.csv" (relative to the current
    working directory) with the 'type' and 'task' columns as index. Each cell
    is converted to a string and run through parse_value; only its 'value'
    part is kept, so cells that do not parse become NaN.

    :param duration: value interpolated into the directory name (e.g. 1 -> "tables/1h").
    :return: DataFrame with the same index/columns as the CSV and float values.
    """
    raw_scores = pd.read_csv(f"tables/{duration}h/score_summary.csv", index_col=['type', 'task'])
    # Column-wise Series.map is the version-independent element-wise transform:
    # DataFrame.applymap is deprecated since pandas 2.1.
    values = raw_scores.apply(
        lambda column: column.map(lambda cell: parse_value(str(cell))['value'])
    )
    # Use the builtin float: the np.float alias was removed in NumPy 1.24.
    return values.astype(float)

def calc_improvements(lhs, rhs):
    """Compare two score tables and return the absolute and percentage change.

    :param lhs: baseline scores.
    :param rhs: scores to compare against the baseline.
    :return: tuple (improvement, relative_improvement) where improvement is
        rhs - lhs and relative_improvement is that difference expressed as a
        percentage of |lhs|. Rows in which every column is NaN are dropped
        from each result.
    """
    delta = rhs - lhs
    baseline_magnitude = lhs.abs()
    percent_delta = delta * 100 / baseline_magnitude
    return delta.dropna(how='all'), percent_delta.dropna(how='all')

# Score tables for each duration (read from tables/<N>h/score_summary.csv).
scores_1h = get_scores(duration=1)
scores_4h = get_scores(duration=4)
scores_8h = get_scores(duration=8)

# Change when going from the 1h table to the 4h table.
improvement_1to4, relative_improvement_1to4 = calc_improvements(lhs=scores_1h, rhs=scores_4h)

# Change when going from the 4h table to the 8h table.
improvement_4to8, relative_improvement_4to8 = calc_improvements(lhs=scores_4h, rhs=scores_8h)


In [3]:
improvement_1to4

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,adult,0.00025,0.001521,0.0,0.003847,-2e-05,0.001725,0.000143
binary,amazon_employee_access,-0.006552,0.011058,0.0,0.001357,0.000228,-0.002022,0.000511
binary,apsfailure,0.000343,0.019574,0.0,-0.000367,0.000555,0.00146,0.000763
binary,australian,-0.000165,0.008012,0.0,-0.004181,-0.000936,0.004282,-0.002374
binary,bank-marketing,-0.00044,0.082493,0.0,-1.5e-05,-0.000223,0.000578,7.9e-05
binary,blood-transfusion,0.006063,0.001063,0.0,0.007648,-0.002072,-0.017317,-0.001614
binary,christine,0.001684,0.006535,0.0,-0.001976,-0.000145,0.006124,-0.000446
binary,credit-g,-0.000143,-0.00881,0.0,0.001001,-0.00031,-0.014667,-0.002238
binary,guiellermo,0.003458,-0.001681,0.0,0.002686,3.8e-05,0.03434,0.000262
binary,higgs,0.016138,0.079908,0.0,0.002341,-9.6e-05,0.003409,0.000379


In [4]:
relative_improvement_1to4

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,adult,0.026895,0.167538,0.0,0.415541,-0.002199,0.186,0.015728
binary,amazon_employee_access,-0.765466,1.366819,0.0,0.154336,0.026384,-0.232534,0.059223
binary,apsfailure,0.034605,2.029111,0.0,-0.036983,0.055992,0.147436,0.077011
binary,australian,-0.01764,0.862018,0.0,-0.444928,-0.099936,0.459475,-0.254202
binary,bank-marketing,-0.046942,9.978517,0.0,-0.001601,-0.023957,0.061905,0.008488
binary,blood-transfusion,0.800527,0.143492,0.0,1.011238,-0.301916,-2.390622,-0.234402
binary,christine,0.202953,0.81485,0.0,-0.239226,-0.017995,0.752887,-0.055089
binary,credit-g,-0.018272,-1.170689,0.0,0.1269,-0.03901,-1.865691,-0.281324
binary,guiellermo,0.383669,-0.191418,0.0,0.295189,0.00421,4.191772,0.029022
binary,higgs,2.034228,11.803529,0.0,0.287767,-0.011956,0.425301,0.047201


In [5]:
improvement_4to8

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,airlines,-0.001536,0.026216,0.0,0.00031,0.0,0.000422,6.3e-05
binary,albert,-0.006743,,0.0,-0.002775,0.0,0.013498,0.000278
multiclass,covertype,0.016915,-2.29016,0.0,0.095561,0.0,0.050578,-0.061889
multiclass,dionis,-0.7608,0.99608,0.0,,0.0,,0.07045


In [6]:
relative_improvement_4to8

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,airlines,-0.211529,3.949472,0.0,0.04239,0.0,0.058388,0.009528
binary,albert,-0.900901,,0.0,-0.362527,0.0,1.86367,0.037667
multiclass,covertype,13.972295,-142.712215,0.0,37.013467,0.0,32.058059,-62.228769
multiclass,dionis,-22.648654,25.680504,0.0,,0.0,,6.481558


In [7]:
scores_1h

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,adult,0.929528,0.907855,0.5,0.92578,0.909396,0.92742,0.909231
binary,amazon_employee_access,0.855949,0.809032,0.5,0.879249,0.864145,0.86955,0.862834
binary,apsfailure,0.991173,0.964659,0.5,0.992338,0.991212,0.990257,0.990772
binary,australian,0.935352,0.929447,0.5,0.939702,0.936597,0.931933,0.933904
binary,bank-marketing,0.937332,0.826706,0.5,0.93707,0.930829,0.933684,0.930685
binary,blood-transfusion,0.757376,0.740807,0.5,0.756301,0.686283,0.724372,0.688562
binary,christine,0.829747,0.801988,0.5,0.825998,0.80578,0.813402,0.809603
binary,credit-g,0.782619,0.752548,0.5,0.788809,0.794667,0.786143,0.795524
binary,guiellermo,0.901298,0.878182,0.5,0.909924,0.902647,0.819224,0.902757
binary,higgs,0.793323,0.676984,0.5,0.813504,0.802973,0.80155,0.802942


In [8]:
scores_4h

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,adult,0.929778,0.909376,0.5,0.929627,0.909376,0.929145,0.909374
binary,airlines,0.726142,0.663785,0.5,0.731307,0.660767,0.722753,0.661191
binary,albert,0.748473,,0.5,0.76546,0.738157,0.72427,0.738038
binary,amazon_employee_access,0.849397,0.82009,0.5,0.880606,0.864373,0.867528,0.863345
binary,apsfailure,0.991516,0.984233,0.5,0.991971,0.991767,0.991717,0.991535
binary,australian,0.935187,0.937459,0.5,0.935521,0.935661,0.936215,0.93153
binary,bank-marketing,0.936892,0.909199,0.5,0.937055,0.930606,0.934262,0.930764
binary,blood-transfusion,0.763439,0.74187,0.5,0.763949,0.684211,0.707055,0.686948
binary,christine,0.831431,0.808523,0.5,0.824022,0.805635,0.819526,0.809157
binary,credit-g,0.782476,0.743738,0.5,0.78981,0.794357,0.771476,0.793286


In [9]:
scores_8h

Unnamed: 0_level_0,Unnamed: 1_level_0,autosklearn,autoweka,constantpredictor,h2oautoml,randomforest,tpot,tunedrandomforest
type,task,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
binary,airlines,0.724606,0.690001,0.5,0.731617,0.660767,0.723175,0.661254
binary,albert,0.74173,,0.5,0.762685,0.738157,0.737768,0.738316
multiclass,covertype,-0.104146,-3.8949,-1.20516,-0.162618,-0.161368,-0.107192,-0.161343
multiclass,dionis,-4.11994,-2.88266,-5.85739,-1.66178,-1.07764,-1.36118,-1.01648
