# Experiment

### Vorbereitung

In [1]:
import pandas as pd
import numpy as np
import time

import experiment
from imputer import *

In [2]:
t0 = time.time()
results = []
base, scaler = experiment.reset_base(return_scaler=True)

In [3]:
functions =  {'Backfill':impute_backfill, 'Overall Mean':impute_overall_means, 
              'Yearly Mean':impute_yearly_means, 'Yearly Mean per Region':impute_yearly_means_per_region, 
              'Interpolate 3':interpolate3, 'Interpolate all':interpolate_all, 
              'ICE 1':iterative_imputer1, 'ICE 2':iterative_imputer2, 
              'ICE 3':iterative_imputer3, 'MICE 1':mice_imputer, 'MICE 2':mice_imputer2, 
              'KNN 1':knn_imputer1, 'KNN 2':knn_imputer2
             }

In [4]:
def run_all(frac):
    
    #getting n different training sets
    cords_list =[]
    n = 7
    for i in np.arange(1,n+1):
        cords_list.append(experiment.get_cords(frac, i))
    
    #setting up two dictionaries to save detailed and averaged results
    detailed_results = {}   
    results = {}
         
    #itterating over dictionary of all imputers
    for name, func in functions.items():
        func_runs = []
        print(name)
        
        #running each imputer n times on different training sets
        for count, cords in enumerate(cords_list):            
            print(f'run: {count+1}/{n}')
            
            #running current imputer and timeing runtime
            t0 = time.time()
            df= func(experiment.reset_train(cords)) 
            t1 = time.time()
            t = t1-t0
            
            #evaluating run
            func_runs.append(experiment.evaluate(df, t, cords))
        
        #print evaluation result of all runs of current imputer
        print(func_runs)
        print ('')
        
        #save detailed and averaged results
        detailed_results[name] = func_runs
        results[name] = np.mean(np.array(func_runs), axis=0)
        
    return results, detailed_results


### Durchlauf mit 3% fehlenden Werten

In [5]:
r1, r1_detail = run_all(0.03)

Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Backfill
run: 1/7
r2: 0.9937039221729441, rmse: 0.007707057811487927, t: 0.526526927947998

run: 2/7
r2: 0.9657391810107668, rmse: 0.10555221815029571, t: 0.5235934257507324

run: 3/7
r2: 0.9766604006765891, rmse: 0.056011491920483096, t: 0.5210199356079102

run: 4/7
r2: 0.9501189660444422, rmse: 0.11902912409462993, t: 0.5325300693511963

run: 5/7
r2: 0.9831429735684615, rmse: 0.19290286081367014, t: 0.5321474075317383

run: 6/7
r2: 0.9573375292925177, rmse: 0.3128308878879232, t: 0.5290226936340332

run: 7/7
r2: 0.9933442360232246, rmse: 0.24392357863946923, t: 0.5255281925201416

[[0.9937039221729441, 0.007707057811487927, 13



r2: 0.9886141004811781, rmse: 0.010133741302042107, t: 9.179530382156372

run: 2/7




r2: 0.9969938797064417, rmse: 0.03264245109172732, t: 9.073166847229004

run: 3/7




r2: 0.9823856956727524, rmse: 0.04749377870979146, t: 9.072300434112549

run: 4/7




r2: 0.9443952112833709, rmse: 0.12301500835650132, t: 10.130785465240479

run: 5/7




r2: 0.9930012149058882, rmse: 0.1214447328042551, t: 9.454391956329346

run: 6/7




r2: 0.9904658215291421, rmse: 0.14477207716361423, t: 11.017295837402344

run: 7/7




r2: 0.997505666086807, rmse: 0.14564247211583412, t: 10.64597201347351

[[0.9886141004811781, 0.010133741302042107, 0, 9.179530382156372], [0.9969938797064417, 0.03264245109172732, 0, 9.073166847229004], [0.9823856956727524, 0.04749377870979146, 0, 9.072300434112549], [0.9443952112833709, 0.12301500835650132, 0, 10.130785465240479], [0.9930012149058882, 0.1214447328042551, 0, 9.454391956329346], [0.9904658215291421, 0.14477207716361423, 0, 11.017295837402344], [0.997505666086807, 0.14564247211583412, 0, 10.64597201347351]]

ICE 2
run: 1/7
r2: 0.5788132288656755, rmse: 0.06163444660307302, t: 25.72673773765564

run: 2/7
r2: 0.9669299390486221, rmse: 0.10826724408166427, t: 25.982272624969482

run: 3/7
r2: 0.9348462881281402, rmse: 0.09134263970608068, t: 25.75723433494568

run: 4/7
r2: 0.3956973498698034, rmse: 0.40553584987931257, t: 29.61709451675415

run: 5/7
r2: 0.9768823216404493, rmse: 0.22071886952704878, t: 24.831433057785034

run: 6/7
r2: 0.9907854500471703, rmse: 0.14232468502



r2: -5.782937969962195, rmse: 0.24734040215576422, t: 80.21087527275085

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0799033982078504e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3494085481130412.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2488735646459102.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1014003086131140.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 268048955391033.06, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 151926253175668.94, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 238513876110891.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 497983705317007.7, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 289017147183020.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 355915452226243.3, scaled tolerance: 35084726045503.402 




r2: 0.8897214921707376, rmse: 0.19770835602778117, t: 81.35544657707214

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.995283345381666e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3000719520796107.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2498691031340111.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 787375027349655.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 261874436794394.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 217340275140959.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 231966339084000.03, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3714339557724758.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2211213339885234.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 929528025057859.2, scaled tolerance: 35084726045503.402 




r2: 0.12720869040568894, rmse: 0.3343175560153587, t: 81.31389260292053

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.959707392362632e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4092070970867496.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1842634154554800.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 318120130042958.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 287910333739588.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 444642220331643.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 475390572175422.44, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 348760315019321.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 281276129282691.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 135337710363837.02, scaled tolerance: 35084726045503.402 




r2: 0.8058902562416488, rmse: 0.22984003078536086, t: 80.74026226997375

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.8701323059467836e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3529939060362759.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2449931491622516.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1481456827893229.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 661514257431716.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 377803906916290.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 146950100490097.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 134067335167841.78, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 98584070567759.1, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 78513110568461.44, scaled tolerance: 35084726045503.402 




r2: 0.05577804733072378, rmse: 1.410601694706969, t: 81.04362797737122

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.015818359427178e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3117744409768266.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2479185006035241.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 951416804686240.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 351753783539276.75, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 178252798348134.34, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 179445817035008.34, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 139763187913068.81, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 111221144977164.53, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 167509416466243.22, scaled tolerance: 35084726045503.402 




r2: 0.9808206153968652, rmse: 0.2053338267526176, t: 80.0068371295929

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9313439837575116e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2866807417925424.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2542088147042818.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1162880534806257.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 538236274919893.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3552899129990092.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2100823101805869.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 876634066136050.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 412874573773454.06, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 271586922977810.34, scaled tolerance: 35084726045503.402 




r2: 0.8884253662652009, rmse: 0.9740774313427364, t: 80.61836957931519

[[-5.782937969962195, 0.24734040215576422, 0, 80.21087527275085], [0.8897214921707376, 0.19770835602778117, 0, 81.35544657707214], [0.12720869040568894, 0.3343175560153587, 0, 81.31389260292053], [0.8058902562416488, 0.22984003078536086, 0, 80.74026226997375], [0.05577804733072378, 1.410601694706969, 0, 81.04362797737122], [0.9808206153968652, 0.2053338267526176, 0, 80.0068371295929], [0.8884253662652009, 0.9740774313427364, 0, 80.61836957931519]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.06
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.28
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.38
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.63
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.73
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.80
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.90
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.21
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.40
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.50
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.59
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.64
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.74
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.81
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.12
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.30
[IterativeImputer] Ending imputation round 4

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.85
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.31
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.53
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.58
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.66
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.73
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending i

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.75
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.92
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.29
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.25
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.46
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.80
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.01
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.13
[IterativeImputer] Ending imputation round 6/10, elapsed time 7.24
[IterativeImputer] Ending imputation round 7/10, elapsed time 8.38
[IterativeImputer] Ending imputation round 8/10, elapsed time 9.49
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.58
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.70
Imputation round 9/12
[IterativeImputer] C

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.50
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.57
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.78
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.88
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.06
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.20
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.29
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.37
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.55
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.65
[IterativeImputer] Ending imputation round 9/

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.30
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.40
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.58
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.76
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.84
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.42
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.51
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.51
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.58
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.75
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.81
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.46
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.08
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.68
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.27
[IterativeImputer] Ending imputation round 8/10, elapsed time 68.93
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.85
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.55
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.47
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.75
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.31
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.04
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.85
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.58
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.22
[IterativeImputer] Ending imputation round 3/10, elapsed time 26.07
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.84
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.71
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.48
[IterativeImputer] Ending imputation round 7/10, elapsed time 61.43
[IterativeImputer] Ending imputation round 8/10, elapsed time 70.22
[IterativeImputer] Ending imputation round 9/10, elapsed time 79.05
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.81
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.60
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.76
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 69.46
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.11
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.70
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.65
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.33
[IterativeImputer] Ending imputation round 3/10, elapsed time 26.06
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.86
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.57
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.39
[IterativeImputer] Ending imputation round 7/10, elapsed time 61.11
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.83
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.61
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.31
Imputation round 5/5
[IterativeImp

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.54
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.13
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.93
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.63
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.31
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.10
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.87
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.48
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.08
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.74
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.45
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.21
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.95
[IterativeImputer] Ending imputatio

In [6]:
r1 = pd.DataFrame(r1).T
r1

Unnamed: 0,0,1,2,3
Backfill,0.974292,0.14828,135535.571429,0.527196
Overall Mean,-5.962344,1.241624,0.0,0.765108
Yearly Mean,-0.355261,1.067552,52298.0,0.603498
Yearly Mean per Region,-1.183785,1.088632,58248.428571,0.722327
Interpolate 3,0.997193,0.043241,134354.571429,2.499423
Interpolate all,0.997194,0.043126,112679.285714,1.776762
ICE 1,0.984766,0.089306,0.0,9.796206
ICE 2,0.809815,0.321516,0.0,25.856708
ICE 3,-0.290728,0.514174,0.0,80.755616
MICE 1,0.988975,0.065806,0.0,132.21311


In [7]:
r1_detail = pd.DataFrame(pd.DataFrame(r1_detail).T.stack().to_dict()).T
r1_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r1_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,0.993704,0.007707,135530.0,0.526527
Backfill,1,0.965739,0.105552,135514.0,0.523593
Backfill,2,0.976660,0.056011,135555.0,0.521020
Backfill,3,0.950119,0.119029,135512.0,0.532530
Backfill,4,0.983143,0.192903,135536.0,0.532147
...,...,...,...,...,...
KNN 2,2,-0.233679,0.397471,0.0,17.035321
KNN 2,3,-20.034245,2.392575,0.0,17.116524
KNN 2,4,0.125150,1.357795,0.0,17.111814
KNN 2,5,-15.411109,6.006371,0.0,17.061632


### Durchlauf mit 5% fehlenden Werten

In [8]:
r2 , r2_detail =  run_all(0.05)

Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Backfill
run: 1/7
r2: 0.9955395119500975, rmse: 0.1861136671230279, t: 0.7944169044494629

run: 2/7
r2: 0.9527099134718778, rmse: 0.1345692633962322, t: 0.7894420623779297

run: 3/7
r2: 0.9763782188141665, rmse: 0.09655187044651366, t: 0.7956225872039795

run: 4/7
r2: 0.9821806209292083, rmse: 0.07169457597353222, t: 0.7859370708465576

run: 5/7
r2: 0.9919133372286484, rmse: 0.30785394825052304, t: 0.792574405670166

run: 6/7
r2: 0.9731047056590749, rmse: 0.11202481252411967, t: 0.7877082824707031

run: 7/7
r2: 0.9555658812117589, rmse: 0.1250581475259366, t: 0.7917881011962891

[[0.9955395119500975, 0.1861136671230279, 135735, 



r2: 0.9942158016960598, rmse: 0.20756410705991854, t: 9.504182815551758

run: 2/7




r2: 0.7827329807258437, rmse: 0.2820413273792655, t: 9.342730283737183

run: 3/7




r2: 0.988236531487906, rmse: 0.06661977159134161, t: 9.413074254989624

run: 4/7




r2: 0.9877198111831341, rmse: 0.1761993484346218, t: 9.372396469116211

run: 5/7




r2: 0.9908166506864295, rmse: 0.320979945536532, t: 9.33663558959961

run: 6/7




r2: 0.979276661097969, rmse: 0.09625406608467339, t: 9.279404878616333

run: 7/7




r2: 0.9885215254972911, rmse: 0.062270014150689196, t: 9.349469423294067

[[0.9942158016960598, 0.20756410705991854, 0, 9.504182815551758], [0.7827329807258437, 0.2820413273792655, 0, 9.342730283737183], [0.988236531487906, 0.06661977159134161, 0, 9.413074254989624], [0.9877198111831341, 0.1761993484346218, 0, 9.372396469116211], [0.9908166506864295, 0.320979945536532, 0, 9.33663558959961], [0.979276661097969, 0.09625406608467339, 0, 9.279404878616333], [0.9885215254972911, 0.062270014150689196, 0, 9.349469423294067]]

ICE 2
run: 1/7
r2: 0.897000119367959, rmse: 0.8758889134010717, t: 22.816221237182617

run: 2/7
r2: 0.9664793394870981, rmse: 0.1107827472103113, t: 22.684454202651978

run: 3/7
r2: 0.8501371093540149, rmse: 0.2377839268308384, t: 22.771201610565186

run: 4/7
r2: 0.965367564984733, rmse: 0.29589885856832354, t: 22.68521499633789

run: 5/7
r2: 0.9533613958864062, rmse: 0.7233527197482782, t: 22.816636562347412

run: 6/7
r2: 0.9615302098800056, rmse: 0.13114421213306895, t



r2: 0.6724652756518652, rmse: 1.5619220044933946, t: 80.57109236717224

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.042905975534203e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2952750620995729.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2637618919460105.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 839975951480219.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 416741465011542.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 206536252721299.34, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 257581722062894.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3676756867963236.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2184993869866275.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3531016219250393.0, scaled tolerance: 35084726045503.402 




r2: 0.8649439154415968, rmse: 0.22236832474634613, t: 81.04388475418091

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0843589729908572e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1979474405978225.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2801112307662757.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1574030763879201.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 970053503110370.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 444197716419550.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 120489078070655.97, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 250815913508324.62, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 334711927449455.7, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 169377876238841.16, scaled tolerance: 35084726045503.402 




r2: 0.4368929726829536, rmse: 0.4609256913736006, t: 80.53303623199463

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 4.07467735367784e+16, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 1722959034065735.5, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 2090673085752552.0, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 1048890708859029.4, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 477907701737168.3, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 247554233211173.34, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 186004828520420.94, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 115911094752149.7, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 4551435341310723.0, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 2950508177613738.0, scaled tolerance: 24412569472460.902 




r2: 0.7933548811158273, rmse: 0.7227936884335278, t: 81.29315876960754

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9978395215752304e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3003152652961603.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2710129489422781.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1503311021595322.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 637890235948702.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 193512071993254.84, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 95235849980947.98, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3799024907012754.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2165780169160924.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 758361314303099.8, scaled tolerance: 35084726045503.402 




r2: 0.7509497996987184, rmse: 1.6715554758531586, t: 82.13223910331726

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9776192030081652e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3044979293280502.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2763841100172785.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1362571378206143.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 661720887075584.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 564051005975988.1, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 282493180047003.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 258287355201001.56, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 317856899116435.44, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 207792200045378.66, scaled tolerance: 35084726045503.402 




r2: 0.7683567367590791, rmse: 0.32180964561497843, t: 82.66263222694397

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0226885580187016e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2379627034227580.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3225907214873371.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1411027095596911.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 620877603659269.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 207785870209439.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 99800251007646.69, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 266273218000688.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 300535847821599.75, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4243503242538099.0, scaled tolerance: 35084726045503.402 




r2: 0.925267046972088, rmse: 0.15888867713223276, t: 82.23351550102234

[[0.6724652756518652, 1.5619220044933946, 0, 80.57109236717224], [0.8649439154415968, 0.22236832474634613, 0, 81.04388475418091], [0.4368929726829536, 0.4609256913736006, 0, 80.53303623199463], [0.7933548811158273, 0.7227936884335278, 0, 81.29315876960754], [0.7509497996987184, 1.6715554758531586, 0, 82.13223910331726], [0.7683567367590791, 0.32180964561497843, 0, 82.66263222694397], [0.925267046972088, 0.15888867713223276, 0, 82.23351550102234]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.28
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.38
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.55
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.63
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.69
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.78
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.04
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.13
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.21
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.31
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.54
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.62
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.71
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.81
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.13
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.84
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.32
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.50
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.61
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.69
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.86
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending i

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.69
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.78
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.86
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.55
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.63
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.74
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.80
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.92
Imputation round 9/12
[IterativeImputer] Co

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.56
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.75
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.83
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.42
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.51
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.59
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.42
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.60
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.76
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.82
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.38
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.45
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.30
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.36
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.45
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.51
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.74
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.86
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.28
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.49
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.24
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.79
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.65
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.29
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.86
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.61
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.50
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.10
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.67
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.23
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.91
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.41
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.59
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.86
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.48
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.18
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.92
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.65
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.33
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.20
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.92
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.55
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.78
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 70.04
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.78
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.53
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.75
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.39
[IterativeImputer] Ending imputation round 3/10, elapsed time 26.11
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.79
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.51
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.18
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.89
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.45
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.22
Imputation round 5/5
[IterativeImp

[IterativeImputer] Ending imputation round 3/10, elapsed time 25.81
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.63
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.41
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.15
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.87
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.65
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.38
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.11
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.61
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 26.12
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.74
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.38
[IterativeImputer] Ending imputatio

In [9]:
r2 = pd.DataFrame(r2).T
r2

Unnamed: 0,0,1,2,3
Backfill,0.975342,0.147695,135735.285714,0.79107
Overall Mean,-0.37569,1.520351,0.0,1.031946
Yearly Mean,0.003883,1.443118,52298.0,0.867196
Yearly Mean per Region,-0.037073,1.459472,58352.714286,0.975353
Interpolate 3,0.986653,0.099497,134538.0,2.879262
Interpolate all,0.986653,0.099293,112822.0,2.0982
ICE 1,0.958789,0.173133,0.0,9.371128
ICE 2,0.936942,0.35486,0.0,22.787866
ICE 3,0.744604,0.731466,0.0,81.495651
MICE 1,0.961106,0.190552,0.0,131.261402


In [10]:
r2_detail = pd.DataFrame(pd.DataFrame(r2_detail).T.stack().to_dict()).T
r2_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r2_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,0.995540,0.186114,135735.0,0.794417
Backfill,1,0.952710,0.134569,135759.0,0.789442
Backfill,2,0.976378,0.096552,135763.0,0.795623
Backfill,3,0.982181,0.071695,135732.0,0.785937
Backfill,4,0.991913,0.307854,135733.0,0.792574
...,...,...,...,...,...
KNN 2,2,0.018198,0.608622,0.0,17.644920
KNN 2,3,0.039752,1.558094,0.0,17.660501
KNN 2,4,0.365186,2.668704,0.0,17.362485
KNN 2,5,-0.009893,0.671935,0.0,17.547829


### Durchlauf mit 10% fehlenden Werten

In [11]:
r3, r3_detail = run_all(0.1)

Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Backfill
run: 1/7
r2: 0.9274609546179627, rmse: 0.13999037811409296, t: 1.4602751731872559

run: 2/7
r2: 0.9455969962686308, rmse: 0.23338382688988088, t: 1.453249216079712

run: 3/7
r2: 0.988973607471802, rmse: 0.09433324875288353, t: 1.4485344886779785

run: 4/7
r2: 0.9871014885095162, rmse: 0.1274737073886282, t: 1.448564052581787

run: 5/7
r2: 0.978704659862762, rmse: 0.14079264643449055, t: 1.4496948719024658

run: 6/7
r2: 0.9594305188150599, rmse: 0.13362401808881974, t: 1.448211908340454

run: 7/7
r2: 0.9653888552652197, rmse: 0.21176762112988018, t: 1.457254409790039

[[0.9274609546179627, 0.139990378114092



r2: 0.9370202334659707, rmse: 0.12777336992410396, t: 10.01151418685913

run: 2/7




r2: 0.9521427024799756, rmse: 0.2140660895293748, t: 9.965301752090454

run: 3/7




r2: 0.9893949691492818, rmse: 0.09044214578504266, t: 9.933764219284058

run: 4/7




r2: 0.9872547817984083, rmse: 0.1239430322939622, t: 9.928513288497925

run: 5/7




r2: 0.9145067510943837, rmse: 0.27554462283829784, t: 10.028450012207031

run: 6/7




r2: 0.9744614263853603, rmse: 0.10397455368644115, t: 9.976807355880737

run: 7/7




r2: 0.9592018246489338, rmse: 0.2262877530362623, t: 10.002170085906982

[[0.9370202334659707, 0.12777336992410396, 0, 10.01151418685913], [0.9521427024799756, 0.2140660895293748, 0, 9.965301752090454], [0.9893949691492818, 0.09044214578504266, 0, 9.933764219284058], [0.9872547817984083, 0.1239430322939622, 0, 9.928513288497925], [0.9145067510943837, 0.27554462283829784, 0, 10.028450012207031], [0.9744614263853603, 0.10397455368644115, 0, 9.976807355880737], [0.9592018246489338, 0.2262877530362623, 0, 10.002170085906982]]

ICE 2
run: 1/7
r2: 0.9353924573529703, rmse: 0.12941405261701314, t: 23.349486589431763

run: 2/7
r2: 0.9754346077997191, rmse: 0.1533683133456013, t: 23.46217703819275

run: 3/7
r2: 0.9360508486955306, rmse: 0.22209167631387725, t: 23.23794913291931

run: 4/7
r2: 0.9788027743296512, rmse: 0.1598409276001701, t: 23.801782608032227

run: 5/7
r2: 0.9654162535346161, rmse: 0.17525162313588508, t: 23.26524066925049

run: 6/7
r2: 0.9480526821327732, rmse: 0.14828946922440



r2: 0.8656510287868295, rmse: 0.18661949011636286, t: 82.30011439323425

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0793701416671844e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1965670947388250.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2055781807062901.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1202414568308490.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 693042073549476.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 378724405818521.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 255856467206931.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 267666823038194.47, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 154395120361844.72, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 148140249946584.5, scaled tolerance: 35084726045503.402 




r2: 0.7873761250218165, rmse: 0.4512111309121132, t: 80.98962163925171

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.767695010894046e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2215172710472481.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1272751790088711.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1112711149673679.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 802807918332657.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 493386041322739.56, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 430603857658830.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 332478603549620.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 342605605246312.56, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 441335845081200.56, scaled tolerance: 35084726045503.402 




r2: 0.6804537315552623, rmse: 0.4964571441735188, t: 81.57783102989197

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9054460292016464e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2686861492950140.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2020346442314162.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 966537983426960.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 582942911181494.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 420352635594125.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 330099304310940.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 358375333903242.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3634484630414166.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1767168676599967.5, scaled tolerance: 35084726045503.402 




r2: 0.47922093799031384, rmse: 0.7922736954811134, t: 81.66539025306702

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.846033471882781e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2443889493057179.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1118613781447626.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1656357204430435.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1009176985672603.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 559421305245813.94, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 312335935597925.06, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 220725728023061.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 164621507370038.3, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 82701702766819.66, scaled tolerance: 35084726045503.402 




r2: 0.8722507778212176, rmse: 0.3368256541499248, t: 81.75665307044983

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.8294474367208748e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4139629907362432.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 390103240320452.3, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 480200889998486.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 261830544332400.75, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 189086282259717.12, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 377920233300190.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 194047129613484.97, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 169979398971228.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 227898838726431.8, scaled tolerance: 35084726045503.402 




r2: 0.7763818916299724, rmse: 0.30766793089303923, t: 81.13509631156921

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.854918039445052e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2409759074863166.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2223436743873453.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1238625108794931.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 920819527831711.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 691382610454438.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 307868855775374.7, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4257137278737354.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2379071200736785.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3091248674431410.5, scaled tolerance: 35084726045503.402 




r2: 0.8564627437700868, rmse: 0.4244465423647631, t: 82.04906010627747

[[0.8656510287868295, 0.18661949011636286, 0, 82.30011439323425], [0.7873761250218165, 0.4512111309121132, 0, 80.98962163925171], [0.6804537315552623, 0.4964571441735188, 0, 81.57783102989197], [0.47922093799031384, 0.7922736954811134, 0, 81.66539025306702], [0.8722507778212176, 0.3368256541499248, 0, 81.75665307044983], [0.7763818916299724, 0.30766793089303923, 0, 81.13509631156921], [0.8564627437700868, 0.4244465423647631, 0, 82.04906010627747]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.21
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.30
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.37
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.30
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.43
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.51
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.56
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.64
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.73
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.26
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.05
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.20
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.29
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.37
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.52
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.59
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.65
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.76
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.82
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.28
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.57
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.63
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.73
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.80
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending i

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.94
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.16
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.34
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.51
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.70
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.88
[IterativeImputer] Ending imputation round 6/10, elapsed time 7.08
[IterativeImputer] Ending imputation round 7/10, elapsed time 8.20
[IterativeImputer] Ending imputation round 8/10, elapsed time 9.39
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.52
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.67
Imputation round 9/12
[IterativeImputer] C

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.58
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.75
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.97
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.14
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.22
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.52
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.56
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.65
[IterativeImputer] Ending imputation round 9/

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.29
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.46
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.53
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.59
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.66
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.76
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.19
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.29
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.36
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.11
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.19
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.27
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.36
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.42
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.53
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.60
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.67
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.74
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.13
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.31
[IterativeImputer] Ending imputation round 5/

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.26
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.85
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.33
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.17
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.93
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.77
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.53
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.83
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.41
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.05
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.78
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.40
[IterativeImputer] Ending imputation round 2/10, elapsed time 16.99
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.60
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.25
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.87
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.52
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.27
[IterativeImputer] Ending imputation round 8/10, elapsed time 68.91
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.56
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.29
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.47
[IterativeImputer] Ending imputation round 2/10, elapsed time 16.94
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.48
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 69.38
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.21
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.06
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.53
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.00
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.53
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.11
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.85
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.27
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.01
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.65
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.39
Imputation round 5/5
[IterativeImp

[IterativeImputer] Ending imputation round 3/10, elapsed time 25.74
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.41
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.07
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.73
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.31
[IterativeImputer] Ending imputation round 8/10, elapsed time 68.90
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.57
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.34
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.56
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.72
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.50
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.23
[IterativeImputer] Ending imputatio

In [12]:
r3 = pd.DataFrame(r3).T
r3

Unnamed: 0,0,1,2,3
Backfill,0.964665,0.154481,136315.285714,1.452255
Overall Mean,-0.395046,1.014262,0.0,1.691577
Yearly Mean,0.006562,0.877928,52320.571429,1.528007
Yearly Mean per Region,-0.04767,0.899047,58597.428571,1.634522
Interpolate 3,0.993325,0.070422,135062.142857,3.706281
Interpolate all,0.993325,0.070246,113218.571429,2.833818
ICE 1,0.95914,0.166005,0.0,9.978074
ICE 2,0.958234,0.16959,0.0,23.394707
ICE 3,0.759685,0.427929,0.0,81.63911
MICE 1,0.969067,0.143948,0.0,131.948982


In [13]:
r3_detail = pd.DataFrame(pd.DataFrame(r3_detail).T.stack().to_dict()).T
r3_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r3_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,0.927461,0.139990,136318.0,1.460275
Backfill,1,0.945597,0.233384,136383.0,1.453249
Backfill,2,0.988974,0.094333,136254.0,1.448534
Backfill,3,0.987101,0.127474,136287.0,1.448564
Backfill,4,0.978705,0.140793,136382.0,1.449695
...,...,...,...,...,...
KNN 2,2,-0.010297,0.882753,0.0,18.724982
KNN 2,3,0.173781,0.997921,0.0,18.725665
KNN 2,4,0.177441,0.854692,0.0,18.820452
KNN 2,5,0.198567,0.582455,0.0,18.844070


### Imputationverfahren auf Originaldatensatz anwenden

In [14]:
for name, func in functions.items():
    print(name)
    
    #impute original (scaled) dataset
    t0 = time.time()
    df= func(experiment.reset_base()) 
    t1 = time.time()
    t = t1-t0
    
    #rescale to original proportions
    df = scaler.inverse_transform(df)

    print(f'{round(t, 2)}s vergangen')
    print('')
    df.to_csv(f'additional_data/imputed_sets/{name}.csv')

Backfill
0.14s vergangen

Overall Mean
0.39s vergangen

Yearly Mean
0.21s vergangen

Yearly Mean per Region
0.34s vergangen

Interpolate 3
2.05s vergangen

Interpolate all
1.36s vergangen

ICE 1




8.82s vergangen

ICE 2
21.91s vergangen

ICE 3
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0129401435894064e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3255302827643808.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2664174541478353.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 752792522498120.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4139741271714855.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2298800774032059.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1244198777526491.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1297247835266420.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3963777598111986.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2892682827217661.5, scaled tolerance: 35084726045503.402 
84.33s vergangen





MICE 1
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.35
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.41
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.51
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.58
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.73
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.83
Imputation round 2/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Endi

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.75
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.42
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.48
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.60
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.77
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.85
130.72s vergangen

MICE 2
Imputation round 1/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.72
[I

### Ergebnisse abspeichern

In [15]:
t1 = time.time()
t = t1-t0
print(f'complete runtime: {t/60}min')

comlete runtime: 0.2840871334075928min


In [16]:
sets = {'r1':r1, 'r1_detail':r1_detail,
       'r2':r2, 'r2_detail':r2_detail,
       'r3':r3, 'r3_detail':r3_detail,}
for name, df in sets.items():
    df.to_csv(f'additional_data/results/{name}.csv')