# Experiment

### Vorbereitung

In [1]:
import pandas as pd
import numpy as np
import time

import experiment
from imputer import *

In [2]:
t0 = time.time()
results = []
base = experiment.reset_base()

In [3]:
functions =  {'Backfill':impute_backfill, 'Overall Mean':impute_overall_means, 
              'Yearly Mean':impute_yearly_means, 'Yearly Mean per Region':impute_yearly_means_per_region, 
              'Interpolate 3':interpolate3, 'Interpolate all':interpolate_all, 
              'ICE 1':iterative_imputer1, 'ICE 2':iterative_imputer2, 
              'ICE 3':iterative_imputer3, 'MICE 1':mice_imputer, 'MICE 2':mice_imputer2, 
              'KNN 1':knn_imputer1, 'KNN 2':knn_imputer2
             }

In [4]:
def run_all(frac):
    
    #getting n different training sets
    cords_list =[]
    n = 7
    for i in np.arange(1,n+1):
        cords_list.append(experiment.get_cords(frac, i))
    
    #setting up two dictionaries to save detailed and averaged results
    detailed_results = {}   
    results = {}
         
    #itterating over dictionary of all imputers
    for name, func in functions.items():
        func_runs = []
        print(name)
        
        #running each imputer n times on different training sets
        for count, cords in enumerate(cords_list):            
            print(f'run: {count+1}/{n}')
            
            #running current imputer and timeing runtime
            t0 = time.time()
            df= func(experiment.reset_train(cords)) 
            t1 = time.time()
            t = t1-t0
            
            #evaluating run
            func_runs.append(experiment.evaluate(df, t, cords))
        
        #print evaluation result of all runs of current imputer
        print(func_runs)
        print ('')
        
        #save detailed and averaged results
        detailed_results[name] = func_runs
        results[name] = np.mean(np.array(func_runs), axis=0)
        
    return results, detailed_results


### Durchlauf mit 3% fehlenden Werten

In [5]:
r1, r1_detail = run_all(0.03)

Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Backfill
run: 1/7
r2: -144.98553218874548, rmse: 1.167481655589472, t: 0.5405552387237549

run: 2/7
r2: -0.4794096680065927, rmse: 0.7353749861467419, t: 0.5665717124938965

run: 3/7
r2: -0.8348683382262871, rmse: 0.49142181386145956, t: 0.543114423751831

run: 4/7
r2: -1.5797499946123539, rmse: 0.8520111068685011, t: 0.5720705986022949

run: 5/7
r2: -0.05550737513979409, rmse: 1.5157644139579278, t: 0.584585428237915

run: 6/7
r2: -1.6304125406906191, rmse: 2.4458919591067323, t: 0.583345890045166

run: 7/7
r2: 0.015980859403412206, rmse: 2.9284326026095235, t: 0.5673139095306396

[[-144.98553218874548, 1.167481655589472, 32550



r2: 0.9886141004811781, rmse: 0.010133741302042107, t: 9.176393508911133

run: 2/7




r2: 0.9969938797064417, rmse: 0.03264245109172732, t: 9.117773056030273

run: 3/7




r2: 0.9823856956727524, rmse: 0.04749377870979146, t: 9.058730840682983

run: 4/7




r2: 0.9443952112833709, rmse: 0.12301500835650132, t: 9.109863519668579

run: 5/7




r2: 0.9930012149058882, rmse: 0.1214447328042551, t: 9.141319751739502

run: 6/7




r2: 0.9904658215291421, rmse: 0.14477207716361423, t: 9.151404619216919

run: 7/7




r2: 0.997505666086807, rmse: 0.14564247211583412, t: 9.09156346321106

[[0.9886141004811781, 0.010133741302042107, 0, 9.176393508911133], [0.9969938797064417, 0.03264245109172732, 0, 9.117773056030273], [0.9823856956727524, 0.04749377870979146, 0, 9.058730840682983], [0.9443952112833709, 0.12301500835650132, 0, 9.109863519668579], [0.9930012149058882, 0.1214447328042551, 0, 9.141319751739502], [0.9904658215291421, 0.14477207716361423, 0, 9.151404619216919], [0.997505666086807, 0.14564247211583412, 0, 9.09156346321106]]

ICE 2
run: 1/7
r2: 0.5788132288656755, rmse: 0.06163444660307302, t: 22.373931884765625

run: 2/7
r2: 0.9669299390486221, rmse: 0.10826724408166427, t: 22.43480348587036

run: 3/7
r2: 0.9348462881281402, rmse: 0.09134263970608068, t: 22.371362447738647

run: 4/7
r2: 0.3956973498698034, rmse: 0.40553584987931257, t: 22.26173233985901

run: 5/7
r2: 0.9768823216404493, rmse: 0.22071886952704878, t: 22.406378507614136

run: 6/7
r2: 0.9907854500471703, rmse: 0.14232468502594



r2: -5.782937969962195, rmse: 0.24734040215576422, t: 81.29945302009583

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0799033982078504e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3494085481130412.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2488735646459102.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1014003086131140.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 268048955391033.06, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 151926253175668.94, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 238513876110891.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 497983705317007.7, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 289017147183020.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 355915452226243.3, scaled tolerance: 35084726045503.402 




r2: 0.8897214921707376, rmse: 0.19770835602778117, t: 81.37644529342651

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.995283345381666e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3000719520796107.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2498691031340111.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 787375027349655.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 261874436794394.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 217340275140959.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 231966339084000.03, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3714339557724758.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2211213339885234.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 929528025057859.2, scaled tolerance: 35084726045503.402 




r2: 0.12720869040568894, rmse: 0.3343175560153587, t: 80.37357592582703

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.959707392362632e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4092070970867496.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1842634154554800.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 318120130042958.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 287910333739588.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 444642220331643.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 475390572175422.44, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 348760315019321.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 281276129282691.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 135337710363837.02, scaled tolerance: 35084726045503.402 




r2: 0.8058902562416488, rmse: 0.22984003078536086, t: 80.53988742828369

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.8701323059467836e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3529939060362759.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2449931491622516.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1481456827893229.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 661514257431716.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 377803906916290.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 146950100490097.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 134067335167841.78, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 98584070567759.1, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 78513110568461.44, scaled tolerance: 35084726045503.402 




r2: 0.05577804733072378, rmse: 1.410601694706969, t: 80.7481861114502

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.015818359427178e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3117744409768266.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2479185006035241.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 951416804686240.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 351753783539276.75, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 178252798348134.34, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 179445817035008.34, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 139763187913068.81, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 111221144977164.53, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 167509416466243.22, scaled tolerance: 35084726045503.402 




r2: 0.9808206153968652, rmse: 0.2053338267526176, t: 80.64609265327454

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9313439837575116e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2866807417925424.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2542088147042818.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1162880534806257.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 538236274919893.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3552899129990092.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2100823101805869.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 876634066136050.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 412874573773454.06, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 271586922977810.34, scaled tolerance: 35084726045503.402 




r2: 0.8884253662652009, rmse: 0.9740774313427364, t: 80.42581295967102

[[-5.782937969962195, 0.24734040215576422, 0, 81.29945302009583], [0.8897214921707376, 0.19770835602778117, 0, 81.37644529342651], [0.12720869040568894, 0.3343175560153587, 0, 80.37357592582703], [0.8058902562416488, 0.22984003078536086, 0, 80.53988742828369], [0.05577804733072378, 1.410601694706969, 0, 80.7481861114502], [0.9808206153968652, 0.2053338267526176, 0, 80.64609265327454], [0.8884253662652009, 0.9740774313427364, 0, 80.42581295967102]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.26
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.32
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.37
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.35
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.51
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.61
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.69
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.76
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.80
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.30
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.37
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.45
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.63
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.87
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.21
[IterativeImputer] Ending imputation round 4

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.80
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.39
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.45
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.61
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.70
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.78
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.87
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending i

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.63
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.70
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.78
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.32
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.38
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.45
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.53
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.61
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.71
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.78
Imputation round 9/12
[IterativeImputer] Co

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.61
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.77
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.83
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.28
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.37
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.43
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.52
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.60
[IterativeImputer] Ending imputation round 9/

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.59
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.75
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.84
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.41
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.26
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.42
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.58
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.74
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.82
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.30
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.54
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.22
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.88
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.46
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.09
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.91
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.61
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.52
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.93
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.51
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.29
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.07
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.51
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.09
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.94
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.71
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.64
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.38
[IterativeImputer] Ending imputation round 7/10, elapsed time 61.39
[IterativeImputer] Ending imputation round 8/10, elapsed time 70.28
[IterativeImputer] Ending imputation round 9/10, elapsed time 79.12
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.90
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.65
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.32
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.97
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 69.40
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.09
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.75
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.62
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.92
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.72
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.48
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.30
[IterativeImputer] Ending imputation round 7/10, elapsed time 61.11
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.86
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.69
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.45
Imputation round 5/5
[IterativeImp

[IterativeImputer] Ending imputation round 3/10, elapsed time 26.20
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.90
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.45
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.31
[IterativeImputer] Ending imputation round 7/10, elapsed time 61.05
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.85
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.94
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.89
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.64
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.26
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.91
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.61
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.36
[IterativeImputer] Ending imputatio

In [6]:
r1 = pd.DataFrame(r1).T
r1

Unnamed: 0,0,1,2,3
Backfill,-21.364214,1.448054,32527.0,0.565365
Overall Mean,-5.962344,1.241624,0.0,0.820471
Yearly Mean,-0.355261,1.067552,52298.0,0.635217
Yearly Mean per Region,-1.183785,1.088632,58248.428571,0.736686
Interpolate 3,-10.35088,1.327611,32557.857143,0.612619
Interpolate all,-10.352888,1.305378,59.428571,0.593553
ICE 1,0.984766,0.089306,0.0,9.121007
ICE 2,0.809815,0.321516,0.0,22.380427
ICE 3,-0.290728,0.514174,0.0,80.772779
MICE 1,0.988975,0.065806,0.0,131.155067


In [7]:
r1_detail = pd.DataFrame(pd.DataFrame(r1_detail).T.stack().to_dict()).T
r1_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r1_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,-144.985532,1.167482,32550.0,0.540555
Backfill,1,-0.479410,0.735375,32521.0,0.566572
Backfill,2,-0.834868,0.491422,32510.0,0.543114
Backfill,3,-1.579750,0.852011,32521.0,0.572071
Backfill,4,-0.055507,1.515764,32519.0,0.584585
...,...,...,...,...,...
KNN 2,2,-0.233679,0.397471,0.0,17.000751
KNN 2,3,-20.034245,2.392575,0.0,17.015642
KNN 2,4,0.125150,1.357795,0.0,17.030557
KNN 2,5,-15.411109,6.006371,0.0,16.973309


### Durchlauf mit 5% fehlenden Werten

In [8]:
r2 , r2_detail =  run_all(0.05)

Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Backfill
run: 1/7
r2: -0.2630386067986965, rmse: 3.1264580984032304, t: 0.7864000797271729

run: 2/7
r2: -2.77533240911633, rmse: 1.1896157293266358, t: 0.794287919998169

run: 3/7
r2: -1.688280205196218, rmse: 1.0226797653748734, t: 0.7923393249511719

run: 4/7
r2: -0.6672076075877178, rmse: 2.085863590967128, t: 0.7887966632843018

run: 5/7
r2: -0.07720522781720884, rmse: 3.533882957257935, t: 0.7867903709411621

run: 6/7
r2: -5.6191599013569355, rmse: 1.7468428288779958, t: 0.7876796722412109

run: 7/7
r2: -3.5433278053623427, rmse: 1.259265501149907, t: 0.7907960414886475

[[-0.2630386067986965, 3.1264580984032304, 32924, 0.



r2: 0.9942158016960598, rmse: 0.20756410705991854, t: 9.396286249160767

run: 2/7




r2: 0.7827329807258437, rmse: 0.2820413273792655, t: 9.336734771728516

run: 3/7




r2: 0.988236531487906, rmse: 0.06661977159134161, t: 9.326533555984497

run: 4/7




r2: 0.9877198111831341, rmse: 0.1761993484346218, t: 9.349674224853516

run: 5/7




r2: 0.9908166506864295, rmse: 0.320979945536532, t: 9.359977960586548

run: 6/7




r2: 0.979276661097969, rmse: 0.09625406608467339, t: 9.41997766494751

run: 7/7




r2: 0.9885215254972911, rmse: 0.062270014150689196, t: 9.39787244796753

[[0.9942158016960598, 0.20756410705991854, 0, 9.396286249160767], [0.7827329807258437, 0.2820413273792655, 0, 9.336734771728516], [0.988236531487906, 0.06661977159134161, 0, 9.326533555984497], [0.9877198111831341, 0.1761993484346218, 0, 9.349674224853516], [0.9908166506864295, 0.320979945536532, 0, 9.359977960586548], [0.979276661097969, 0.09625406608467339, 0, 9.41997766494751], [0.9885215254972911, 0.062270014150689196, 0, 9.39787244796753]]

ICE 2
run: 1/7
r2: 0.897000119367959, rmse: 0.8758889134010717, t: 22.65574622154236

run: 2/7
r2: 0.9664793394870981, rmse: 0.1107827472103113, t: 22.78944683074951

run: 3/7
r2: 0.8501371093540149, rmse: 0.2377839268308384, t: 22.70345377922058

run: 4/7
r2: 0.965367564984733, rmse: 0.29589885856832354, t: 22.881284952163696

run: 5/7
r2: 0.9533613958864062, rmse: 0.7233527197482782, t: 22.841010570526123

run: 6/7
r2: 0.9615302098800056, rmse: 0.13114421213306895, t: 22



r2: 0.6724652756518652, rmse: 1.5619220044933946, t: 80.79265356063843

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.042905975534203e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2952750620995729.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2637618919460105.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 839975951480219.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 416741465011542.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 206536252721299.34, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 257581722062894.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3676756867963236.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2184993869866275.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3531016219250393.0, scaled tolerance: 35084726045503.402 




r2: 0.8649439154415968, rmse: 0.22236832474634613, t: 81.55274415016174

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0843589729908572e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1979474405978225.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2801112307662757.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1574030763879201.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 970053503110370.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 444197716419550.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 120489078070655.97, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 250815913508324.62, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 334711927449455.7, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 169377876238841.16, scaled tolerance: 35084726045503.402 




r2: 0.4368929726829536, rmse: 0.4609256913736006, t: 80.13306403160095

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 4.07467735367784e+16, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 1722959034065735.5, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 2090673085752552.0, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 1048890708859029.4, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 477907701737168.3, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 247554233211173.34, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 186004828520420.94, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 115911094752149.7, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 4551435341310723.0, scaled tolerance: 24412569472460.902 
[IterativeImputer] Change: 2950508177613738.0, scaled tolerance: 24412569472460.902 




r2: 0.7933548811158273, rmse: 0.7227936884335278, t: 81.66687202453613

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9978395215752304e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3003152652961603.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2710129489422781.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1503311021595322.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 637890235948702.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 193512071993254.84, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 95235849980947.98, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3799024907012754.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2165780169160924.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 758361314303099.8, scaled tolerance: 35084726045503.402 




r2: 0.7509497996987184, rmse: 1.6715554758531586, t: 82.1869146823883

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9776192030081652e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3044979293280502.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2763841100172785.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1362571378206143.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 661720887075584.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 564051005975988.1, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 282493180047003.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 258287355201001.56, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 317856899116435.44, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 207792200045378.66, scaled tolerance: 35084726045503.402 




r2: 0.7683567367590791, rmse: 0.32180964561497843, t: 82.54212212562561

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0226885580187016e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2379627034227580.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3225907214873371.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1411027095596911.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 620877603659269.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 207785870209439.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 99800251007646.69, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 266273218000688.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 300535847821599.75, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4243503242538099.0, scaled tolerance: 35084726045503.402 




r2: 0.925267046972088, rmse: 0.15888867713223276, t: 82.8696517944336

[[0.6724652756518652, 1.5619220044933946, 0, 80.79265356063843], [0.8649439154415968, 0.22236832474634613, 0, 81.55274415016174], [0.4368929726829536, 0.4609256913736006, 0, 80.13306403160095], [0.7933548811158273, 0.7227936884335278, 0, 81.66687202453613], [0.7509497996987184, 1.6715554758531586, 0, 82.1869146823883], [0.7683567367590791, 0.32180964561497843, 0, 82.54212212562561], [0.925267046972088, 0.15888867713223276, 0, 82.8696517944336]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.31
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.37
[IterativeImputer] Ending imputation round 6/1

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.40
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.59
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.76
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.84
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.26
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.14
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.41
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.59
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.69
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.77
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.83
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.87
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.26
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.61
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.70
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.88
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.12
[IterativeImputer] Ending i

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.67
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.75
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.82
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.24
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.52
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.60
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.70
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.77
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.88
Imputation round 9/12
[IterativeImputer] Co

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.60
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.76
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.86
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.06
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.15
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.41
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.55
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.65
[IterativeImputer] Ending imputation round 9/

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.30
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.38
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.54
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.65
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.72
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.82
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.37
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.35
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.43
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.47
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.57
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.64
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.74
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.81
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.20
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.35
[IterativeImputer] Ending imputation round 5/

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.42
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.07
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.64
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.48
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.10
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.68
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.51
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.51
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.81
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.98
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.53
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.53
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.19
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.81
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.45
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.19
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.91
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.75
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.49
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.41
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.09
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.52
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.32
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.95
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 70.20
[IterativeImputer] Ending imputation round 9/10, elapsed time 79.12
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.88
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.29
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.99
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.67
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.37
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.12
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.84
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.64
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.45
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.20
Imputation round 5/5
[IterativeImp

[IterativeImputer] Ending imputation round 3/10, elapsed time 25.79
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.56
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.38
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.06
[IterativeImputer] Ending imputation round 7/10, elapsed time 61.03
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.83
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.61
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.37
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.63
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.28
[IterativeImputer] Ending imputation round 3/10, elapsed time 26.11
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.69
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.33
[IterativeImputer] Ending imputatio

In [9]:
r2 = pd.DataFrame(r2).T
r2

Unnamed: 0,0,1,2,3
Backfill,-2.090507,1.994944,32841.0,0.789584
Overall Mean,-0.37569,1.520351,0.0,1.038475
Yearly Mean,0.003883,1.443118,52298.0,0.866701
Yearly Mean per Region,-0.037073,1.459472,58352.714286,0.978276
Interpolate 3,-0.821449,1.713417,32871.428571,0.858034
Interpolate all,-0.821336,1.685872,58.0,0.831332
ICE 1,0.958789,0.173133,0.0,9.36958
ICE 2,0.936942,0.35486,0.0,22.80914
ICE 3,0.744604,0.731466,0.0,81.677717
MICE 1,0.961106,0.190552,0.0,131.525383


In [10]:
r2_detail = pd.DataFrame(pd.DataFrame(r2_detail).T.stack().to_dict()).T
r2_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r2_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,-0.263039,3.126458,32924.0,0.786400
Backfill,1,-2.775332,1.189616,32825.0,0.794288
Backfill,2,-1.688280,1.022680,32824.0,0.792339
Backfill,3,-0.667208,2.085864,32841.0,0.788797
Backfill,4,-0.077205,3.533883,32828.0,0.786790
...,...,...,...,...,...
KNN 2,2,0.018198,0.608622,0.0,17.572790
KNN 2,3,0.039752,1.558094,0.0,17.616792
KNN 2,4,0.365186,2.668704,0.0,17.322385
KNN 2,5,-0.009893,0.671935,0.0,17.521255


### Durchlauf mit 10% fehlenden Werten

In [11]:
r3, r3_detail = run_all(0.1)

Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Backfill
run: 1/7
r2: -3.964219549140708, rmse: 1.1521878884113992, t: 1.4539918899536133

run: 2/7
r2: -1.8373707535864638, rmse: 1.6792466658151293, t: 1.4359464645385742

run: 3/7
r2: -1.9081389310564236, rmse: 1.5239926108614468, t: 1.4534881114959717

run: 4/7
r2: -0.8977876217879388, rmse: 1.5383638773729555, t: 1.4679749011993408

run: 5/7
r2: -1.1760918948068961, rmse: 1.4134849682042556, t: 1.4638822078704834

run: 6/7
r2: -6.042109199979188, rmse: 1.7577308194911425, t: 1.449491024017334

run: 7/7
r2: -0.965017536607846, rmse: 1.5948064365763108, t: 1.4459543228149414

[[-3.964219549140708, 1.152187888411



r2: 0.9370202334659707, rmse: 0.12777336992410396, t: 9.91875672340393

run: 2/7




r2: 0.9521427024799756, rmse: 0.2140660895293748, t: 10.007898092269897

run: 3/7




r2: 0.9893949691492818, rmse: 0.09044214578504266, t: 9.987415552139282

run: 4/7




r2: 0.9872547817984083, rmse: 0.1239430322939622, t: 9.972945928573608

run: 5/7




r2: 0.9145067510943837, rmse: 0.27554462283829784, t: 10.027352809906006

run: 6/7




r2: 0.9744614263853603, rmse: 0.10397455368644115, t: 9.958301782608032

run: 7/7




r2: 0.9592018246489338, rmse: 0.2262877530362623, t: 10.060387134552002

[[0.9370202334659707, 0.12777336992410396, 0, 9.91875672340393], [0.9521427024799756, 0.2140660895293748, 0, 10.007898092269897], [0.9893949691492818, 0.09044214578504266, 0, 9.987415552139282], [0.9872547817984083, 0.1239430322939622, 0, 9.972945928573608], [0.9145067510943837, 0.27554462283829784, 0, 10.027352809906006], [0.9744614263853603, 0.10397455368644115, 0, 9.958301782608032], [0.9592018246489338, 0.2262877530362623, 0, 10.060387134552002]]

ICE 2
run: 1/7
r2: 0.9353924573529703, rmse: 0.12941405261701314, t: 23.399222135543823

run: 2/7
r2: 0.9754346077997191, rmse: 0.1533683133456013, t: 23.687905073165894

run: 3/7
r2: 0.9360508486955306, rmse: 0.22209167631387725, t: 23.42537498474121

run: 4/7
r2: 0.9788027743296512, rmse: 0.1598409276001701, t: 23.590027570724487

run: 5/7
r2: 0.9654162535346161, rmse: 0.17525162313588508, t: 23.515063762664795

run: 6/7
r2: 0.9480526821327732, rmse: 0.148289469224



r2: 0.8656510287868295, rmse: 0.18661949011636286, t: 83.72660684585571

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0793701416671844e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1965670947388250.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2055781807062901.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1202414568308490.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 693042073549476.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 378724405818521.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 255856467206931.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 267666823038194.47, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 154395120361844.72, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 148140249946584.5, scaled tolerance: 35084726045503.402 




r2: 0.7873761250218165, rmse: 0.4512111309121132, t: 82.4126136302948

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.767695010894046e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2215172710472481.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1272751790088711.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1112711149673679.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 802807918332657.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 493386041322739.56, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 430603857658830.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 332478603549620.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 342605605246312.56, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 441335845081200.56, scaled tolerance: 35084726045503.402 




r2: 0.6804537315552623, rmse: 0.4964571441735188, t: 82.27380299568176

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.9054460292016464e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2686861492950140.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2020346442314162.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 966537983426960.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 582942911181494.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 420352635594125.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 330099304310940.4, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 358375333903242.25, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3634484630414166.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1767168676599967.5, scaled tolerance: 35084726045503.402 




r2: 0.47922093799031384, rmse: 0.7922736954811134, t: 82.23210501670837

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.846033471882781e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2443889493057179.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1118613781447626.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1656357204430435.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1009176985672603.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 559421305245813.94, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 312335935597925.06, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 220725728023061.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 164621507370038.3, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 82701702766819.66, scaled tolerance: 35084726045503.402 




r2: 0.8722507778212176, rmse: 0.3368256541499248, t: 82.46265244483948

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.8294474367208748e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4139629907362432.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 390103240320452.3, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 480200889998486.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 261830544332400.75, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 189086282259717.12, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 377920233300190.6, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 194047129613484.97, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 169979398971228.9, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 227898838726431.8, scaled tolerance: 35084726045503.402 




r2: 0.7763818916299724, rmse: 0.30766793089303923, t: 84.19991636276245

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 2.854918039445052e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2409759074863166.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2223436743873453.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1238625108794931.8, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 920819527831711.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 691382610454438.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 307868855775374.7, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4257137278737354.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2379071200736785.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3091248674431410.5, scaled tolerance: 35084726045503.402 




r2: 0.8564627437700868, rmse: 0.4244465423647631, t: 83.24162745475769

[[0.8656510287868295, 0.18661949011636286, 0, 83.72660684585571], [0.7873761250218165, 0.4512111309121132, 0, 82.4126136302948], [0.6804537315552623, 0.4964571441735188, 0, 82.27380299568176], [0.47922093799031384, 0.7922736954811134, 0, 82.23210501670837], [0.8722507778212176, 0.3368256541499248, 0, 82.46265244483948], [0.7763818916299724, 0.30766793089303923, 0, 84.19991636276245], [0.8564627437700868, 0.4244465423647631, 0, 83.24162745475769]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.37
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.47
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.57
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.67
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.75
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.84
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.95
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.35
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.42
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.59
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.73
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.81
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.25
[IterativeImputer] Ending imputation round 4

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.91
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.37
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.46
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.52
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.61
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.72
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.82
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.91
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending i

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.70
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.83
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.91
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.28
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.46
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.65
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.74
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.82
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.88
Imputation round 9/12
[IterativeImputer] Co

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.58
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.67
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.75
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.86
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.94
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.08
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.16
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.32
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.49
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.57
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.66
[IterativeImputer] Ending imputation round 9/

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.40
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.45
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.54
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.63
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.72
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.90
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.07
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.22
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.33
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.40
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.51
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.32
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.62
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.71
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.85
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.92
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.18
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.28
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.37
[IterativeImputer] Ending imputation round 5/

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.50
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.17
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.91
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.72
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.71
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.59
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.47
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.57
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.25
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.98
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.62
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.34
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.12
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.49
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.10
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.82
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.62
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.27
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.96
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.78
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.50
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.32
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.15
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.49
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.08
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.67
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 69.86
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.75
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.80
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.73
[IterativeImputer] Ending imputation round 2/10, elapsed time 17.27
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.93
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.61
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.30
[IterativeImputer] Ending imputation round 6/10, elapsed time 52.07
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.92
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.70
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.44
[IterativeImputer] Ending imputation round 10/10, elapsed time 87.14
Imputation round 5/5
[IterativeImp

[IterativeImputer] Ending imputation round 3/10, elapsed time 25.97
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.65
[IterativeImputer] Ending imputation round 5/10, elapsed time 43.35
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.96
[IterativeImputer] Ending imputation round 7/10, elapsed time 60.67
[IterativeImputer] Ending imputation round 8/10, elapsed time 69.38
[IterativeImputer] Ending imputation round 9/10, elapsed time 78.13
[IterativeImputer] Ending imputation round 10/10, elapsed time 86.96
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.61
[IterativeImputer] Ending imputation round 2/10, elapsed time 18.77
[IterativeImputer] Ending imputation round 3/10, elapsed time 28.09
[IterativeImputer] Ending imputation round 4/10, elapsed time 37.67
[IterativeImputer] Ending imputation round 5/10, elapsed time 47.39
[IterativeImputer] Ending imputatio

In [12]:
r3 = pd.DataFrame(r3).T
r3

Unnamed: 0,0,1,2,3
Backfill,-2.398676,1.52283,33689.285714,1.452961
Overall Mean,-0.395046,1.014262,0.0,1.687307
Yearly Mean,0.006562,0.877928,52320.571429,1.540814
Yearly Mean per Region,-0.04767,0.899047,58597.428571,1.630441
Interpolate 3,-0.891135,1.183015,33720.0,1.522317
Interpolate all,-0.892295,1.163724,58.428571,1.494697
ICE 1,0.95914,0.166005,0.0,9.990437
ICE 2,0.958234,0.16959,0.0,23.602618
ICE 3,0.759685,0.427929,0.0,82.935618
MICE 1,0.969067,0.143948,0.0,132.455087


In [13]:
r3_detail = pd.DataFrame(pd.DataFrame(r3_detail).T.stack().to_dict()).T
r3_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r3_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,-3.964220,1.152188,33619.0,1.453992
Backfill,1,-1.837371,1.679247,33786.0,1.435946
Backfill,2,-1.908139,1.523993,33654.0,1.453488
Backfill,3,-0.897788,1.538364,33643.0,1.467975
Backfill,4,-1.176092,1.413485,33679.0,1.463882
...,...,...,...,...,...
KNN 2,2,-0.010297,0.882753,0.0,18.800680
KNN 2,3,0.173781,0.997921,0.0,18.919110
KNN 2,4,0.177441,0.854692,0.0,18.957804
KNN 2,5,0.198567,0.582455,0.0,18.929258


### Imputationverfahren auf Originaldatensatz anwenden

In [14]:
for name, func in functions.items():
    print(name)

    t0 = time.time()
    df= func(experiment.reset_base()) 
    t1 = time.time()
    t = t1-t0

    print(f'{round(t, 2)}s vergangen')
    print('')
    df.to_csv(f'additional_data/imputed_sets/{name}.csv')

Backfill
0.14s vergangen

Overall Mean
0.37s vergangen

Yearly Mean
0.21s vergangen

Yearly Mean per Region
0.32s vergangen

Interpolate 3
0.2s vergangen

Interpolate all
0.17s vergangen

ICE 1




8.86s vergangen

ICE 2
22.12s vergangen

ICE 3
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 3.0129401435894064e+16, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3255302827643808.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2664174541478353.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 752792522498120.2, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 4139741271714855.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2298800774032059.0, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1244198777526491.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 1297247835266420.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 3963777598111986.5, scaled tolerance: 35084726045503.402 
[IterativeImputer] Change: 2892682827217661.5, scaled tolerance: 35084726045503.402 
84.79s vergangen





MICE 1
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.15
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.23
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.33
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.38
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.48
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.55
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.64
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.72
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.84
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.90
Imputation round 2/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.20
[IterativeImputer] Endi

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.85
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.27
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.34
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.40
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.48
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.56
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.68
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.74
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.83
130.91s vergangen

MICE 2
Imputation round 1/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.74
[I

### Ergebnisse abspeichern

In [15]:
t1 = time.time()
t = t1-t0
print(f'comlete runtime: {t/60}min')

comlete runtime: 0.28645807107289634min


In [16]:
sets = {'r1':r1, 'r1_detail':r1_detail,
       'r2':r2, 'r2_detail':r2_detail,
       'r3':r3, 'r3_detail':r3_detail,}
for name, df in sets.items():
    df.to_csv(f'additional_data/results/{name}.csv')