# Experiment

### Vorbereitung

In [1]:
import pandas as pd
import numpy as np
import time

import experiment
from imputer import *

In [2]:
t0 = time.time()
results = []
base, scaler = experiment.reset_base(return_scaler=True)

In [3]:
functions =  {'Backfill':impute_backfill, 'Overall Mean':impute_overall_means, 
              'Yearly Mean':impute_yearly_means, 'Yearly Mean per Region':impute_yearly_means_per_region, 
              'Interpolate 3':interpolate3, 'Interpolate all':interpolate_all, 
              'ICE 1':iterative_imputer1, 'ICE 2':iterative_imputer2, 
              'ICE 3':iterative_imputer3, 'MICE 1':mice_imputer, 'MICE 2':mice_imputer2, 
              'KNN 1':knn_imputer1, 'KNN 2':knn_imputer2
             }

In [4]:
def run_all(frac):
    
    #getting n different training sets
    cords_list =[]
    n = 7
    for i in np.arange(1,n+1):
        cords_list.append(experiment.get_cords(frac, i))
    
    #setting up two dictionaries to save detailed and averaged results
    detailed_results = {}   
    results = {}
         
    #itterating over dictionary of all imputers
    for name, func in functions.items():
        func_runs = []
        print(name)
        
        #running each imputer n times on different training sets
        for count, cords in enumerate(cords_list):            
            print(f'run: {count+1}/{n}')
            
            #running current imputer and timeing runtime
            t0 = time.time()
            df= func(experiment.reset_train(cords)) 
            t1 = time.time()
            t = t1-t0
            
            #evaluating run
            func_runs.append(experiment.evaluate(df, t, cords))
        
        #print evaluation result of all runs of current imputer
        print(func_runs)
        print ('')
        
        #save detailed and averaged results
        detailed_results[name] = func_runs
        results[name] = np.mean(np.array(func_runs), axis=0)
        
    return results, detailed_results


### Durchlauf mit 3% fehlenden Werten

In [5]:
r1, r1_detail = run_all(0.03)

Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Testdaten mit 3.0% fehlenden Werten (absolut: 5109)
Backfill
run: 1/7
r2: 0.932583879271738, rmse: 0.025304839916863744, t: 0.566561222076416

run: 2/7
r2: 0.98343571167781, rmse: 0.0721265294982051, t: 0.5600488185882568

run: 3/7
r2: 0.9894228814375354, rmse: 0.03734057954145193, t: 0.558051586151123

run: 4/7
r2: 0.9924393093755304, rmse: 0.045826793422044876, t: 0.5515456199645996

run: 5/7
r2: 0.9960627112832513, rmse: 0.08578166120884186, t: 0.5575532913208008

run: 6/7
r2: 0.9990794142822997, rmse: 0.03858664120213273, t: 0.5583295822143555

run: 7/7
r2: 0.9977643305855354, rmse: 0.09632470364064019, t: 0.5590472221374512

[[0.932583879271738, 0.025304839916863744, 135530,



r2: 0.9885938035326868, rmse: 0.010177118381818086, t: 10.444562673568726

run: 2/7




r2: 0.9969846894731622, rmse: 0.03219183202892108, t: 10.382390022277832

run: 3/7




r2: 0.982137909799109, rmse: 0.04736277087601019, t: 10.32923698425293

run: 4/7




r2: 0.9440848262594914, rmse: 0.1219888331236465, t: 10.26927375793457

run: 5/7




r2: 0.9919523897114556, rmse: 0.11982546506968654, t: 10.374939918518066

run: 6/7




r2: 0.9904858880552722, rmse: 0.12143557844281638, t: 10.372352838516235

run: 7/7




r2: 0.9962470222194769, rmse: 0.12172472982414029, t: 10.348971366882324

[[0.9885938035326868, 0.010177118381818086, 0, 10.444562673568726], [0.9969846894731622, 0.03219183202892108, 0, 10.382390022277832], [0.982137909799109, 0.04736277087601019, 0, 10.32923698425293], [0.9440848262594914, 0.1219888331236465, 0, 10.26927375793457], [0.9919523897114556, 0.11982546506968654, 0, 10.374939918518066], [0.9904858880552722, 0.12143557844281638, 0, 10.372352838516235], [0.9962470222194769, 0.12172472982414029, 0, 10.348971366882324]]

ICE 2
run: 1/7




r2: 0.8801397913371654, rmse: 0.032990729364265094, t: 79.21348571777344

run: 2/7




r2: 0.9703004346124738, rmse: 0.10103101545269999, t: 75.94025754928589

run: 3/7




r2: 0.9803439563494001, rmse: 0.049684281871232285, t: 75.62446761131287

run: 4/7




r2: 0.9609487457985622, rmse: 0.10194659642568091, t: 75.36795330047607

run: 5/7




r2: 0.9590658054971118, rmse: 0.2702456916945032, t: 75.71967792510986

run: 6/7




r2: 0.9951910162798481, rmse: 0.08633531357755905, t: 75.39020133018494

run: 7/7




r2: 0.873168968456131, rmse: 0.7076256796558823, t: 74.87840366363525

[[0.8801397913371654, 0.032990729364265094, 0, 79.21348571777344], [0.9703004346124738, 0.10103101545269999, 0, 75.94025754928589], [0.9803439563494001, 0.049684281871232285, 0, 75.62446761131287], [0.9609487457985622, 0.10194659642568091, 0, 75.36795330047607], [0.9590658054971118, 0.2702456916945032, 0, 75.71967792510986], [0.9951910162798481, 0.08633531357755905, 0, 75.39020133018494], [0.873168968456131, 0.7076256796558823, 0, 74.87840366363525]]

ICE 3
run: 1/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 104.23736178791236, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 60.847872252015186, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 52.31651619822493, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 42.63605091117454, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 30.681095913733184, scaled to



r2: -1.2105933752175941, rmse: 0.1416800934002644, t: 79.17767453193665

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 99.21597161518164, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 42.034139945838625, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.062224569956754, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 154.71906775264046, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 345.5181443228103, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 257.05861729784704, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 240.92813805467935, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 191.72414329939875, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 187.0783365983041, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 187.3861616408846, scaled tolerance: 0.11370298835951696 




r2: 0.8936549290616118, rmse: 0.1911781935726795, t: 78.65476274490356

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 99.59402232008283, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 13.66941925927509, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 36.10499179926715, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 16.14119125804418, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 23.466956358997567, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 27.382876315858102, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 29.148359946534416, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 26.850971417311673, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.081279644519007, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 29.31933614930661, scaled tolerance: 0.11370298835951696 




r2: 0.8459808419459823, rmse: 0.13907796758967478, t: 80.99149823188782

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 98.84242662642316, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 152.5215046381835, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 34.7809371715383, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.880096435598986, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 48.91586569427565, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 46.71666206992575, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 92.07978116007823, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 80.17799344781714, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 69.44097903340213, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 54.69914820277461, scaled tolerance: 0.11370298835951696 




r2: 0.8349686849543275, rmse: 0.20957448998322428, t: 78.41846990585327

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 102.01042838708766, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 42.79470429095581, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 51.71930440501302, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 115.79759635480664, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 61.8123126484441, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 75.13764517478455, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 34.03736489149699, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 66.56091203396421, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 219.92943643960817, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 42.74137409124545, scaled tolerance: 0.11370298835951696 




r2: 0.9750461965042472, rmse: 0.21100076509911342, t: 77.68548393249512

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 100.29992120043757, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 23.766048296741165, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 35.43633297980655, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 37.87213754287315, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.618932667729663, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 21.314694087582566, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 23.152781210505452, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 24.908543857299502, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 37.98855101995858, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 49.86922807218363, scaled tolerance: 0.11370298835951696 




r2: 0.9860539816337848, rmse: 0.14702355974840992, t: 81.9513931274414

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 105.06411838577453, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 32.48268997833305, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 34.30852258173641, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 76.8927323894636, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 77.40966321279409, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 79.5903203067961, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 53.58896268647449, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 55.530369894870745, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 98.91425993716732, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 96.27897871268496, scaled tolerance: 0.11370298835951696 




r2: 0.9408371540451838, rmse: 0.48329839312313255, t: 78.90451455116272

[[-1.2105933752175941, 0.1416800934002644, 0, 79.17767453193665], [0.8936549290616118, 0.1911781935726795, 0, 78.65476274490356], [0.8459808419459823, 0.13907796758967478, 0, 80.99149823188782], [0.8349686849543275, 0.20957448998322428, 0, 78.41846990585327], [0.9750461965042472, 0.21100076509911342, 0, 77.68548393249512], [0.9860539816337848, 0.14702355974840992, 0, 81.9513931274414], [0.9408371540451838, 0.48329839312313255, 0, 78.90451455116272]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.12
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.21
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.32
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.42
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.54
[IterativeImputer] Ending imputation ro

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.26
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.38
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.52
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.65
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.79
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.91
[IterativeImputer] Ending imputation round 8/10, elapsed time 9.06
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.17
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.29
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.12
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.24
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.35
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.49
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.16
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.35
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.50
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.68
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.83
[IterativeImputer] Ending imputation round 6/10, elapsed time 7.02
[IterativeImputer] Ending imputation round 7/10, elapsed time 8.16
[IterativeImputer] Ending imputation round 8/10, elapsed time 9.35
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.50
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.68
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.13
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.25
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.34
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 10/10, elapsed time 11.42
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.20
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.37
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.58
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.77
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.97
[IterativeImputer] Ending imputation round 6/10, elapsed time 7.14
[IterativeImputer] Ending imputation round 7/10, elapsed time 8.33
[IterativeImputer] Ending imputation round 8/10, elapsed time 9.50
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.70
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.88
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.16
[IterativeImputer] Ending 

[IterativeImputer] Ending imputation round 8/10, elapsed time 8.93
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.04
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.17
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.24
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.36
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.50
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.61
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.75
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.85
[IterativeImputer] Ending imputation round 8/10, elapsed time 9.00
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.13
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.27
Imputation round 9/12
[IterativeImputer] 

[IterativeImputer] Ending imputation round 6/10, elapsed time 6.70
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.81
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.89
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.01
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.10
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.13
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.22
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.35
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.44
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.55
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.65
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.78
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.90
[IterativeImputer] Ending imputation round 9

[IterativeImputer] Ending imputation round 4/10, elapsed time 4.46
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.57
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.69
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.78
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.90
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.98
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.11
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.12
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.26
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.35
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.48
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.59
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.73
[IterativeImputer] Ending imputation round 7/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.24
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.34
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.41
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.52
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.62
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.73
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.87
[IterativeImputer] Ending imputation round 9/10, elapsed time 10.02
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.13
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.14
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.23
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.35
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.46
[IterativeImputer] Ending imputation round 5

[IterativeImputer] Ending imputation round 4/10, elapsed time 34.00
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.52
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.00
[IterativeImputer] Ending imputation round 7/10, elapsed time 59.46
[IterativeImputer] Ending imputation round 8/10, elapsed time 67.91
[IterativeImputer] Ending imputation round 9/10, elapsed time 76.41
[IterativeImputer] Ending imputation round 10/10, elapsed time 84.85
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.21
[IterativeImputer] Ending imputation round 2/10, elapsed time 16.64
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.16
[IterativeImputer] Ending imputation round 4/10, elapsed time 33.64
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.11
[IterativeImputer] Ending imputation round 6/10, elapsed time 50.61
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 1/10, elapsed time 8.35
[IterativeImputer] Ending imputation round 2/10, elapsed time 16.91
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.48
[IterativeImputer] Ending imputation round 4/10, elapsed time 34.10
[IterativeImputer] Ending imputation round 5/10, elapsed time 42.70
[IterativeImputer] Ending imputation round 6/10, elapsed time 51.35
[IterativeImputer] Ending imputation round 7/10, elapsed time 59.98
[IterativeImputer] Ending imputation round 8/10, elapsed time 68.53
[IterativeImputer] Ending imputation round 9/10, elapsed time 77.14
[IterativeImputer] Ending imputation round 10/10, elapsed time 85.85
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.35
[IterativeImputer] Ending imputation round 2/10, elapsed time 16.89
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.38
[IterativeImputer] Ending imputation

[IterativeImputer] Ending imputation round 8/10, elapsed time 89.41
[IterativeImputer] Ending imputation round 9/10, elapsed time 100.64
[IterativeImputer] Ending imputation round 10/10, elapsed time 112.02
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 2/10, elapsed time 19.71
[IterativeImputer] Ending imputation round 3/10, elapsed time 29.90
[IterativeImputer] Ending imputation round 4/10, elapsed time 39.93
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.03
[IterativeImputer] Ending imputation round 6/10, elapsed time 60.16
[IterativeImputer] Ending imputation round 7/10, elapsed time 70.24
[IterativeImputer] Ending imputation round 8/10, elapsed time 80.31
[IterativeImputer] Ending imputation round 9/10, elapsed time 90.74
[IterativeImputer] Ending imputation round 10/10, elapsed time 102.71
Imputation round 5/5
[Iterative

[IterativeImputer] Ending imputation round 3/10, elapsed time 29.72
[IterativeImputer] Ending imputation round 4/10, elapsed time 39.76
[IterativeImputer] Ending imputation round 5/10, elapsed time 49.78
[IterativeImputer] Ending imputation round 6/10, elapsed time 59.85
[IterativeImputer] Ending imputation round 7/10, elapsed time 70.07
[IterativeImputer] Ending imputation round 8/10, elapsed time 80.21
[IterativeImputer] Ending imputation round 9/10, elapsed time 90.39
[IterativeImputer] Ending imputation round 10/10, elapsed time 101.70
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.97
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.04
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.18
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.32
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.69
[IterativeImputer] Ending imputati

In [6]:
r1 = pd.DataFrame(r1).T
r1

Unnamed: 0,0,1,2,3
Backfill,0.984398,0.057327,135535.571429,0.558734
Overall Mean,-0.32835,0.878404,0.0,0.827731
Yearly Mean,-0.357697,0.883607,52298.0,0.646067
Yearly Mean per Region,-1.195371,0.909555,58248.428571,0.792087
Interpolate 3,0.996616,0.028444,134354.571429,2.532999
Interpolate all,0.996619,0.028371,112679.285714,1.783518
ICE 1,0.984355,0.082101,0.0,10.360247
ICE 2,0.945594,0.192837,0.0,76.019207
ICE 3,0.609421,0.217548,0.0,79.397685
MICE 1,0.98871,0.061365,0.0,136.15285


In [7]:
r1_detail = pd.DataFrame(pd.DataFrame(r1_detail).T.stack().to_dict()).T
r1_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r1_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,0.932584,0.025305,135530.0,0.566561
Backfill,1,0.983436,0.072127,135514.0,0.560049
Backfill,2,0.989423,0.037341,135555.0,0.558052
Backfill,3,0.992439,0.045827,135512.0,0.551546
Backfill,4,0.996063,0.085782,135536.0,0.557553
...,...,...,...,...,...
KNN 2,2,0.117166,0.332974,0.0,18.313717
KNN 2,3,0.558552,0.342764,0.0,18.354773
KNN 2,4,0.157529,1.226008,0.0,18.373783
KNN 2,5,0.090273,1.187456,0.0,19.043271


### Durchlauf mit 5% fehlenden Werten

In [8]:
r2 , r2_detail =  run_all(0.05)

Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Testdaten mit 5.0% fehlenden Werten (absolut: 8515)
Backfill
run: 1/7
r2: 0.9973082101055876, rmse: 0.08703598848801375, t: 0.8733551502227783

run: 2/7
r2: 0.9858079818551079, rmse: 0.07306097819250446, t: 0.8754844665527344

run: 3/7
r2: 0.9757670531819184, rmse: 0.09497599123099765, t: 0.8697924613952637

run: 4/7
r2: 0.9864813648105862, rmse: 0.06158480457363178, t: 0.8953661918640137

run: 5/7
r2: 0.9957604692455183, rmse: 0.10362087941748466, t: 0.8808281421661377

run: 6/7
r2: 0.9909789664362828, rmse: 0.06180154142551044, t: 0.9035186767578125

run: 7/7
r2: 0.9866297434430658, rmse: 0.0680957160943159, t: 0.8910121917724609

[[0.9973082101055876, 0.08703598848801375, 1357



r2: 0.9876887158899978, rmse: 0.18229550284202936, t: 12.028942108154297

run: 2/7




r2: 0.7840364282344524, rmse: 0.2786823680043684, t: 11.855463981628418

run: 3/7




r2: 0.9883558942421291, rmse: 0.06437175877687713, t: 11.912816286087036

run: 4/7




r2: 0.9877952162945246, rmse: 0.1162959285766722, t: 11.928767681121826

run: 5/7




r2: 0.9908526390634123, rmse: 0.14892100877162637, t: 12.001462936401367

run: 6/7




r2: 0.9776164366571884, rmse: 0.09529402834134755, t: 11.793576955795288

run: 7/7




r2: 0.9885829413373741, rmse: 0.06164679174661918, t: 11.792851686477661

[[0.9876887158899978, 0.18229550284202936, 0, 12.028942108154297], [0.7840364282344524, 0.2786823680043684, 0, 11.855463981628418], [0.9883558942421291, 0.06437175877687713, 0, 11.912816286087036], [0.9877952162945246, 0.1162959285766722, 0, 11.928767681121826], [0.9908526390634123, 0.14892100877162637, 0, 12.001462936401367], [0.9776164366571884, 0.09529402834134755, 0, 11.793576955795288], [0.9885829413373741, 0.06164679174661918, 0, 11.792851686477661]]

ICE 2
run: 1/7




r2: 0.9134133219911886, rmse: 0.48344805457527845, t: 93.79971408843994

run: 2/7




r2: 0.9901392262918218, rmse: 0.05954903630360002, t: 94.10777568817139

run: 3/7




r2: 0.9445414083142578, rmse: 0.14048395425496465, t: 93.97961163520813

run: 4/7




r2: 0.966112054802091, rmse: 0.19378586022877453, t: 94.07925271987915

run: 5/7




r2: 0.9813090139861719, rmse: 0.21287475824601432, t: 93.63507056236267

run: 6/7




r2: 0.9526705310209753, rmse: 0.1385692574011069, t: 93.71891927719116

run: 7/7




r2: 0.9905927071712107, rmse: 0.05595845238568842, t: 93.47826910018921

[[0.9134133219911886, 0.48344805457527845, 0, 93.79971408843994], [0.9901392262918218, 0.05954903630360002, 0, 94.10777568817139], [0.9445414083142578, 0.14048395425496465, 0, 93.97961163520813], [0.966112054802091, 0.19378586022877453, 0, 94.07925271987915], [0.9813090139861719, 0.21287475824601432, 0, 93.63507056236267], [0.9526705310209753, 0.1385692574011069, 0, 93.71891927719116], [0.9905927071712107, 0.05595845238568842, 0, 93.47826910018921]]

ICE 3
run: 1/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 134.0789117873059, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 55.24029626044301, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 40.23731081080076, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 66.68856953197154, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 53.90903391122144, scaled tole



r2: 0.9510462473349963, rmse: 0.3635107617499555, t: 94.5076756477356

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 102.68818423860914, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 56.05921525223947, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 17.92995857600461, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 49.53385154442202, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 64.82527772708133, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 49.04548727117475, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 42.57054404053308, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 17.244417111425246, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 35.00396695094187, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 37.37514769797358, scaled tolerance: 0.11370298835951696 




r2: 0.8795631871785323, rmse: 0.20811283643369438, t: 93.50213146209717

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 100.9420480716928, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 39.32911744174603, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 33.311100999328055, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 11.530699947821748, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 81.78881965723532, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 83.62352785381074, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 74.73318317434824, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 75.90504819993113, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 78.72860451618784, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 88.92423738081648, scaled tolerance: 0.11370298835951696 




r2: 0.4379287452835423, rmse: 0.44723727449197703, t: 93.94242882728577

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 98.96897680519632, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 48.60203732706713, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 30.01218225745206, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 54.481340324136525, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 50.85017542605499, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 68.83767644679045, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 30.02206203568621, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 41.670993102237624, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 39.66229541001917, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 29.214783066199807, scaled tolerance: 0.11370298835951696 




r2: 0.5663124712159896, rmse: 0.6932468963586335, t: 94.33545207977295

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 125.54761934116495, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 43.389315436180816, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 55.04173588130167, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 33.54869712983137, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 91.24799333811104, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 35.68745705765289, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 100.03782881955571, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 69.70058456195132, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 145.65473277694113, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 287.8834355960849, scaled tolerance: 0.11370298835951696 




r2: 0.9519501671573913, rmse: 0.341313921075408, t: 92.77167129516602

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 103.71610835618661, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 95.69262766130305, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 61.34996735984817, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 97.78114889024351, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 80.8631964656669, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 65.0183168593102, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 38.91930960723178, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 46.74544777200868, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 54.009617866588265, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 44.60822607972789, scaled tolerance: 0.11370298835951696 




r2: 0.8514486895158309, rmse: 0.24549311542798946, t: 94.8245177268982

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 113.11561269853337, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 13.158556199168958, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 47.504766445852404, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 22.38870595915095, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 18.232074887920763, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 17.460948048075117, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 21.588313712863876, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.32330575754128, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 37.89327193925225, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 35.450979156258505, scaled tolerance: 0.11370298835951696 




r2: 0.893074358110113, rmse: 0.18865759619345054, t: 94.77078914642334

[[0.9510462473349963, 0.3635107617499555, 0, 94.5076756477356], [0.8795631871785323, 0.20811283643369438, 0, 93.50213146209717], [0.4379287452835423, 0.44723727449197703, 0, 93.94242882728577], [0.5663124712159896, 0.6932468963586335, 0, 94.33545207977295], [0.9519501671573913, 0.341313921075408, 0, 92.77167129516602], [0.8514486895158309, 0.24549311542798946, 0, 94.8245177268982], [0.893074358110113, 0.18865759619345054, 0, 94.77078914642334]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.42
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.78
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.32
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.74
[IterativeImputer] Ending imputation round 5/10, elapsed time 7.11
[IterativeImputer] Ending imputation round 6/

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.68
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.01
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.39
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.71
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.14
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.50
[IterativeImputer] Ending imputation round 8/10, elapsed time 10.87
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.27
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.67
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.36
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.69
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.05
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.42
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.42
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.82
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.17
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.55
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.93
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.29
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.68
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.08
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.46
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.83
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.39
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.76
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.11
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 10/10, elapsed time 13.76
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.38
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.72
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.09
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.83
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.19
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.54
[IterativeImputer] Ending imputation round 8/10, elapsed time 10.91
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.25
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.64
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.37
[IterativeImputer] Ending

[IterativeImputer] Ending imputation round 7/10, elapsed time 9.48
[IterativeImputer] Ending imputation round 8/10, elapsed time 10.84
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.18
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.62
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.34
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.72
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.07
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.81
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.17
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.56
[IterativeImputer] Ending imputation round 8/10, elapsed time 10.94
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.31
[IterativeImputer] Ending imputation roun

[IterativeImputer] Ending imputation round 4/10, elapsed time 5.50
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.94
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.28
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.65
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.01
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.44
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.79
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.36
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.71
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.06
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.44
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.77
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.13
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.38
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.81
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.19
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.58
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.96
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.32
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.72
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.07
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.45
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.80
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.37
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.72
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.11
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 10/10, elapsed time 13.94
Imputation round 4/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.34
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.69
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.09
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.48
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.84
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.19
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.56
[IterativeImputer] Ending imputation round 8/10, elapsed time 10.94
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.32
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.83
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.37
[IterativeImputer] Ending 

[IterativeImputer] Ending imputation round 1/10, elapsed time 9.96
[IterativeImputer] Ending imputation round 2/10, elapsed time 19.92
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.10
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.23
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.58
[IterativeImputer] Ending imputation round 6/10, elapsed time 60.78
[IterativeImputer] Ending imputation round 7/10, elapsed time 71.03
[IterativeImputer] Ending imputation round 8/10, elapsed time 81.22
[IterativeImputer] Ending imputation round 9/10, elapsed time 91.33
[IterativeImputer] Ending imputation round 10/10, elapsed time 101.45
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.84
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.03
[IterativeImputer] Ending imputation round 3/10, elapsed time 29.98
[IterativeImputer] Ending imputatio

[IterativeImputer] Ending imputation round 8/10, elapsed time 81.07
[IterativeImputer] Ending imputation round 9/10, elapsed time 91.23
[IterativeImputer] Ending imputation round 10/10, elapsed time 101.48
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.97
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.42
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.46
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.55
[IterativeImputer] Ending imputation round 6/10, elapsed time 60.79
[IterativeImputer] Ending imputation round 7/10, elapsed time 71.12
[IterativeImputer] Ending imputation round 8/10, elapsed time 81.42
[IterativeImputer] Ending imputation round 9/10, elapsed time 91.70
[IterativeImputer] Ending imputation round 10/10, elapsed time 101.96
Imputation round 4/5
[IterativeI

[IterativeImputer] Ending imputation round 3/10, elapsed time 30.21
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.19
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.40
[IterativeImputer] Ending imputation round 6/10, elapsed time 60.67
[IterativeImputer] Ending imputation round 7/10, elapsed time 70.81
[IterativeImputer] Ending imputation round 8/10, elapsed time 80.96
[IterativeImputer] Ending imputation round 9/10, elapsed time 91.16
[IterativeImputer] Ending imputation round 10/10, elapsed time 101.47
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.77
[IterativeImputer] Ending imputation round 2/10, elapsed time 19.98
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.09
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.25
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.67
[IterativeImputer] Ending imputati

[IterativeImputer] Ending imputation round 9/10, elapsed time 91.62
[IterativeImputer] Ending imputation round 10/10, elapsed time 101.87
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.81
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.02
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.43
[IterativeImputer] Ending imputation round 5/10, elapsed time 50.62
[IterativeImputer] Ending imputation round 6/10, elapsed time 61.03
[IterativeImputer] Ending imputation round 7/10, elapsed time 71.40
[IterativeImputer] Ending imputation round 8/10, elapsed time 81.81
[IterativeImputer] Ending imputation round 9/10, elapsed time 92.31
[IterativeImputer] Ending imputation round 10/10, elapsed time 102.78
Imputation round 5/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] 

In [9]:
r2 = pd.DataFrame(r2).T
r2

Unnamed: 0,0,1,2,3
Backfill,0.988391,0.078597,135735.285714,0.884194
Overall Mean,0.017483,0.942313,0.0,1.158503
Yearly Mean,0.002611,0.949257,52298.0,0.997352
Yearly Mean per Region,-0.053966,0.97477,58352.714286,1.113363
Interpolate 3,0.9955,0.053491,134538.0,3.118704
Interpolate all,0.9955,0.053374,112822.0,2.279457
ICE 1,0.957847,0.135358,0.0,11.901983
ICE 2,0.962683,0.183524,0.0,93.828373
ICE 3,0.790189,0.355367,0.0,94.093524
MICE 1,0.960959,0.140063,0.0,166.841412


In [10]:
r2_detail = pd.DataFrame(pd.DataFrame(r2_detail).T.stack().to_dict()).T
r2_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r2_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,0.997308,0.087036,135735.0,0.873355
Backfill,1,0.985808,0.073061,135759.0,0.875484
Backfill,2,0.975767,0.094976,135763.0,0.869792
Backfill,3,0.986481,0.061585,135732.0,0.895366
Backfill,4,0.995760,0.103621,135733.0,0.880828
...,...,...,...,...,...
KNN 2,2,0.027728,0.588215,0.0,18.844944
KNN 2,3,0.092321,1.002918,0.0,19.003815
KNN 2,4,0.307846,1.295417,0.0,18.890669
KNN 2,5,0.103455,0.603097,0.0,19.075048


### Durchlauf mit 10% fehlenden Werten

In [11]:
r3, r3_detail = run_all(0.1)

Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Testdaten mit 10.0% fehlenden Werten (absolut: 17030)
Backfill
run: 1/7
r2: 0.9663622883375262, rmse: 0.09435929351380964, t: 1.6076178550720215

run: 2/7
r2: 0.965831207998835, rmse: 0.16608208537305055, t: 1.6123969554901123

run: 3/7
r2: 0.9935577602592738, rmse: 0.06511406610024399, t: 1.6313450336456299

run: 4/7
r2: 0.9875539571238111, rmse: 0.10890085372239798, t: 1.595137596130371

run: 5/7
r2: 0.9899041916706846, rmse: 0.09012378029510211, t: 1.6163153648376465

run: 6/7
r2: 0.9842042755499092, rmse: 0.08112853612646811, t: 1.6076030731201172

run: 7/7
r2: 0.9800827771746988, rmse: 0.1472582895356431, t: 1.6198585033416748

[[0.9663622883375262, 0.09435929351



r2: 0.9357367864645735, rmse: 0.12776886482885486, t: 13.235673189163208

run: 2/7




r2: 0.9418304252479318, rmse: 0.21200718413612057, t: 13.166343688964844

run: 3/7




r2: 0.9891326376065146, rmse: 0.08267894900896625, t: 13.17636775970459

run: 4/7




r2: 0.9838955013211477, rmse: 0.12119792020333492, t: 12.897680521011353

run: 5/7




r2: 0.903254558541485, rmse: 0.2725040574712619, t: 13.142938375473022

run: 6/7




r2: 0.972978168094846, rmse: 0.10409991674233914, t: 12.73015832901001

run: 7/7




r2: 0.9575388399481048, rmse: 0.2118402119224618, t: 13.06698751449585

[[0.9357367864645735, 0.12776886482885486, 0, 13.235673189163208], [0.9418304252479318, 0.21200718413612057, 0, 13.166343688964844], [0.9891326376065146, 0.08267894900896625, 0, 13.17636775970459], [0.9838955013211477, 0.12119792020333492, 0, 12.897680521011353], [0.903254558541485, 0.2725040574712619, 0, 13.142938375473022], [0.972978168094846, 0.10409991674233914, 0, 12.73015832901001], [0.9575388399481048, 0.2118402119224618, 0, 13.06698751449585]]

ICE 2
run: 1/7




r2: 0.9719353654700009, rmse: 0.0844351953090043, t: 96.79999279975891

run: 2/7




r2: 0.9895519743837302, rmse: 0.0898503447309157, t: 95.56663703918457

run: 3/7




r2: 0.9268145106214385, rmse: 0.21455832155568302, t: 97.21492910385132

run: 4/7




r2: 0.9894193796617424, rmse: 0.09823746062273213, t: 95.464923620224

run: 5/7




r2: 0.9769052618823861, rmse: 0.13314174318796193, t: 95.50529026985168

run: 6/7




r2: 0.9693786707502026, rmse: 0.11081664757337056, t: 93.99799990653992

run: 7/7




r2: 0.9743810937014752, rmse: 0.1645480603565979, t: 94.67615032196045

[[0.9719353654700009, 0.0844351953090043, 0, 96.79999279975891], [0.9895519743837302, 0.0898503447309157, 0, 95.56663703918457], [0.9268145106214385, 0.21455832155568302, 0, 97.21492910385132], [0.9894193796617424, 0.09823746062273213, 0, 95.464923620224], [0.9769052618823861, 0.13314174318796193, 0, 95.50529026985168], [0.9693786707502026, 0.11081664757337056, 0, 93.99799990653992], [0.9743810937014752, 0.1645480603565979, 0, 94.67615032196045]]

ICE 3
run: 1/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 109.22399646964098, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 91.46784081655693, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 69.8562366250249, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 101.71444966370606, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 115.08336356745625, scaled tolera



r2: 0.8317600668382732, rmse: 0.20673231140118428, t: 94.83883833885193

run: 2/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 102.39954741294694, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 20.352317319160072, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 9.378776891868991, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 17.16695477889979, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 72.44230440366934, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 82.79799894265723, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 65.07266376302802, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 56.70634665209171, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 64.13432661677074, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 41.43549581057201, scaled tolerance: 0.11370298835951696 




r2: 0.9279255907554914, rmse: 0.2359897711135257, t: 94.3963611125946

run: 3/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 98.8378069733917, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 63.20495065618921, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 38.48773350762675, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 51.28703781400902, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 74.33181509055048, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 128.04150810241745, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 99.46324303876852, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 61.77744879898086, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 579.5195599917383, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 279.6843645320948, scaled tolerance: 0.11370298835951696 




r2: 0.9012723961034466, rmse: 0.24920237152512917, t: 94.98651909828186

run: 4/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 101.59862970829286, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 15.663192425136073, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 52.59335430752736, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 115.01461481171575, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 221.62534573611666, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 289.5621618419794, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 336.9138692397395, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 561.5506886861668, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 247.03425383394904, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 551.3246047150237, scaled tolerance: 0.11370298835951696 




r2: 0.8822168989227234, rmse: 0.3277653610486168, t: 96.2418806552887

run: 5/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 108.52297283174707, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 32.06969219935116, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 15.822913081301701, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 35.51287462155281, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 78.48592581034185, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 33.36204888450823, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 14.213536448245621, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 8.56585257172939, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 8.668069909785652, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 11.993393583817477, scaled tolerance: 0.11370298835951696 




r2: 0.9028637094294659, rmse: 0.2730539573510883, t: 93.29700708389282

run: 6/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 113.2552465236194, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 14.526387316079786, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 16.806643105539855, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 25.601576346812276, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 40.30675637335955, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 26.705077335468257, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 29.379706857052057, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.020186484985178, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 26.634344693256246, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.59899241010215, scaled tolerance: 0.11370298835951696 




r2: 0.8448359986107478, rmse: 0.2494528519453891, t: 94.20208883285522

run: 7/7
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 128.53839749749673, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 28.873454347871395, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 54.498676788034494, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 213.2897525374016, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 383.57496947167056, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 581.6482736919526, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 674.4326864154756, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 678.6299931489322, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 522.209441177793, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 307.2898208800594, scaled tolerance: 0.11370298835951696 




r2: 0.8807813549229437, rmse: 0.35496420914237725, t: 94.13712692260742

[[0.8317600668382732, 0.20673231140118428, 0, 94.83883833885193], [0.9279255907554914, 0.2359897711135257, 0, 94.3963611125946], [0.9012723961034466, 0.24920237152512917, 0, 94.98651909828186], [0.8822168989227234, 0.3277653610486168, 0, 96.2418806552887], [0.9028637094294659, 0.2730539573510883, 0, 93.29700708389282], [0.8448359986107478, 0.2494528519453891, 0, 94.20208883285522], [0.8807813549229437, 0.35496420914237725, 0, 94.13712692260742]]

MICE 1
run: 1/7
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.36
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.83
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.20
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.58
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.97
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 2/10, elapsed time 2.71
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.15
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.54
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.92
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.35
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.68
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.08
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.44
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.83
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.37
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.71
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.11
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.46
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.34
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.70
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.06
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.51
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.93
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.39
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.79
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.17
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.58
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.93
Imputation round 11/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.41
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.82
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.25
[IterativeImputer] Ending imputation round

[IterativeImputer] Ending imputation round 10/10, elapsed time 14.30
Imputation round 9/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.38
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.77
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.16
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.52
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.96
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.33
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.71
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.12
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.49
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.91
Imputation round 10/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.42
[IterativeImputer] Ending

[IterativeImputer] Ending imputation round 7/10, elapsed time 9.82
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.20
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.63
[IterativeImputer] Ending imputation round 10/10, elapsed time 14.04
Imputation round 8/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.41
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.83
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.23
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.60
[IterativeImputer] Ending imputation round 5/10, elapsed time 7.05
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.43
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.81
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.21
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.58
[IterativeImputer] Ending imputation roun

[IterativeImputer] Ending imputation round 4/10, elapsed time 5.55
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.94
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.32
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.80
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.20
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.62
[IterativeImputer] Ending imputation round 10/10, elapsed time 14.01
Imputation round 7/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.36
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.78
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.17
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.58
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.94
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.34
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 1/10, elapsed time 1.46
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.84
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.25
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.62
[IterativeImputer] Ending imputation round 5/10, elapsed time 7.04
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.39
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.80
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.20
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.58
[IterativeImputer] Ending imputation round 10/10, elapsed time 14.09
Imputation round 6/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.35
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.74
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.13
[IterativeImputer] Ending imputation round 

[IterativeImputer] Ending imputation round 10/10, elapsed time 14.19
Imputation round 4/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.41
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.78
[IterativeImputer] Ending imputation round 3/10, elapsed time 4.16
[IterativeImputer] Ending imputation round 4/10, elapsed time 5.58
[IterativeImputer] Ending imputation round 5/10, elapsed time 6.93
[IterativeImputer] Ending imputation round 6/10, elapsed time 8.33
[IterativeImputer] Ending imputation round 7/10, elapsed time 9.69
[IterativeImputer] Ending imputation round 8/10, elapsed time 11.11
[IterativeImputer] Ending imputation round 9/10, elapsed time 12.51
[IterativeImputer] Ending imputation round 10/10, elapsed time 13.92
Imputation round 5/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.42
[IterativeImputer] Ending 

[IterativeImputer] Ending imputation round 1/10, elapsed time 10.02
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.37
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.78
[IterativeImputer] Ending imputation round 4/10, elapsed time 41.24
[IterativeImputer] Ending imputation round 5/10, elapsed time 51.80
[IterativeImputer] Ending imputation round 6/10, elapsed time 62.30
[IterativeImputer] Ending imputation round 7/10, elapsed time 72.86
[IterativeImputer] Ending imputation round 8/10, elapsed time 83.41
[IterativeImputer] Ending imputation round 9/10, elapsed time 93.90
[IterativeImputer] Ending imputation round 10/10, elapsed time 104.63
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.99
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.39
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.96
[IterativeImputer] Ending imputati

[IterativeImputer] Ending imputation round 7/10, elapsed time 71.77
[IterativeImputer] Ending imputation round 8/10, elapsed time 82.17
[IterativeImputer] Ending imputation round 9/10, elapsed time 92.58
[IterativeImputer] Ending imputation round 10/10, elapsed time 102.98
Imputation round 3/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.90
[IterativeImputer] Ending imputation round 2/10, elapsed time 19.96
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.17
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.56
[IterativeImputer] Ending imputation round 5/10, elapsed time 51.03
[IterativeImputer] Ending imputation round 6/10, elapsed time 61.24
[IterativeImputer] Ending imputation round 7/10, elapsed time 71.65
[IterativeImputer] Ending imputation round 8/10, elapsed time 82.10
[IterativeImputer] Ending imputation round 9/10, elapsed time 92.44
[IterativeImputer] Ending imputati

[IterativeImputer] Ending imputation round 2/10, elapsed time 20.24
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.65
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.91
[IterativeImputer] Ending imputation round 5/10, elapsed time 51.19
[IterativeImputer] Ending imputation round 6/10, elapsed time 61.53
[IterativeImputer] Ending imputation round 7/10, elapsed time 71.81
[IterativeImputer] Ending imputation round 8/10, elapsed time 82.18
[IterativeImputer] Ending imputation round 9/10, elapsed time 92.60
[IterativeImputer] Ending imputation round 10/10, elapsed time 103.19
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 9.93
[IterativeImputer] Ending imputation round 2/10, elapsed time 20.13
[IterativeImputer] Ending imputation round 3/10, elapsed time 30.35
[IterativeImputer] Ending imputation round 4/10, elapsed time 40.66
[IterativeImputer] Ending imputati

[IterativeImputer] Ending imputation round 8/10, elapsed time 75.42
[IterativeImputer] Ending imputation round 9/10, elapsed time 84.06
[IterativeImputer] Ending imputation round 10/10, elapsed time 92.60
Imputation round 4/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.29
[IterativeImputer] Ending imputation round 2/10, elapsed time 16.66
[IterativeImputer] Ending imputation round 3/10, elapsed time 25.04
[IterativeImputer] Ending imputation round 4/10, elapsed time 33.43
[IterativeImputer] Ending imputation round 5/10, elapsed time 41.80
[IterativeImputer] Ending imputation round 6/10, elapsed time 50.35
[IterativeImputer] Ending imputation round 7/10, elapsed time 58.82
[IterativeImputer] Ending imputation round 8/10, elapsed time 67.31
[IterativeImputer] Ending imputation round 9/10, elapsed time 75.82
[IterativeImputer] Ending imputation round 10/10, elapsed time 84.36
Imputation round 5/5
[IterativeImp

In [12]:
r3 = pd.DataFrame(r3).T
r3

Unnamed: 0,0,1,2,3
Backfill,0.981071,0.107567,136315.285714,1.612896
Overall Mean,0.017973,0.801274,0.0,1.979229
Yearly Mean,0.003655,0.806951,52320.571429,1.693189
Yearly Mean per Region,-0.067243,0.833809,58597.428571,1.808593
Interpolate 3,0.992623,0.06878,135062.142857,3.98737
Interpolate all,0.992623,0.068608,113218.571429,3.03362
ICE 1,0.95491,0.161728,0.0,13.05945
ICE 2,0.971198,0.127941,0.0,95.603703
ICE 3,0.881665,0.271023,0.0,94.585689
MICE 1,0.965489,0.140832,0.0,170.078419


In [13]:
r3_detail = pd.DataFrame(pd.DataFrame(r3_detail).T.stack().to_dict()).T
r3_detail.columns = ['r2', 'rmse', 'still_missing', 't']
r3_detail

Unnamed: 0,Unnamed: 1,r2,rmse,still_missing,t
Backfill,0,0.966362,0.094359,136318.0,1.607618
Backfill,1,0.965831,0.166082,136383.0,1.612397
Backfill,2,0.993558,0.065114,136254.0,1.631345
Backfill,3,0.987554,0.108901,136287.0,1.595138
Backfill,4,0.989904,0.090124,136382.0,1.616315
...,...,...,...,...,...
KNN 2,2,0.070942,0.764459,0.0,18.499605
KNN 2,3,0.248429,0.827955,0.0,18.547533
KNN 2,4,0.201913,0.782678,0.0,18.572516
KNN 2,5,0.250318,0.548317,0.0,18.481295


### Imputationverfahren auf Originaldatensatz anwenden

In [14]:
for name, func in functions.items():
    print(name)
    
    #impute original (scaled) dataset
    t0 = time.time()
    df= func(experiment.reset_base()) 
    t1 = time.time()
    t = t1-t0
    
    #rescale to original proportions
    col = df.columns
    idx = df.index
    df = scaler.inverse_transform(df)
    df = pd.DataFrame(df, columns=col, index=idx)

    print(f'{round(t, 2)}s vergangen')
    print('')
    df.to_csv(f'additional_data/imputed_sets/{name}.csv')

Backfill
0.16s vergangen

Overall Mean
0.4s vergangen

Yearly Mean
0.24s vergangen

Yearly Mean per Region
0.35s vergangen

Interpolate 3
2.02s vergangen

Interpolate all
1.4s vergangen

ICE 1




9.02s vergangen

ICE 2




74.13s vergangen

ICE 3
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Change: 98.86652185477122, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 300.9499313595279, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 335.0402796084985, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 85.62030138511601, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 1316.7388692189515, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 860.0137215932846, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 591.9256689911845, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 1691.2582393542325, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 1690.4436131565592, scaled tolerance: 0.11370298835951696 
[IterativeImputer] Change: 641.041467924275, scaled tolerance: 0.11370298835951696 
78.81s vergangen





MICE 1
Imputation round 1/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.11
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.23
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.31
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.42
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.51
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.62
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.74
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.86
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.95
[IterativeImputer] Ending imputation round 10/10, elapsed time 11.05
Imputation round 2/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.09
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.22
[IterativeImputer] Endi

[IterativeImputer] Ending imputation round 10/10, elapsed time 10.92
Imputation round 12/12
[IterativeImputer] Completing matrix with shape (26070, 31)
[IterativeImputer] Ending imputation round 1/10, elapsed time 1.10
[IterativeImputer] Ending imputation round 2/10, elapsed time 2.17
[IterativeImputer] Ending imputation round 3/10, elapsed time 3.29
[IterativeImputer] Ending imputation round 4/10, elapsed time 4.36
[IterativeImputer] Ending imputation round 5/10, elapsed time 5.45
[IterativeImputer] Ending imputation round 6/10, elapsed time 6.57
[IterativeImputer] Ending imputation round 7/10, elapsed time 7.66
[IterativeImputer] Ending imputation round 8/10, elapsed time 8.76
[IterativeImputer] Ending imputation round 9/10, elapsed time 9.87
[IterativeImputer] Ending imputation round 10/10, elapsed time 10.95
132.91s vergangen

MICE 2
Imputation round 1/5
[IterativeImputer] Completing matrix with shape (4898, 165)
[IterativeImputer] Ending imputation round 1/10, elapsed time 8.25
[I

### Ergebnisse abspeichern

In [15]:
t1 = time.time()
t = t1-t0
print(f'complete runtime: {t/60}min')

complete runtime: 0.29942274490992227min


In [16]:
sets = {'r1':r1, 'r1_detail':r1_detail,
       'r2':r2, 'r2_detail':r2_detail,
       'r3':r3, 'r3_detail':r3_detail,}
for name, df in sets.items():
    df.to_csv(f'additional_data/results/{name}.csv')