In [119]:
import matplotlib.pyplot as plt
%matplotlib inline
import numpy as np
import os
import pandas as pd
import re
import requests
import seaborn as sns
import time
import descartes
import geopandas as gpd

from arcgis.geocoding import geocode
from arcgis.gis import GIS
from dotenv import load_dotenv
from functools import reduce
from shapely.geometry import Point, Polygon
from sklearn.decomposition import PCA
from sklearn.ensemble import RandomForestClassifier, RandomForestRegressor
from sklearn.model_selection import GridSearchCV
from sklearn.metrics import confusion_matrix
from sklearn.model_selection import train_test_split, TimeSeriesSplit
from sklearn.preprocessing import StandardScaler, LabelEncoder, RobustScaler
from sklearn.svm import SVC, SVR
from sklearn.tree import DecisionTreeRegressor
from textwrap import wrap
from xgboost import XGBClassifier, XGBRegressor, plot_importance
from yellowbrick.classifier import ROCAUC, ConfusionMatrix

plt.style.use("ggplot")
sns.set_context("talk")

In [2]:
load_dotenv("")
censuskey = os.getenv("censuskey")

In [207]:
var_description = pd.DataFrame(pd.DataFrame(
    requests.get("https://api.census.gov/data/2016/acs/acs5/profile/variables.json")
                                            .json()["variables"])
                               .T.iloc[:, 3]
                               .str.title()
                               .str.split("!!", expand=True)
                              ).sort_index()

In [208]:
var_description.columns=["unit", 
                         "subject",
                         "denominator",
                         "criteria_1",
                         "criteria_2",
                         "criteria_3",
                         "criteria_4"
                        ]

In [213]:
var_description

Unnamed: 0,unit,subject,denominator,criteria_1,criteria_2,criteria_3,criteria_4
AIANHH,American Indian Area/Alaska Native Area/Hawaii...,,,,,,
AIHHTLI,American Indian Area (Off-Reservation Trust La...,,,,,,
AITSCE,American Indian Tribal Subdivision (Census),,,,,,
ANRC,Alaska Native Regional Corporation,,,,,,
CBSA,Metropolitan Statistical Area/Micropolitan Sta...,,,,,,
CD115,Congressional District (115Th),,,,,,
CNECTA,Combined New England City And Town Area,,,,,,
CONCIT,Consolidated City,,,,,,
COUNTY,County (Fips),,,,,,
COUSUB,County Subdivision (Fips),,,,,,


In [210]:
var_description.to_csv("../data/var_description.csv")

In [211]:
variables_selected = var_description.loc[((~var_description.index.str.contains(r'DP')|
                                           (var_description.index.str.contains(r'DP')&
                                            var_description.index.str.contains(r'[0-9]PE')))&
                                          ~var_description.index.str.contains(r'PR_'))
                                        ].sort_index()

In [109]:
len(variables_selected)

554

In [193]:
varlist_dict = {}
var_dict = {}
for year in range(2010, 2018):
    varlist_dict[year] = []
    k = 0
    for var in variables_selected.index:
        success = False
        l = 0
        while not success:
            l += 1
            resp = requests.get(
                "https://api.census.gov/data/{}/acs/acs5/profile?get={}&for=county:*&in=state:*&key={}"
                .format(year, var, censuskey))
            time.sleep(1)
            if resp.status_code ==200:
                varlist_dict[year].append(pd.DataFrame(resp.json()[1:], columns=resp.json()[0]))
                success = True
            elif l > 10:
                success = True
        k += 1
        
        if k%int(len(variables_selected)/10)==0:
            print("---progress: {:0.2f}% completed for {}---".format(
                k*10/int(len(variables_selected)/10), 
                year
            ))
    var_dict[year] = reduce(lambda left, right: pd.merge(left, 
                                                         right, 
                                                         how='outer'
                                                        ), varlist_dict[year])
    print(year, var_dict[year].shape)

---progress: 10.00% completed for 2010---
---progress: 20.00% completed for 2010---
---progress: 30.00% completed for 2010---
---progress: 40.00% completed for 2010---
---progress: 50.00% completed for 2010---
---progress: 60.00% completed for 2010---
---progress: 70.00% completed for 2010---
---progress: 80.00% completed for 2010---
---progress: 90.00% completed for 2010---
---progress: 100.00% completed for 2010---
2010 (3221, 544)
---progress: 10.00% completed for 2011---
---progress: 20.00% completed for 2011---
---progress: 30.00% completed for 2011---
---progress: 40.00% completed for 2011---
---progress: 50.00% completed for 2011---
---progress: 60.00% completed for 2011---
---progress: 70.00% completed for 2011---
---progress: 80.00% completed for 2011---
---progress: 90.00% completed for 2011---
---progress: 100.00% completed for 2011---
2011 (3221, 545)
---progress: 10.00% completed for 2012---
---progress: 20.00% completed for 2012---
---progress: 30.00% completed for 2012--

In [459]:
missing_varlist_dict = {}
missing_var_dict = {}
for year in range(2010, 2018):
    missing_col = []
    for col in var_dict[2016].columns:
        if col not in var_dict[2010].columns:
            missing_col.append(col)
    missing_varlist_dict[year] = []
    k = 0
    for var in missing_col:
        success = False
        l = 0
        while not success:
            l += 1
            resp = requests.get(
                "https://api.census.gov/data/{}/acs/acs5/profile?get={}&for=county:*&in=state:*&key={}"
                .format(year, var, censuskey))
#             time.sleep(1)
            if resp.status_code ==200:
                missing_varlist_dict[year].append(pd.DataFrame(resp.json()[1:], columns=resp.json()[0]))
                success = True
            elif l > 10:
                success = True
                print("no data for: ", year, var)
        k += 1

no data for:  2010 CD115
no data for:  2010 DP02_0150PE
no data for:  2010 DP02_0151PE
no data for:  2010 DP02_0152PE
no data for:  2010 DP04_0142PE
no data for:  2010 DP04_0143PE
no data for:  2010 DP05_0082PE
no data for:  2010 DP05_0083PE
no data for:  2010 DP05_0084PE
no data for:  2010 ZCTA5
no data for:  2011 CD115
no data for:  2011 DP02_0150PE
no data for:  2011 DP02_0151PE
no data for:  2011 DP02_0152PE
no data for:  2011 DP04_0142PE
no data for:  2011 DP04_0143PE
no data for:  2011 DP05_0082PE
no data for:  2011 DP05_0083PE
no data for:  2011 DP05_0084PE
no data for:  2012 CD115
no data for:  2012 DP02_0150PE
no data for:  2012 DP02_0151PE
no data for:  2012 DP02_0152PE
no data for:  2012 DP04_0142PE
no data for:  2012 DP04_0143PE
no data for:  2012 DP05_0082PE
no data for:  2012 DP05_0083PE
no data for:  2012 DP05_0084PE
no data for:  2013 CD115
no data for:  2013 DP04_0142PE
no data for:  2013 DP04_0143PE
no data for:  2013 DP05_0082PE
no data for:  2013 DP05_0083PE
no data

In [467]:
for year in range(2010, 2018):
    var_dict[year] = var_dict[year].apply(pd.to_numeric, errors='coerce')
    var_dict[year] = var_dict[year].loc[var_dict[year].state!=72]
    var_dict[year]["FIPS"] = var_dict[year].state * 1000 + var_dict[year].county
    var_dict[year].to_csv("../data/census_{}.csv".format(year))

In [265]:
pd.options.display.float_format = '{:,.2f}'.format

In [466]:
var_dict[2016].head()

Unnamed: 0,AIANHH,state,county,AIHHTLI,AITSCE,ANRC,CBSA,CD115,CNECTA,CONCIT,COUNTY,COUSUB,CSA,DIVISION,DP02_0001PE,DP02_0002PE,DP02_0003PE,DP02_0004PE,DP02_0005PE,DP02_0006PE,DP02_0007PE,DP02_0008PE,DP02_0009PE,DP02_0010PE,DP02_0011PE,DP02_0012PE,DP02_0013PE,DP02_0014PE,DP02_0015PE,DP02_0016PE,DP02_0017PE,DP02_0018PE,DP02_0019PE,DP02_0020PE,DP02_0021PE,DP02_0022PE,DP02_0023PE,DP02_0024PE,DP02_0025PE,DP02_0026PE,DP02_0027PE,DP02_0028PE,DP02_0029PE,DP02_0030PE,DP02_0031PE,DP02_0032PE,DP02_0033PE,DP02_0034PE,DP02_0035PE,DP02_0036PE,DP02_0037PE,DP02_0038PE,DP02_0039PE,DP02_0040PE,DP02_0041PE,DP02_0042PE,DP02_0043PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0049PE,DP02_0050PE,DP02_0051PE,DP02_0052PE,DP02_0053PE,DP02_0054PE,DP02_0055PE,DP02_0056PE,DP02_0057PE,DP02_0058PE,DP02_0059PE,DP02_0060PE,DP02_0061PE,DP02_0062PE,DP02_0063PE,DP02_0064PE,DP02_0065PE,DP02_0066PE,DP02_0067PE,DP02_0068PE,DP02_0069PE,DP02_0070PE,DP02_0071PE,DP02_0072PE,DP02_0073PE,DP02_0074PE,DP02_0075PE,DP02_0076PE,DP02_0077PE,DP02_0078PE,DP02_0079PE,DP02_0080PE,DP02_0081PE,DP02_0082PE,DP02_0083PE,DP02_0084PE,DP02_0085PE,DP02_0086PE,DP02_0087PE,DP02_0088PE,DP02_0089PE,DP02_0090PE,DP02_0091PE,DP02_0092PE,DP02_0093PE,DP02_0094PE,DP02_0095PE,DP02_0096PE,DP02_0097PE,DP02_0098PE,DP02_0099PE,DP02_0100PE,DP02_0101PE,DP02_0102PE,DP02_0103PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP02_0110PE,DP02_0111PE,DP02_0112PE,DP02_0113PE,DP02_0114PE,DP02_0115PE,DP02_0116PE,DP02_0117PE,DP02_0118PE,DP02_0119PE,DP02_0120PE,DP02_0121PE,DP02_0122PE,DP02_0123PE,DP02_0124PE,DP02_0125PE,DP02_0126PE,DP02_0127PE,DP02_0128PE,DP02_0129PE,DP02_0130PE,DP02_0131PE,DP02_0132PE,DP02_0133PE,DP02_0134PE,DP02_0135PE,DP02_0136PE,DP02_0137PE,DP02_0138PE,DP02_0139PE,DP02_0140PE,DP02_0141PE,DP02_0142PE,DP02_0143PE,DP02_0144PE,DP02_0145PE,DP02_0146PE,DP02_0147PE,DP02_0148PE,DP02_0149PE,DP02_0150PE,DP02_0151PE,DP02_0152PE,DP03_0001PE,DP03_0002PE,DP03_0003PE,DP03_0004PE,DP03_0005PE,DP03_0006PE,DP03_0007PE,DP03_0008PE,DP03_0009PE,DP03_0010PE,DP03_0011PE,DP03_0012PE,DP03_0013PE,DP03_0014PE,DP03_0015PE,DP03_0016PE,DP03_0017PE,DP03_0018PE,DP03_0019PE,DP03_0020PE,DP03_0021PE,DP03_0022PE,DP03_0023PE,DP03_0024PE,DP03_0025PE,DP03_0026PE,DP03_0027PE,DP03_0028PE,DP03_0029PE,DP03_0030PE,DP03_0031PE,DP03_0032PE,DP03_0033PE,DP03_0034PE,DP03_0035PE,DP03_0036PE,DP03_0037PE,DP03_0038PE,DP03_0039PE,DP03_0040PE,DP03_0041PE,DP03_0042PE,DP03_0043PE,DP03_0044PE,DP03_0045PE,DP03_0046PE,DP03_0047PE,DP03_0048PE,DP03_0049PE,DP03_0050PE,DP03_0051PE,DP03_0052PE,DP03_0053PE,DP03_0054PE,DP03_0055PE,DP03_0056PE,DP03_0057PE,DP03_0058PE,DP03_0059PE,DP03_0060PE,DP03_0061PE,DP03_0062PE,DP03_0063PE,DP03_0064PE,DP03_0065PE,DP03_0066PE,DP03_0067PE,DP03_0068PE,DP03_0069PE,DP03_0070PE,DP03_0071PE,DP03_0072PE,DP03_0073PE,DP03_0074PE,DP03_0075PE,DP03_0076PE,DP03_0077PE,DP03_0078PE,DP03_0079PE,DP03_0080PE,DP03_0081PE,DP03_0082PE,DP03_0083PE,DP03_0084PE,DP03_0085PE,DP03_0086PE,DP03_0087PE,DP03_0088PE,DP03_0089PE,DP03_0090PE,DP03_0091PE,DP03_0092PE,DP03_0093PE,DP03_0094PE,DP03_0095PE,DP03_0096PE,DP03_0097PE,DP03_0098PE,DP03_0099PE,DP03_0100PE,DP03_0101PE,DP03_0102PE,DP03_0103PE,DP03_0104PE,DP03_0105PE,DP03_0106PE,DP03_0107PE,DP03_0108PE,DP03_0109PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0114PE,DP03_0115PE,DP03_0116PE,DP03_0117PE,DP03_0118PE,DP03_0119PE,DP03_0120PE,DP03_0121PE,DP03_0122PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0128PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP03_0133PE,DP03_0134PE,DP03_0135PE,DP03_0136PE,DP03_0137PE,DP04_0001PE,DP04_0002PE,DP04_0003PE,DP04_0004PE,DP04_0005PE,DP04_0006PE,DP04_0007PE,DP04_0008PE,DP04_0009PE,DP04_0010PE,DP04_0011PE,DP04_0012PE,DP04_0013PE,DP04_0014PE,DP04_0015PE,DP04_0016PE,DP04_0017PE,DP04_0018PE,DP04_0019PE,DP04_0020PE,DP04_0021PE,DP04_0022PE,DP04_0023PE,DP04_0024PE,DP04_0025PE,DP04_0026PE,DP04_0027PE,DP04_0028PE,DP04_0029PE,DP04_0030PE,DP04_0031PE,DP04_0032PE,DP04_0033PE,DP04_0034PE,DP04_0035PE,DP04_0036PE,DP04_0037PE,DP04_0038PE,DP04_0039PE,DP04_0040PE,DP04_0041PE,DP04_0042PE,DP04_0043PE,DP04_0044PE,DP04_0045PE,DP04_0046PE,DP04_0047PE,DP04_0048PE,DP04_0049PE,DP04_0050PE,DP04_0051PE,DP04_0052PE,DP04_0053PE,DP04_0054PE,DP04_0055PE,DP04_0056PE,DP04_0057PE,DP04_0058PE,DP04_0059PE,DP04_0060PE,DP04_0061PE,DP04_0062PE,DP04_0063PE,DP04_0064PE,DP04_0065PE,DP04_0066PE,DP04_0067PE,DP04_0068PE,DP04_0069PE,DP04_0070PE,DP04_0071PE,DP04_0072PE,DP04_0073PE,DP04_0074PE,DP04_0075PE,DP04_0076PE,DP04_0077PE,DP04_0078PE,DP04_0079PE,DP04_0080PE,DP04_0081PE,DP04_0082PE,DP04_0083PE,DP04_0084PE,DP04_0085PE,DP04_0086PE,DP04_0087PE,DP04_0088PE,DP04_0089PE,DP04_0090PE,DP04_0091PE,DP04_0092PE,DP04_0093PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0101PE,DP04_0102PE,DP04_0103PE,DP04_0104PE,DP04_0105PE,DP04_0106PE,DP04_0107PE,DP04_0108PE,DP04_0109PE,DP04_0110PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE,DP04_0116PE,DP04_0117PE,DP04_0118PE,DP04_0119PE,DP04_0120PE,DP04_0121PE,DP04_0122PE,DP04_0123PE,DP04_0124PE,DP04_0125PE,DP04_0126PE,DP04_0127PE,DP04_0128PE,DP04_0129PE,DP04_0130PE,DP04_0131PE,DP04_0132PE,DP04_0133PE,DP04_0134PE,DP04_0135PE,DP04_0136PE,DP04_0137PE,DP04_0138PE,DP04_0139PE,DP04_0140PE,DP04_0141PE,DP04_0142PE,DP04_0143PE,DP05_0001PE,DP05_0002PE,DP05_0003PE,DP05_0004PE,DP05_0005PE,DP05_0006PE,DP05_0007PE,DP05_0008PE,DP05_0009PE,DP05_0010PE,DP05_0011PE,DP05_0012PE,DP05_0013PE,DP05_0014PE,DP05_0015PE,DP05_0016PE,DP05_0017PE,DP05_0018PE,DP05_0019PE,DP05_0020PE,DP05_0021PE,DP05_0022PE,DP05_0023PE,DP05_0024PE,DP05_0025PE,DP05_0026PE,DP05_0027PE,DP05_0028PE,DP05_0029PE,DP05_0030PE,DP05_0031PE,DP05_0032PE,DP05_0033PE,DP05_0034PE,DP05_0035PE,DP05_0036PE,DP05_0037PE,DP05_0038PE,DP05_0039PE,DP05_0040PE,DP05_0041PE,DP05_0042PE,DP05_0043PE,DP05_0044PE,DP05_0045PE,DP05_0046PE,DP05_0047PE,DP05_0048PE,DP05_0049PE,DP05_0050PE,DP05_0051PE,DP05_0052PE,DP05_0053PE,DP05_0054PE,DP05_0055PE,DP05_0056PE,DP05_0057PE,DP05_0058PE,DP05_0059PE,DP05_0060PE,DP05_0061PE,DP05_0062PE,DP05_0063PE,DP05_0064PE,DP05_0065PE,DP05_0066PE,DP05_0067PE,DP05_0068PE,DP05_0069PE,DP05_0070PE,DP05_0071PE,DP05_0072PE,DP05_0073PE,DP05_0074PE,DP05_0075PE,DP05_0076PE,DP05_0077PE,DP05_0078PE,DP05_0079PE,DP05_0080PE,DP05_0081PE,DP05_0082PE,DP05_0083PE,DP05_0084PE,GEOCOMP,GEOVARIANT,GEO_ID,LSAD_NAME,METDIV,NAME,NECTA,NECTADIV,PLACE,PUMA5,REGION,SDELM,SDSEC,SDUNI,SLDL,SLDU,STATE,SUBMCD,SUMLEVEL,TRACT,TTRACT,UA,US,ZCTA5
0,,5,27,,,,31620,,,,27,,999,7,9518.0,67.4,28.8,47.0,17.1,3.8,2.1,16.5,9.6,32.6,27.1,13.1,32.7,29.9,,,22479.0,42.3,19.8,27.6,4.7,5.5,1.7,9316.0,36.7,50.7,1.0,3.9,7.7,10581.0,29.3,44.0,3.3,11.3,12.0,443.0,43.1,,,,,,481.0,80.0,22.0,8.1,15.4,34.5,385.0,69.1,66.8,6937.0,6.5,5.2,28.4,18.3,41.5,15040.0,5.0,9.8,39.2,18.9,5.1,14.9,7.0,85.2,21.9,18989.0,7.8,23748.0,18.5,5092.0,4.7,14900.0,14.5,3756.0,53.2,23772.0,83.3,16.7,9.3,7.4,4.8,2.6,0.1,24168.0,97.4,97.2,69.6,27.5,0.2,2.6,639.0,21.3,78.7,681.0,42.0,4.8,95.2,639.0,29.0,71.0,639.0,7.5,34.0,3.6,0.0,54.9,0.0,22705.0,95.6,4.4,1.5,2.9,1.0,0.7,0.0,0.7,0.5,0.1,0.0,24168.0,13.6,0.0,0.2,0.0,0.9,7.4,1.5,0.1,5.1,0.1,0.1,9.3,1.0,0.0,0.2,0.2,0.0,0.3,1.3,1.0,0.0,0.5,0.1,0.1,0.0,0.4,0.0,,,,19617,57.1,57.1,51.8,5.3,0.0,42.9,11209,9.3,10466,51.4,51.4,47.6,1623,72.8,2989,62.5,9930,86.7,6.1,0.1,4.2,0.7,2.2,,10165,29.4,16.0,25.1,10.3,19.2,10165,6.2,3.8,20.2,2.5,12.6,3.4,0.4,3.2,3.9,28.2,7.9,4.0,3.5,10165,75.4,20.1,4.3,0.1,9518,12.9,10.4,14.2,10.7,12.7,16.6,10.1,9.9,1.4,1.0,,,69.7,,39.9,,17.2,,7.4,,1.7,,18.2,6411,9.0,5.2,11.0,9.2,14.0,21.3,12.3,14.2,2.1,1.5,,,,3107,,,,,,23748,88.4,60.3,39.8,11.6,5092,2.1,14900,10514,9567,84.8,79.7,7.4,15.2,947,58.3,27.7,31.4,41.7,4386,82.3,47.2,41.4,17.7,19.4,31.5,27.3,10.6,15.2,12.0,40.0,53.1,40.8,24.9,36.5,35.9,35.8,35.9,21.7,23.4,15.7,21.2,41.1,11578,82.2,17.8,,,11578,67.1,0.8,1.4,2.8,2.2,3.2,2.7,19.9,0.0,11578,0.0,1.2,12.8,15.3,14.8,17.7,12.5,14.1,5.2,6.4,11578,3.2,1.3,6.3,16.8,25.4,21.2,13.9,6.1,5.9,,11578,3.4,5.7,29.9,46.9,12.3,1.8,9518,66.1,33.9,,,9518,4.3,30.6,31.9,13.1,7.6,12.5,9518,6.4,37.3,33.5,22.9,9518,41.4,5.3,50.1,0.3,0.0,2.8,0.0,0.0,0.1,9518,0.2,0.4,2.4,9518,98.0,0.8,1.2,6296,29.5,30.9,10.8,11.1,13.3,3.0,1.4,0.0,,6296,48.2,51.8,3035,7.7,57.5,21.2,6.6,3.9,0.3,2.8,,3261,31.5,38.3,24.8,3.3,1.4,0.6,,3034,55.1,16.0,4.9,5.6,18.5,,3243,47.3,16.4,10.0,10.1,4.3,3.3,8.5,,2486,31.1,64.7,2.4,1.2,0.0,0.6,0.0,,,2365,19.6,14.1,5.4,15.7,6.1,39.1,,24168,47.6,52.4,6.1,6.0,5.6,9.9,10.2,11.4,10.6,11.7,5.4,6.5,8.7,5.7,2.1,,78.6,70.2,20.6,16.6,18989,46.7,53.3,4002,42.1,57.9,24168,99.0,1.0,99.0,60.0,34.8,0.3,0.0,0.0,0.0,0.0,1.1,0.1,0.1,0.0,0.0,0.0,0.1,0.8,0.0,0.0,0.0,0.0,0.0,2.8,1.0,0.7,0.1,0.0,0.0,24168,60.8,35.8,0.4,1.1,0.0,3.0,24168,2.6,2.2,0.0,0.0,0.4,97.4,59.2,34.7,0.3,1.1,0.0,1.4,0.7,0.0,0.7,,18517,46.8,53.2,0,0,,,99999,,,,,,3,,,,,,5,,50,,,,,
1,,5,29,,,,99999,,,,29,,999,7,8360.0,66.9,26.4,49.1,15.6,4.8,3.4,13.0,7.4,33.1,29.7,13.1,29.3,32.4,,,20796.0,40.2,19.8,28.3,7.6,4.1,1.7,8303.0,25.8,57.1,1.8,3.7,11.5,8729.0,20.2,51.9,2.4,12.6,12.9,260.0,40.0,,,,,,620.0,34.8,8.1,7.1,1.0,18.7,216.0,58.3,77.8,4499.0,5.5,6.8,46.9,24.1,16.7,14516.0,5.0,10.0,42.3,19.3,6.4,11.3,5.6,85.0,16.9,16184.0,9.3,20904.0,20.9,4800.0,7.1,12305.0,19.1,3799.0,44.2,20891.0,88.9,11.0,6.6,4.4,3.2,1.2,0.1,21060.0,98.0,97.5,75.2,22.3,0.5,2.0,431.0,26.5,73.5,532.0,101.0,9.9,90.1,431.0,5.6,94.4,431.0,11.6,2.6,0.9,0.0,83.3,1.6,19792.0,96.2,3.8,1.9,3.2,1.8,0.4,0.0,0.1,0.1,0.0,0.0,21060.0,24.2,0.0,0.0,0.0,0.9,5.8,4.0,0.3,12.3,0.2,0.5,9.4,2.8,0.0,0.2,0.9,0.3,0.1,1.1,1.8,0.0,0.9,0.1,0.9,0.1,0.3,0.0,,,,16627,54.2,54.1,50.2,3.9,0.1,45.8,8992,7.2,8554,49.7,49.6,45.7,1451,55.1,3044,69.0,8222,83.3,10.7,0.8,1.3,1.2,2.7,,8342,28.8,14.7,23.1,17.7,15.7,8342,8.4,8.4,11.9,2.7,11.4,6.7,1.5,6.5,5.7,23.3,6.1,3.4,3.9,8342,77.3,16.1,6.4,0.1,8360,10.9,9.3,14.9,11.8,12.8,17.5,10.0,8.4,1.9,2.4,,,66.9,,41.6,,19.8,,9.9,,2.3,,17.1,5594,5.0,5.7,13.7,10.9,14.0,22.2,11.2,11.4,2.6,3.5,,,,2766,,,,,,20904,89.1,58.0,44.0,10.9,4800,3.9,12305,8565,7961,86.7,79.7,9.2,13.3,604,47.2,20.9,27.8,52.8,3740,81.0,38.6,51.4,19.0,15.7,28.7,35.9,8.8,18.4,16.8,38.9,51.6,85.5,21.5,33.6,32.9,31.6,33.4,18.0,19.7,12.5,17.9,38.5,9733,85.9,14.1,,,9733,75.0,0.3,4.3,1.2,1.4,0.0,1.5,15.8,0.4,9733,0.3,2.4,15.7,13.6,18.3,19.4,10.6,8.5,4.0,7.1,9733,2.4,0.9,4.7,12.2,35.2,21.1,11.6,5.6,6.2,,9733,2.6,5.1,23.1,60.0,7.8,1.3,8360,72.6,27.4,,,8360,3.3,28.4,31.9,14.3,9.2,12.8,8360,6.6,31.4,40.3,21.7,8360,25.8,6.7,59.1,0.2,0.0,6.1,0.0,1.8,0.4,8360,0.1,0.4,2.2,8360,97.2,2.4,0.4,6069,17.8,32.1,19.7,14.0,11.0,3.3,1.9,0.2,,6069,51.7,48.3,3140,6.1,56.4,28.5,6.9,1.0,0.6,0.5,,2929,30.3,43.7,19.4,5.1,1.3,0.2,,3140,46.2,10.2,7.5,11.8,24.3,,2908,54.4,16.4,12.0,5.8,2.4,1.4,7.6,,1804,34.7,60.3,5.0,0.0,0.0,0.0,0.0,,,1762,16.3,10.6,3.7,11.7,7.5,50.1,,21060,48.9,51.1,6.0,6.9,6.2,6.0,5.9,11.7,11.5,13.8,7.1,6.4,10.3,5.4,2.7,,76.9,73.4,22.0,18.3,16198,48.6,51.4,3864,45.2,54.8,21060,97.9,2.1,97.9,85.3,11.8,0.5,0.3,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.0,0.1,0.0,0.0,0.0,0.0,0.0,0.2,2.1,0.6,1.0,0.1,0.0,21060,87.3,12.7,1.8,0.2,0.1,0.2,21060,3.8,3.2,0.0,0.0,0.6,96.2,81.8,11.8,0.5,0.1,0.0,0.0,2.1,0.0,2.1,,15889,48.7,51.3,0,0,,,99999,,,,,,3,,,,,,5,,50,,,,,
2,,5,31,,,,27860,,,,31,,308,7,39042.0,66.4,30.2,45.3,17.4,6.3,4.1,14.7,8.7,33.6,26.6,9.0,34.7,23.5,,,99218.0,39.3,17.8,29.0,7.3,6.6,2.8,39084.0,33.0,49.9,1.6,2.3,13.2,42369.0,27.6,45.0,2.7,10.0,14.6,1219.0,37.0,,,,,,2440.0,57.9,19.3,16.2,7.5,15.0,1413.0,61.6,64.8,29537.0,7.4,6.3,37.4,16.2,32.7,65447.0,4.0,8.1,34.2,22.3,6.0,16.1,9.3,88.0,25.4,77277.0,7.6,101881.0,17.7,25555.0,9.2,63685.0,15.4,12641.0,46.3,101598.0,76.7,22.9,14.7,8.2,5.9,2.3,0.4,102884.0,96.2,95.8,68.6,27.2,0.4,3.8,3906.0,28.6,71.4,4337.0,431.0,0.0,100.0,3906.0,27.2,72.8,3906.0,6.0,28.5,5.4,2.1,53.3,4.7,95696.0,94.6,5.4,2.3,3.5,1.6,0.7,0.2,0.8,0.4,0.3,0.0,102884.0,16.8,0.1,0.0,0.1,0.7,6.6,1.7,0.3,9.5,0.1,0.0,10.5,2.0,0.0,0.3,0.7,0.1,0.3,1.1,1.6,0.1,0.7,0.3,0.0,0.1,0.4,0.1,,,,80053,62.7,62.7,58.7,4.0,0.1,37.3,50177,6.3,41780,56.6,56.6,52.8,8135,74.8,15552,69.6,46201,82.6,10.4,0.3,2.1,1.1,3.5,,46995,33.4,16.2,23.6,10.1,16.7,46995,2.1,7.2,14.3,2.3,13.2,4.4,1.7,5.0,5.9,28.0,9.1,4.3,2.4,46995,79.3,13.8,6.8,0.1,39042,8.3,6.7,13.5,11.5,16.0,18.1,10.8,9.2,3.1,2.8,,,78.5,,29.8,,17.7,,7.8,,1.9,,15.6,25935,4.8,3.3,10.8,10.9,16.5,19.7,13.7,12.4,4.0,3.9,,,,13107,,,,,,101881,86.4,58.0,39.5,13.6,25555,4.9,63685,47343,44437,80.4,73.1,9.6,19.6,2906,57.4,24.9,34.7,42.6,16342,83.7,41.7,49.0,16.3,13.2,21.2,29.2,5.5,8.5,11.8,35.3,45.0,59.1,18.9,27.6,27.4,33.8,25.0,16.0,17.8,7.5,15.7,32.2,43278,90.2,9.8,,,43278,69.5,1.3,3.4,6.7,4.4,4.9,3.6,6.2,0.0,43278,1.3,7.3,19.2,20.5,13.6,17.7,8.8,5.4,2.3,3.9,43278,1.1,2.2,9.6,16.1,22.2,19.3,12.8,8.3,8.3,,43278,1.2,8.2,27.0,49.2,12.0,2.3,39042,58.9,41.1,,,39042,5.8,41.9,29.3,12.5,4.7,5.8,39042,7.4,33.5,41.1,17.9,39042,39.3,5.4,53.7,0.0,0.0,1.2,0.0,0.2,0.2,39042,0.1,1.1,2.7,39042,97.6,1.9,0.5,23001,11.3,23.9,24.1,17.7,13.1,6.4,2.2,1.3,,23001,63.0,37.0,14485,3.4,46.1,27.5,13.4,5.3,2.2,2.2,,8516,28.8,39.6,22.5,7.0,1.3,0.8,,14434,59.2,14.8,8.5,4.9,12.6,,8441,53.3,19.1,9.6,5.7,3.2,1.7,7.4,,14902,18.0,67.4,12.0,2.2,0.4,0.1,0.1,,,14578,12.9,14.3,13.9,11.1,8.5,39.3,,102884,48.7,51.3,7.0,7.8,6.1,7.3,8.2,15.0,12.8,12.0,5.5,5.4,7.5,3.7,1.7,,75.2,70.3,16.2,12.8,77320,47.8,52.2,13216,42.2,57.8,102884,98.1,1.9,98.1,80.8,13.8,0.6,0.1,0.0,0.0,0.0,1.2,0.2,0.4,0.2,0.1,0.1,0.1,0.2,0.1,0.0,0.0,0.0,0.1,1.6,1.9,1.0,0.4,0.1,0.2,102884,82.5,15.1,1.3,1.3,0.1,1.7,102884,4.7,3.8,0.1,0.0,0.8,95.3,78.0,13.8,0.3,1.2,0.1,0.1,1.9,0.1,1.8,,74820,47.7,52.3,0,0,,,99999,,,,,,3,,,,,,5,,50,,,,,
3,,5,33,,,,22900,,,,33,,999,7,23548.0,75.5,30.0,58.1,20.9,4.8,2.4,12.7,6.6,24.5,21.5,9.2,36.3,27.8,,,61319.0,38.4,22.3,29.4,6.6,3.3,1.6,24037.0,24.5,60.8,1.8,1.9,11.1,25134.0,17.5,56.7,1.5,11.3,13.0,740.0,41.4,,,,,,2407.0,65.4,9.0,7.0,15.2,34.3,1575.0,58.0,70.9,15492.0,7.0,5.5,46.4,24.0,17.2,41418.0,5.4,9.3,40.0,23.7,8.1,9.4,4.1,85.3,13.5,46375.0,10.4,61391.0,18.8,15541.0,6.0,36689.0,17.9,9161.0,43.8,61200.0,86.0,13.9,8.1,5.8,3.4,2.3,0.1,61927.0,95.8,95.2,64.5,30.7,0.6,4.2,2604.0,39.5,60.5,2975.0,371.0,0.0,100.0,2604.0,12.3,87.7,2604.0,6.0,25.4,1.2,0.0,63.9,3.5,58143.0,92.8,7.2,3.6,5.5,2.8,0.4,0.2,1.2,0.7,0.0,0.0,61927.0,13.5,0.1,0.2,0.1,1.8,16.5,2.1,0.2,12.0,0.0,0.1,12.6,1.0,0.1,0.5,0.4,0.1,0.2,1.0,1.8,0.0,0.1,0.4,0.1,0.0,0.3,0.2,,,,48102,57.1,57.1,53.0,4.0,0.0,42.9,27453,7.1,24614,51.7,51.7,48.7,4256,61.0,10140,63.3,25208,86.5,9.2,0.2,1.8,0.4,2.0,,25513,28.5,17.0,24.4,11.5,18.7,25513,2.3,7.4,16.7,2.9,12.2,6.0,1.1,5.1,6.3,23.9,6.9,4.7,4.3,25513,81.1,14.5,4.3,0.1,23548,8.7,6.1,13.9,12.8,17.6,19.4,10.3,8.1,1.5,1.6,,,72.2,,37.7,,17.2,,7.1,,2.6,,14.9,17788,6.7,3.4,10.9,11.5,18.9,22.0,12.6,10.0,2.0,2.0,,,,5760,,,,,,61391,87.2,57.0,41.5,12.8,15541,7.0,36689,25664,23839,83.9,77.0,10.6,16.1,1825,46.8,33.4,16.1,53.2,11025,82.9,38.3,54.3,17.1,14.7,23.6,20.6,8.7,14.5,10.0,38.3,49.0,46.7,18.8,27.3,27.1,24.6,27.9,15.9,17.0,11.7,16.6,33.8,26430,89.1,10.9,,,26430,76.5,1.4,2.9,2.3,2.1,1.8,1.0,11.9,0.0,26430,0.6,4.0,17.4,23.5,17.7,15.5,7.9,5.9,3.6,3.9,26430,1.7,1.3,4.2,12.9,30.9,22.6,13.8,6.5,6.1,,26430,1.8,5.3,23.8,55.4,11.9,1.7,23548,76.4,23.6,,,23548,3.9,27.7,35.0,18.2,8.1,7.2,23548,3.9,33.1,41.1,22.0,23548,35.4,3.9,53.1,0.2,0.1,5.9,0.0,0.7,0.7,23548,0.2,0.7,2.9,23548,96.2,2.8,1.0,17991,13.7,31.0,24.2,16.6,10.4,3.4,0.7,0.0,,17991,56.4,43.6,10151,4.8,51.8,31.3,7.8,2.5,0.5,1.3,,7840,32.7,36.9,24.8,3.8,1.4,0.3,,10067,48.0,15.2,10.6,5.8,20.4,,7640,46.4,21.9,14.6,5.7,3.2,1.9,6.3,,5018,23.9,70.6,4.5,0.2,0.8,0.0,0.0,,,4887,13.2,14.6,15.6,12.2,8.2,36.2,,61927,49.2,50.8,6.1,6.9,7.6,6.7,5.9,12.1,12.9,13.8,6.9,5.9,9.2,4.5,1.6,,74.9,71.7,18.9,15.3,46377,48.6,51.4,9491,44.6,55.4,61927,96.9,3.1,96.9,90.2,1.3,2.0,1.0,0.0,0.0,0.3,1.8,0.0,0.0,0.5,0.0,0.1,0.3,0.9,0.0,0.0,0.0,0.0,0.0,1.5,3.1,0.5,2.4,0.1,0.0,61927,93.3,1.9,4.5,1.9,0.1,1.6,61927,7.0,4.5,0.3,0.0,2.2,93.0,85.5,1.3,1.4,1.7,0.0,0.0,3.0,0.0,3.0,,45049,48.9,51.1,0,0,,,99999,,,,,,3,,,,,,5,,50,,,,,
4,,5,35,,,,32820,,,,35,,368,7,18496.0,66.4,31.6,38.7,15.1,4.2,2.1,23.6,14.4,33.6,27.8,9.8,37.0,24.4,,,48797.0,37.9,14.7,33.9,8.9,4.6,2.4,17603.0,37.2,44.1,3.5,3.1,12.1,20340.0,33.0,37.7,5.4,10.1,13.8,1050.0,60.5,,,,,,1439.0,56.3,9.9,9.7,6.0,30.8,810.0,64.1,73.1,13631.0,7.2,6.7,45.7,21.0,19.5,31056.0,6.1,12.2,35.6,22.3,6.5,11.9,5.5,81.8,17.4,35621.0,8.1,48967.0,17.5,13890.0,6.7,29272.0,16.6,5805.0,48.3,48572.0,84.3,15.4,11.0,4.4,1.7,2.8,0.3,49511.0,98.5,98.0,54.8,43.2,0.5,1.5,763.0,29.6,70.4,1005.0,242.0,0.0,100.0,763.0,11.4,88.6,763.0,13.5,33.8,3.8,2.9,44.6,1.4,45676.0,97.2,2.8,1.2,1.8,0.8,0.3,0.2,0.5,0.2,0.2,0.0,49511.0,7.0,0.3,0.1,0.0,1.6,4.6,0.8,0.1,4.2,0.0,0.2,5.8,1.2,0.0,0.0,0.4,0.0,0.0,0.9,0.9,0.0,0.5,0.3,0.1,0.0,0.1,0.0,,,,37083,60.5,60.5,55.0,5.5,0.0,39.5,22429,9.1,19975,56.2,56.2,50.3,4418,68.3,8593,73.0,19914,81.8,11.0,0.3,1.9,2.4,2.6,,20381,30.9,17.2,24.2,9.8,17.9,20381,3.4,3.4,11.4,4.0,11.8,9.9,1.6,4.0,6.3,26.2,8.6,4.6,4.6,20381,76.2,17.8,5.6,0.4,18496,10.1,6.9,16.4,13.0,11.9,18.5,9.7,9.0,2.6,1.7,,,75.2,,30.0,,15.1,,8.3,,1.9,,23.5,12288,7.0,4.9,14.0,12.9,11.7,19.9,12.3,11.4,3.7,2.3,,,,6208,,,,,,48967,88.5,53.3,43.5,11.5,13890,5.0,29272,21124,19195,86.2,77.0,11.7,13.8,1929,65.6,29.0,39.0,34.4,8148,80.5,31.1,54.2,19.5,19.0,27.7,24.1,5.1,7.0,8.4,41.3,49.4,48.8,24.6,37.0,36.9,45.0,33.8,19.7,20.6,15.2,22.8,33.2,21607,85.6,14.4,,,21607,69.0,1.1,3.1,5.5,8.0,2.9,1.3,9.0,0.2,21607,0.3,1.7,17.7,15.8,15.8,18.8,13.1,8.6,4.8,3.4,21607,1.3,1.6,6.2,19.2,27.3,18.9,12.7,7.2,5.5,,21607,1.4,6.2,27.1,50.6,12.8,1.8,18496,57.1,42.9,,,18496,6.2,33.6,33.6,13.6,5.3,7.7,18496,10.8,39.7,31.6,17.8,18496,47.5,5.7,45.5,0.3,0.0,0.6,0.0,0.4,0.2,18496,0.5,0.7,3.5,18496,95.9,3.0,1.0,10565,17.7,31.0,21.7,14.3,11.2,3.5,0.5,0.1,,10565,64.3,35.7,6789,2.4,45.7,33.9,12.2,3.5,1.9,0.4,,3776,26.4,37.3,26.9,6.7,1.9,0.8,,6725,50.8,16.7,8.2,5.1,19.2,,3741,45.5,21.5,12.3,6.0,4.5,2.3,7.9,,7282,21.0,65.8,11.7,1.3,0.2,0.0,0.0,,,6984,14.8,11.2,10.6,8.9,10.1,44.5,,49511,47.2,52.8,7.7,8.0,7.6,7.2,6.7,13.1,12.1,13.3,5.8,6.1,7.3,3.8,1.1,,71.9,67.9,15.5,12.2,35621,46.0,54.0,6054,42.1,57.9,49511,97.3,2.7,97.3,45.1,50.7,0.2,0.1,0.0,0.0,0.0,0.7,0.1,0.1,0.2,0.0,0.1,0.1,0.1,0.2,0.1,0.0,0.0,0.0,0.5,2.7,0.8,0.3,0.1,1.0,49511,46.8,52.8,1.7,0.8,0.2,0.7,49511,2.3,2.0,0.1,0.0,0.2,97.7,43.7,50.6,0.2,0.7,0.2,0.1,2.4,0.0,2.4,,35098,45.6,54.4,0,0,,,99999,,,,,,3,,,,,,5,,50,,,,,


In [266]:
var_dict[2016].loc[:,(var_dict[2016].max()>100)|(var_dict[2016].min()<0)].describe()

Unnamed: 0,county,CBSA,COUNTY,CSA,DP02_0001PE,DP02_0015PE,DP02_0016PE,DP02_0017PE,DP02_0024PE,DP02_0030PE,DP02_0036PE,DP02_0037PE,DP02_0038PE,DP02_0039PE,DP02_0040PE,DP02_0041PE,DP02_0042PE,DP02_0043PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0049PE,DP02_0050PE,DP02_0051PE,DP02_0052PE,DP02_0058PE,DP02_0068PE,DP02_0070PE,DP02_0072PE,DP02_0074PE,DP02_0076PE,DP02_0078PE,DP02_0086PE,DP02_0093PE,DP02_0094PE,DP02_0095PE,DP02_0096PE,DP02_0097PE,DP02_0098PE,DP02_0099PE,DP02_0100PE,DP02_0101PE,DP02_0102PE,DP02_0103PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP02_0110PE,DP02_0122PE,DP02_0150PE,DP02_0151PE,DP02_0152PE,DP03_0001PE,DP03_0008PE,DP03_0010PE,DP03_0014PE,DP03_0015PE,DP03_0016PE,DP03_0017PE,DP03_0018PE,DP03_0025PE,DP03_0026PE,DP03_0032PE,DP03_0046PE,DP03_0051PE,DP03_0062PE,DP03_0063PE,DP03_0065PE,DP03_0067PE,DP03_0069PE,DP03_0071PE,DP03_0073PE,DP03_0075PE,DP03_0086PE,DP03_0087PE,DP03_0088PE,DP03_0089PE,DP03_0090PE,DP03_0091PE,DP03_0092PE,DP03_0093PE,DP03_0094PE,DP03_0095PE,DP03_0100PE,DP03_0102PE,DP03_0103PE,DP03_0104PE,DP03_0109PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0114PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0001PE,DP04_0004PE,DP04_0005PE,DP04_0006PE,DP04_0016PE,DP04_0027PE,DP04_0037PE,DP04_0038PE,DP04_0045PE,DP04_0048PE,DP04_0049PE,DP04_0050PE,DP04_0057PE,DP04_0062PE,DP04_0072PE,DP04_0073PE,DP04_0075PE,DP04_0076PE,DP04_0080PE,DP04_0089PE,DP04_0090PE,DP04_0093PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0101PE,DP04_0102PE,DP04_0109PE,DP04_0110PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE,DP04_0116PE,DP04_0117PE,DP04_0125PE,DP04_0126PE,DP04_0134PE,DP04_0135PE,DP04_0136PE,DP04_0143PE,DP05_0001PE,DP05_0017PE,DP05_0022PE,DP05_0025PE,DP05_0028PE,DP05_0058PE,DP05_0065PE,DP05_0081PE,DP05_0082PE,METDIV
count,3220.0,3220.0,3220.0,3220.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0
mean,102.92,58578.5,102.92,745.8,37465.38,-888888888.0,-888888888.0,98816.98,39970.37,41989.63,-7071403.76,-9194390.41,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,2305.26,-3819174.82,-3819213.12,-3819212.64,-3819215.61,-3819203.72,842.15,-10821073.59,-10821061.09,26145.25,67997.82,77636.91,99801.44,23384.91,62134.32,14282.22,100195.17,101387.07,13429.14,-2758285.0,-2758271.47,14932.7,1503.57,-15913422.86,-15913341.37,13429.14,-2758313.92,-2758242.54,13428.96,-2758310.23,-2758303.93,-2758324.15,-2758326.93,-2758280.48,-2758322.85,95064.04,101387.07,-888888888.0,-888888888.0,-888888888.0,79561.29,50027.67,40808.38,7218.14,-414013.9,14747.47,-206968.87,45615.71,-888888888.0,46290.82,46290.82,46290.82,36942.05,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888923394.56,-890476189.59,-892788128.85,24371.63,-888888888.0,-888888888.0,-888888888.0,12570.43,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,98471.72,23056.56,61290.24,46920.81,43458.42,3462.39,-2070334.9,-2070359.0,-2070366.53,-2070352.16,14369.43,-207018.71,-1449252.35,-414068.6,-2277423.34,-207004.74,-414033.73,-17391252.31,-207015.63,-207016.03,-414051.52,-207017.38,42120.08,-888888888.0,-888888888.0,42120.08,42120.08,42120.08,-888888888.0,42120.08,36942.05,-888888888.0,-888888888.0,36942.05,36942.05,36942.05,36942.05,-21532090.46,-1104206.89,36942.05,23518.57,-888888888.0,23518.57,15018.93,-207035.16,-207001.46,-207007.95,-207024.86,-207033.2,-207036.54,-207036.23,-888888888.0,8499.65,-888888888.0,14939.64,-206992.9,-207024.29,-207029.23,-207032.51,-207017.78,-888888888.0,8376.22,-888888888.0,12680.87,-888888888.0,-888888888.0,12373.86,-888888888.0,100027.19,-888888888.0,76927.86,14532.57,100027.19,100027.19,100027.19,-888888888.0,70594.92,97678.22
std,106.69,35672.4,106.69,332.15,113832.97,0.0,0.0,319441.43,127433.69,134776.08,78985874.62,87288045.27,0.0,0.0,0.0,0.0,0.0,9158.39,50322647.21,50322644.3,50322644.33,50322644.11,50322645.01,2520.65,84257062.09,84257063.7,87045.17,217137.16,248705.83,322248.8,76312.93,206211.57,40978.85,321226.61,325201.74,90754.86,42800236.41,42800237.28,95769.58,6354.71,101779240.8,101779253.55,90754.86,42800234.54,42800239.14,90753.91,42800234.78,42800235.19,42800233.88,42800233.7,42800236.7,42800233.97,304066.02,325201.74,0.0,0.0,0.0,254974.56,165896.96,131173.38,24280.7,16612246.86,47973.55,11748457.51,149682.93,0.0,152507.44,152507.44,152507.44,112535.96,0.0,0.0,0.0,0.0,1958076.04,13187165.08,20449322.04,73679.7,0.0,0.0,0.0,39675.88,0.0,0.0,0.0,0.0,0.0,318523.91,75427.65,203820.46,157089.32,144557.64,12846.36,37099911.25,37099909.91,37099909.49,37099910.29,47139.31,11748456.63,31054512.37,16612245.5,38904650.98,11748456.88,16612246.37,106279137.47,11748456.69,11748456.68,16612245.93,11748456.66,123620.61,0.0,0.0,123620.61,123620.61,123620.61,0.0,123620.61,112535.96,0.0,0.0,112535.96,112535.96,112535.96,112535.96,136681408.31,31314614.53,112535.96,61868.49,0.0,61868.49,43033.03,11748456.34,11748456.94,11748456.82,11748456.52,11748456.38,11748456.32,11748456.32,0.0,19384.05,0.0,42780.44,11748457.09,11748456.53,11748456.45,11748456.39,11748456.65,0.0,19087.79,0.0,51640.81,0.0,0.0,50355.28,0.0,321446.48,0.0,246435.01,41470.99,321446.48,321446.48,321446.48,0.0,207704.9,12369.66
min,1.0,10100.0,1.0,104.0,37.0,-888888888.0,-888888888.0,76.0,37.0,33.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,0.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,0.0,-666666666.0,-666666666.0,4.0,67.0,70.0,76.0,1.0,51.0,16.0,76.0,76.0,0.0,-666666666.0,-666666666.0,0.0,0.0,-666666666.0,-666666666.0,0.0,-666666666.0,-666666666.0,0.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,76.0,76.0,-888888888.0,-888888888.0,-888888888.0,70.0,39.0,33.0,0.0,-666666666.0,0.0,-666666666.0,39.0,-888888888.0,39.0,39.0,39.0,37.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-999999999.0,-999999999.0,-999999999.0,13.0,-888888888.0,-888888888.0,-888888888.0,20.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,76.0,1.0,51.0,39.0,39.0,0.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,3.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,64.0,-888888888.0,-888888888.0,64.0,64.0,64.0,-888888888.0,64.0,37.0,-888888888.0,-888888888.0,37.0,37.0,37.0,37.0,-888888888.0,-888888888.0,37.0,2.0,-888888888.0,2.0,0.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-888888888.0,2.0,-888888888.0,0.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-888888888.0,2.0,-888888888.0,9.0,-888888888.0,-888888888.0,9.0,-888888888.0,76.0,-888888888.0,70.0,19.0,76.0,76.0,76.0,-888888888.0,61.0,11244.0
25%,35.0,27010.0,35.0,408.0,4220.25,-888888888.0,-888888888.0,10597.25,4525.0,4447.5,118.0,24.6,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,209.25,37.9,4.7,5.3,3.1,11.9,105.0,54.6,64.8,2431.75,7559.75,8474.5,10642.25,2462.0,6180.5,1923.25,10884.75,10996.5,176.0,30.1,45.4,229.0,41.0,0.0,87.5,176.0,5.7,81.0,176.0,6.4,9.33,0.0,0.0,24.5,0.2,10378.75,10996.5,-888888888.0,-888888888.0,-888888888.0,9009.0,4922.5,4450.25,729.0,58.5,1591.75,65.5,4437.5,-888888888.0,4519.5,4519.5,4519.5,4303.25,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,2863.75,-888888888.0,-888888888.0,-888888888.0,1402.75,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,10830.25,2498.75,6257.75,4533.75,4145.0,293.0,47.7,24.0,17.2,29.8,1682.0,13.5,13.3,5.2,2.0,26.98,35.5,36.7,15.6,15.1,17.5,13.9,5532.75,-888888888.0,-888888888.0,5532.75,5532.75,5532.75,-888888888.0,5532.75,4303.25,-888888888.0,-888888888.0,4303.25,4303.25,4303.25,4303.25,0.2,2.0,4303.25,3172.5,-888888888.0,3172.5,1442.75,1.7,27.0,27.1,9.3,2.7,0.7,0.6,-888888888.0,1641.25,-888888888.0,1425.75,40.6,13.3,8.5,5.5,16.8,-888888888.0,1624.25,-888888888.0,894.75,-888888888.0,-888888888.0,857.75,-888888888.0,11202.5,-888888888.0,8697.5,2046.25,11202.5,11202.5,11202.5,-888888888.0,8453.25,99999.0
50%,79.0,42960.0,79.0,999.0,9830.5,-888888888.0,-888888888.0,24710.5,10394.5,10531.0,294.5,35.6,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,559.5,47.65,8.5,9.0,6.3,18.2,284.0,60.15,73.7,5980.5,17663.5,19995.0,24939.0,5835.0,14846.0,4241.5,25390.0,25737.5,631.5,42.1,57.9,797.0,135.0,4.0,95.2,631.5,11.5,88.4,631.5,14.2,21.0,1.4,0.0,46.4,2.3,24275.5,25737.5,-888888888.0,-888888888.0,-888888888.0,20955.5,11454.5,10530.0,1762.5,65.7,3735.0,71.2,10404.0,-888888888.0,10602.5,10602.5,10602.5,9849.5,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,6649.0,-888888888.0,-888888888.0,-888888888.0,3115.5,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,25234.5,5897.0,15025.0,10670.0,9826.0,804.5,59.55,33.7,25.1,40.3,4145.0,19.1,20.9,8.4,6.1,34.2,44.7,51.9,22.2,21.8,25.5,20.3,12393.0,-888888888.0,-888888888.0,12393.0,12393.0,12393.0,-888888888.0,12393.0,9849.5,-888888888.0,-888888888.0,9849.5,9849.5,9849.5,9849.5,0.4,2.5,9849.5,7125.0,-888888888.0,7125.0,3587.0,3.2,40.1,32.4,13.3,4.7,1.8,1.6,-888888888.0,3392.0,-888888888.0,3563.5,46.9,15.35,10.2,6.7,20.5,-888888888.0,3328.0,-888888888.0,2247.5,-888888888.0,-888888888.0,2178.0,-888888888.0,25990.5,-888888888.0,20238.5,4443.0,25990.5,25990.5,25990.5,-888888888.0,19690.5,99999.0
75%,133.0,99999.0,133.0,999.0,25655.0,-888888888.0,-888888888.0,65137.0,27090.75,28087.5,805.5,47.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,1457.25,59.0,13.3,13.6,10.2,25.4,694.0,65.57,82.7,16574.5,45553.0,51783.75,65741.75,15133.0,39845.25,10790.25,66915.25,67583.25,2821.0,54.4,69.6,3326.25,510.75,11.8,100.0,2821.0,18.8,94.2,2821.0,25.0,35.0,4.7,0.6,70.2,5.8,63590.25,67583.25,-888888888.0,-888888888.0,-888888888.0,53512.5,31035.25,27183.0,4510.25,71.8,9620.25,76.4,28393.5,-888888888.0,28847.5,28847.5,28847.5,25218.75,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,16912.0,-888888888.0,-888888888.0,-888888888.0,8136.25,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,65014.75,14928.25,39354.5,28969.25,26815.25,2233.5,70.0,43.12,34.8,52.2,10570.75,25.5,29.9,12.6,12.3,41.5,53.7,68.4,29.3,28.9,34.0,27.33,30456.75,-888888888.0,-888888888.0,30456.75,30456.75,30456.75,-888888888.0,30456.75,25218.75,-888888888.0,-888888888.0,25218.75,25218.75,25218.75,25218.75,0.7,3.3,25218.75,17793.0,-888888888.0,17793.0,10217.5,5.5,49.4,36.8,19.02,8.0,3.4,3.2,-888888888.0,7428.25,-888888888.0,10151.25,52.4,17.0,11.8,8.1,25.2,-888888888.0,7295.0,-888888888.0,6719.0,-888888888.0,-888888888.0,6543.0,-888888888.0,66702.25,-888888888.0,51696.75,11022.0,66702.25,66702.25,66702.25,-888888888.0,50299.0,99999.0
max,840.0,99999.0,840.0,999.0,3281845.0,-888888888.0,-888888888.0,9881693.0,3987136.0,4177105.0,121611.0,100.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,327780.0,100.0,100.0,100.0,100.0,100.0,74072.0,100.0,100.0,2732745.0,6712079.0,7757193.0,9988629.0,2292627.0,6496638.0,1199364.0,9938945.0,10057155.0,3474305.0,100.0,100.0,3585100.0,110795.0,100.0,100.0,3474305.0,100.0,100.0,3474253.0,100.0,100.0,100.0,100.0,100.0,83.3,9421033.0,10057155.0,-888888888.0,-888888888.0,-888888888.0,8036077.0,5169884.0,4113477.0,729679.0,100.0,1463051.0,100.0,4591360.0,-888888888.0,4709319.0,4709319.0,4709319.0,3281845.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,2196172.0,-888888888.0,-888888888.0,-888888888.0,1085673.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,-888888888.0,9988629.0,2292627.0,6496638.0,4920315.0,4485999.0,434316.0,100.0,100.0,100.0,100.0,1576323.0,75.9,100.0,65.7,100.0,87.0,100.0,100.0,78.9,78.9,100.0,78.1,3490118.0,-888888888.0,-888888888.0,3490118.0,3490118.0,3490118.0,-888888888.0,3490118.0,3281845.0,-888888888.0,-888888888.0,3281845.0,3281845.0,3281845.0,3281845.0,36.0,25.9,3281845.0,1499576.0,-888888888.0,1499576.0,1105414.0,40.5,100.0,65.2,50.1,33.7,21.7,57.7,-888888888.0,394162.0,-888888888.0,1098819.0,100.0,43.3,31.8,30.0,100.0,-888888888.0,388004.0,-888888888.0,1737285.0,-888888888.0,-888888888.0,1697033.0,-888888888.0,10057155.0,-888888888.0,7760370.0,1227202.0,10057155.0,10057155.0,10057155.0,-888888888.0,6123488.0,99999.0


In [267]:
var_dict[2016].loc[:,var_dict[2016].min()==-666666666.0].describe()

Unnamed: 0,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0050PE,DP02_0051PE,DP02_0094PE,DP02_0095PE,DP02_0098PE,DP02_0099PE,DP02_0101PE,DP02_0102PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP03_0015PE,DP03_0017PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE
count,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0,3220.0
mean,-3819174.82,-3819213.12,-3819212.64,-3819215.61,-3819203.72,-10821073.59,-10821061.09,-2758285.0,-2758271.47,-15913422.86,-15913341.37,-2758313.92,-2758242.54,-2758310.23,-2758303.93,-2758324.15,-2758326.93,-2758280.48,-2758322.85,-414013.9,-206968.87,-2070334.9,-2070359.0,-2070366.53,-2070352.16,-207018.71,-1449252.35,-414068.6,-2277423.34,-207004.74,-414033.73,-17391252.31,-207015.63,-207016.03,-414051.52,-207017.38,-207035.16,-207001.46,-207007.95,-207024.86,-207033.2,-207036.54,-207036.23,-206992.9,-207024.29,-207029.23,-207032.51,-207017.78
std,50322647.21,50322644.3,50322644.33,50322644.11,50322645.01,84257062.09,84257063.7,42800236.41,42800237.28,101779240.8,101779253.55,42800234.54,42800239.14,42800234.78,42800235.19,42800233.88,42800233.7,42800236.7,42800233.97,16612246.86,11748457.51,37099911.25,37099909.91,37099909.49,37099910.29,11748456.63,31054512.37,16612245.5,38904650.98,11748456.88,16612246.37,106279137.47,11748456.69,11748456.68,16612245.93,11748456.66,11748456.34,11748456.94,11748456.82,11748456.52,11748456.38,11748456.32,11748456.32,11748457.09,11748456.53,11748456.45,11748456.39,11748456.65
min,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0,-666666666.0
25%,37.9,4.7,5.3,3.1,11.9,54.6,64.8,30.1,45.4,0.0,87.5,5.7,81.0,6.4,9.33,0.0,0.0,24.5,0.2,58.5,65.5,47.7,24.0,17.2,29.8,13.5,13.3,5.2,2.0,26.98,35.5,36.7,15.6,15.1,17.5,13.9,1.7,27.0,27.1,9.3,2.7,0.7,0.6,40.6,13.3,8.5,5.5,16.8
50%,47.65,8.5,9.0,6.3,18.2,60.15,73.7,42.1,57.9,4.0,95.2,11.5,88.4,14.2,21.0,1.4,0.0,46.4,2.3,65.7,71.2,59.55,33.7,25.1,40.3,19.1,20.9,8.4,6.1,34.2,44.7,51.9,22.2,21.8,25.5,20.3,3.2,40.1,32.4,13.3,4.7,1.8,1.6,46.9,15.35,10.2,6.7,20.5
75%,59.0,13.3,13.6,10.2,25.4,65.57,82.7,54.4,69.6,11.8,100.0,18.8,94.2,25.0,35.0,4.7,0.6,70.2,5.8,71.8,76.4,70.0,43.12,34.8,52.2,25.5,29.9,12.6,12.3,41.5,53.7,68.4,29.3,28.9,34.0,27.33,5.5,49.4,36.8,19.02,8.0,3.4,3.2,52.4,17.0,11.8,8.1,25.2
max,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,83.3,100.0,100.0,100.0,100.0,100.0,100.0,75.9,100.0,65.7,100.0,87.0,100.0,100.0,78.9,78.9,100.0,78.1,40.5,100.0,65.2,50.1,33.7,21.7,57.7,100.0,43.3,31.8,30.0,100.0


In [319]:
var_dict[2016] = var_dict[2016].applymap(lambda x: np.nan if x==-666666666 or x==-888888888 or x==-999999999 else x)

In [316]:
var_dict[2016].isnull().sum()

AIANHH         3142
state             0
county            0
AIHHTLI        3142
AITSCE         3142
ANRC           3142
CBSA              0
CD115          3142
CNECTA         3142
CONCIT         3142
COUNTY            0
COUSUB         3142
CSA               0
DIVISION          0
DP02_0001PE       0
DP02_0002PE       0
DP02_0003PE       0
DP02_0004PE       0
DP02_0005PE       0
DP02_0006PE       0
DP02_0007PE       0
DP02_0008PE       0
DP02_0009PE       0
DP02_0010PE       0
DP02_0011PE       0
DP02_0012PE       0
DP02_0013PE       0
DP02_0014PE       0
DP02_0015PE    3142
DP02_0016PE    3142
               ... 
DP05_0079PE       0
DP05_0080PE       0
DP05_0081PE    3142
DP05_0082PE       0
DP05_0083PE       0
DP05_0084PE       0
GEOCOMP           0
GEOVARIANT        0
GEO_ID         3142
LSAD_NAME      3142
METDIV            0
NAME           3142
NECTA          3142
NECTADIV       3142
PLACE          3142
PUMA5          3142
REGION            0
SDELM          3142
SDSEC          3142


In [317]:
var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index

Index(['DP02_0036PE', 'DP02_0037PE', 'DP02_0044PE', 'DP02_0045PE',
       'DP02_0046PE', 'DP02_0047PE', 'DP02_0048PE', 'DP02_0050PE',
       'DP02_0051PE', 'DP02_0094PE', 'DP02_0095PE', 'DP02_0098PE',
       'DP02_0099PE', 'DP02_0101PE', 'DP02_0102PE', 'DP02_0104PE',
       'DP02_0105PE', 'DP02_0106PE', 'DP02_0107PE', 'DP02_0108PE',
       'DP02_0109PE', 'DP03_0015PE', 'DP03_0017PE', 'DP03_0069PE',
       'DP03_0071PE', 'DP03_0073PE', 'DP03_0110PE', 'DP03_0111PE',
       'DP03_0112PE', 'DP03_0113PE', 'DP03_0120PE', 'DP03_0121PE',
       'DP03_0123PE', 'DP03_0124PE', 'DP03_0125PE', 'DP03_0126PE',
       'DP03_0127PE', 'DP03_0129PE', 'DP03_0130PE', 'DP03_0131PE',
       'DP03_0132PE', 'DP04_0075PE', 'DP04_0094PE', 'DP04_0095PE',
       'DP04_0096PE', 'DP04_0097PE', 'DP04_0098PE', 'DP04_0099PE',
       'DP04_0100PE', 'DP04_0111PE', 'DP04_0112PE', 'DP04_0113PE',
       'DP04_0114PE', 'DP04_0115PE'],
      dtype='object')

In [416]:
df = var_dict[2016].drop(columns=var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index)

In [417]:
df = df.loc[:, df.columns.str.contains(r"DP0")].dropna(axis=1)

In [419]:
df_target = var_dict[2016].loc[:, var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index]

In [420]:
df_target.head()

Unnamed: 0,DP02_0036PE,DP02_0037PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0050PE,DP02_0051PE,DP02_0094PE,DP02_0095PE,DP02_0098PE,DP02_0099PE,DP02_0101PE,DP02_0102PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP03_0015PE,DP03_0017PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0075PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE
0,443.0,43.1,80.0,22.0,8.1,15.4,34.5,69.1,66.8,21.3,78.7,4.8,95.2,29.0,71.0,7.5,34.0,3.6,0.0,54.9,0.0,72.8,62.5,58.3,27.7,31.4,41.7,31.5,27.3,15.2,12.0,40.0,53.1,40.8,36.5,35.9,35.8,35.9,2.4,7.7,57.5,21.2,6.6,3.9,0.3,2.8,55.1,16.0,4.9,5.6,18.5
1,260.0,40.0,34.8,8.1,7.1,1.0,18.7,58.3,77.8,26.5,73.5,9.9,90.1,5.6,94.4,11.6,2.6,0.9,0.0,83.3,1.6,55.1,69.0,47.2,20.9,27.8,52.8,28.7,35.9,18.4,16.8,38.9,51.6,85.5,33.6,32.9,31.6,33.4,2.2,6.1,56.4,28.5,6.9,1.0,0.6,0.5,46.2,10.2,7.5,11.8,24.3
2,1219.0,37.0,57.9,19.3,16.2,7.5,15.0,61.6,64.8,28.6,71.4,0.0,100.0,27.2,72.8,6.0,28.5,5.4,2.1,53.3,4.7,74.8,69.6,57.4,24.9,34.7,42.6,21.2,29.2,8.5,11.8,35.3,45.0,59.1,27.6,27.4,33.8,25.0,2.7,3.4,46.1,27.5,13.4,5.3,2.2,2.2,59.2,14.8,8.5,4.9,12.6
3,740.0,41.4,65.4,9.0,7.0,15.2,34.3,58.0,70.9,39.5,60.5,0.0,100.0,12.3,87.7,6.0,25.4,1.2,0.0,63.9,3.5,61.0,63.3,46.8,33.4,16.1,53.2,23.6,20.6,14.5,10.0,38.3,49.0,46.7,27.3,27.1,24.6,27.9,2.9,4.8,51.8,31.3,7.8,2.5,0.5,1.3,48.0,15.2,10.6,5.8,20.4
4,1050.0,60.5,56.3,9.9,9.7,6.0,30.8,64.1,73.1,29.6,70.4,0.0,100.0,11.4,88.6,13.5,33.8,3.8,2.9,44.6,1.4,68.3,73.0,65.6,29.0,39.0,34.4,27.7,24.1,7.0,8.4,41.3,49.4,48.8,37.0,36.9,45.0,33.8,3.5,2.4,45.7,33.9,12.2,3.5,1.9,0.4,50.8,16.7,8.2,5.1,19.2


In [348]:
# impute_var_df_list = []
# test_scores = []
# for i, col in enumerate(var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index):

#     rfr_impute = RandomForestRegressor()
#     df_temp = df.loc[df_target.iloc[:, i].notnull()]
#     df_target_temp = df_target.iloc[:, i].dropna()

#     X_train, X_test, y_train, y_test = train_test_split(df_temp, df_target_temp)
#     rfr_impute.fit(X_train, y_train)
#     print(col)
#     print("train score: ", rfr_impute.score(X_train, y_train))
#     print("test score: ", rfr_impute.score(X_test, y_test))
#     test_scores.append(rfr_impute.score(X_test, y_test))

#     impute_var_df_list.append(pd.DataFrame(rfr_impute.predict(df), columns=[col]))
# print("average test score: ", np.mean(test_scores))



DP02_0036PE
train score:  0.9892120235383359
test score:  0.929599832357992




DP02_0037PE
train score:  0.8679578078567677
test score:  0.2788970889532306




DP02_0044PE
train score:  0.9118090034826889
test score:  0.5597612063331762




DP02_0045PE
train score:  0.796217977612543
test score:  -0.2503652532954741




DP02_0046PE
train score:  0.7994679201937716
test score:  -0.12339095084411822




DP02_0047PE
train score:  0.8061458986116573
test score:  -0.02753136399162703




DP02_0048PE
train score:  0.8348175160567604
test score:  0.04860290724410199




DP02_0050PE
train score:  0.8151530319077382
test score:  -0.08700580955709492




DP02_0051PE
train score:  0.8050129051270143
test score:  0.04784885689864737




DP02_0094PE
train score:  0.8566101546442543
test score:  0.30571451776713676




DP02_0095PE
train score:  0.8582089365245411
test score:  0.24562523545023976




DP02_0098PE
train score:  0.8003764016301235
test score:  -0.13181836231862154




DP02_0099PE
train score:  0.7929773858729612
test score:  -0.10659139477120383




DP02_0101PE
train score:  0.8455672398424682
test score:  0.0364321953676523




DP02_0102PE
train score:  0.8348227449561266
test score:  0.055609053229040306




DP02_0104PE
train score:  0.8821040152078434
test score:  0.3512886364939264




DP02_0105PE
train score:  0.9382694188117184
test score:  0.5676667252487977




DP02_0106PE
train score:  0.8538275007944398
test score:  0.21407177555642187




DP02_0107PE
train score:  0.847324179283385
test score:  0.2539145544321797




DP02_0108PE
train score:  0.9544993748371885
test score:  0.6660685522952932




DP02_0109PE
train score:  0.8517939440011525
test score:  0.13426828332311347




DP03_0015PE
train score:  0.8786928532892893
test score:  0.3200007419174298




DP03_0017PE
train score:  0.90742562483828
test score:  0.5164163676594076




DP03_0110PE
train score:  0.8895231173001787
test score:  0.3970249802047906




DP03_0111PE
train score:  0.8924888641963278
test score:  0.2769304383732304




DP03_0112PE
train score:  0.8833032300359827
test score:  0.2697223843886889




DP03_0113PE
train score:  0.8935256143942982
test score:  0.3910682797198558




DP03_0120PE
train score:  0.984808101290215
test score:  0.9238788627614226




DP03_0121PE
train score:  0.8946328256909608
test score:  0.4221980527692446




DP03_0123PE
train score:  0.9600623104344882
test score:  0.7933272640692216




DP03_0124PE
train score:  0.8457268181237878
test score:  -0.03191638642482375




DP03_0125PE
train score:  0.9260330303844267
test score:  0.6389795924905926




DP03_0126PE
train score:  0.9122200471756983
test score:  0.48575306921564154




DP03_0127PE
train score:  0.8367247065996946
test score:  0.060815590400828845




DP03_0129PE
train score:  0.9890739719625966
test score:  0.9216166521118133




DP03_0130PE
train score:  0.9884976391156259
test score:  0.9429854950646369




DP03_0131PE
train score:  0.9457491282322562
test score:  0.6636347782150278




DP03_0132PE
train score:  0.9811745266264107
test score:  0.8841375758065986




DP04_0075PE
train score:  0.840286116914577
test score:  0.14283408016344




DP04_0094PE
train score:  0.9046615147409748
test score:  0.4595410455652911




DP04_0095PE
train score:  0.9762246672027061
test score:  0.8218585676039328




DP04_0096PE
train score:  0.9171006479877015
test score:  0.558973839767746




DP04_0097PE
train score:  0.9538677583293582
test score:  0.7364382079701266




DP04_0098PE
train score:  0.959573166610552
test score:  0.7429840842269166




DP04_0099PE
train score:  0.9661592670996314
test score:  0.8190403178357137




DP04_0100PE
train score:  0.9761896018277278
test score:  0.898741136786898




DP04_0111PE
train score:  0.9132640284279313
test score:  0.5762774980308427




DP04_0112PE
train score:  0.8347091091341831
test score:  0.07600223605642031




DP04_0113PE
train score:  0.8330661844818806
test score:  0.0721928003921346




DP04_0114PE
train score:  0.8332315900752556
test score:  -0.08565983799232035




DP04_0115PE
train score:  0.9041246970478312
test score:  0.5551166966749481
average test score:  0.3768545234901668


In [350]:
# impute_var_df_list = []
# test_scores = []
# for i, col in enumerate(var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index):

#     dtr_impute = DecisionTreeRegressor()
#     df_temp = df.loc[df_target.iloc[:, i].notnull()]
#     df_target_temp = df_target.iloc[:, i].dropna()

#     X_train, X_test, y_train, y_test = train_test_split(df_temp, df_target_temp)
#     dtr_impute.fit(X_train, y_train)
#     print(col)
#     print("train score: ", dtr_impute.score(X_train, y_train))
#     print("test score: ", dtr_impute.score(X_test, y_test))
#     test_scores.append(dtr_impute.score(X_test, y_test))

#     impute_var_df_list.append(pd.DataFrame(dtr_impute.predict(df), columns=[col]))
# print("average test score: ", np.mean(test_scores))

DP02_0036PE
train score:  1.0
test score:  0.620860263845814
DP02_0037PE
train score:  1.0
test score:  -0.3540257144132797
DP02_0044PE
train score:  1.0
test score:  0.17033203787838214
DP02_0045PE
train score:  1.0
test score:  -0.8235330991911103
DP02_0046PE
train score:  1.0
test score:  -0.8128000559236255
DP02_0047PE
train score:  1.0
test score:  -1.2490716814797262
DP02_0048PE
train score:  1.0
test score:  -0.6965747676040361
DP02_0050PE
train score:  1.0
test score:  -0.7380968673690884
DP02_0051PE
train score:  1.0
test score:  -0.805238008460309
DP02_0094PE
train score:  1.0
test score:  -0.3963149702045534
DP02_0095PE
train score:  1.0
test score:  -0.46272844499213694
DP02_0098PE
train score:  1.0
test score:  -1.2841930632322947
DP02_0099PE
train score:  1.0
test score:  -0.9897324322531109
DP02_0101PE
train score:  1.0
test score:  -0.6068613179220745
DP02_0102PE
train score:  1.0
test score:  -0.6923012171528158
DP02_0104PE
train score:  1.0
test score:  -0.15238377988

In [352]:
# impute_var_df_list = []
# test_scores = []
# for i, col in enumerate(var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index):

#     svr_impute = SVR()
#     df_temp = df.loc[df_target.iloc[:, i].notnull()]
#     df_target_temp = df_target.iloc[:, i].dropna()

#     X_train, X_test, y_train, y_test = train_test_split(df_temp, df_target_temp)
#     svr_impute.fit(X_train, y_train)
#     print(col)
#     print("train score: ", svr_impute.score(X_train, y_train))
#     print("test score: ", svr_impute.score(X_test, y_test))
#     test_scores.append(svr_impute.score(X_test, y_test))

#     impute_var_df_list.append(pd.DataFrame(svr_impute.predict(df), columns=[col]))
# print("average test score: ", np.mean(test_scores))



DP02_0036PE
train score:  -0.04717958697972736
test score:  -0.1146169887781674




DP02_0037PE
train score:  0.07697499178692202
test score:  -0.00249361585518737




DP02_0044PE
train score:  0.08381483833241754
test score:  -0.00988926523144995




DP02_0045PE
train score:  0.07963489945932178
test score:  -0.025475094248408547




DP02_0046PE
train score:  0.08223047308646737
test score:  -0.024203046925820093




DP02_0047PE
train score:  0.11304429592657272
test score:  -0.05110770904606499




DP02_0048PE
train score:  0.09176283777844041
test score:  -0.028771560252161654




DP02_0050PE
train score:  0.1252381933118164
test score:  -0.00021780567381202154




DP02_0051PE
train score:  0.08227043611999829
test score:  -0.00243882939731499




DP02_0094PE
train score:  0.0795650537222663
test score:  -2.545387616859074e-05




DP02_0095PE
train score:  0.07985765543990875
test score:  -0.0011286567642558865




DP02_0098PE
train score:  0.002524782747307719
test score:  -0.10138336124845848




DP02_0099PE
train score:  -0.007281557987974584
test score:  -0.11994676321421949




DP02_0101PE
train score:  0.059663419833955296
test score:  -0.043101037699677214




DP02_0102PE
train score:  0.0553888994134204
test score:  -0.06843208769262388




DP02_0104PE
train score:  0.0400752437061902
test score:  -0.043489544235080675




DP02_0105PE
train score:  0.05246659883422
test score:  -0.025966492223015836




DP02_0106PE
train score:  0.012041935886730968
test score:  -0.08443411889359953




DP02_0107PE
train score:  0.058045318571238846
test score:  -0.02353241001410633




DP02_0108PE
train score:  0.05826377077636191
test score:  -0.0057360714929381995




DP02_0109PE
train score:  0.010928702937641144
test score:  -0.10250229536347644




DP03_0015PE
train score:  0.13250833404931928
test score:  -0.00032642264140037014




DP03_0017PE
train score:  0.15760197239717533
test score:  -0.015145608204041983




DP03_0110PE
train score:  0.08687399382845651
test score:  -0.01601930210943614




DP03_0111PE
train score:  0.09493124280527565
test score:  -0.005761769960197061




DP03_0112PE
train score:  0.10774189558985203
test score:  -0.012763884998726605




DP03_0113PE
train score:  0.08808351000809478
test score:  -0.003972573008758973




DP03_0120PE
train score:  0.1512928193674309
test score:  -0.02305879087164575




DP03_0121PE
train score:  0.09376312092176275
test score:  -0.016378111721226496




DP03_0123PE
train score:  0.19523641728399066
test score:  -0.07722948361317461




DP03_0124PE
train score:  0.04424328675316225
test score:  -0.0911889467514182




DP03_0125PE
train score:  0.12393641218666851
test score:  -0.0033063400518866803




DP03_0126PE
train score:  0.09820531298933077
test score:  -0.00250656456562548




DP03_0127PE
train score:  0.0614441141369394
test score:  -0.0003940014255430224




DP03_0129PE
train score:  0.13291948424780398
test score:  -0.013132133488044317




DP03_0130PE
train score:  0.13245139134037265
test score:  -0.0028426611822995884




DP03_0131PE
train score:  0.10570011392349876
test score:  -0.021919231241817938




DP03_0132PE
train score:  0.13538794652398756
test score:  -0.004700071199541966




DP04_0075PE
train score:  0.3693910452104747
test score:  -0.013563249269118227




DP04_0094PE
train score:  0.27759043808510053
test score:  -0.060613285097230296




DP04_0095PE
train score:  0.07621640387408168
test score:  -0.05588947095835728




DP04_0096PE
train score:  0.16956990304195152
test score:  -0.03409464525626449




DP04_0097PE
train score:  0.18514206539822806
test score:  -0.024093175147057888




DP04_0098PE
train score:  0.17300950832301576
test score:  -0.0633525149794485




DP04_0099PE
train score:  0.21489502333312216
test score:  -0.09542618650696433




DP04_0100PE
train score:  0.05857190285111425
test score:  -0.06566235898379791




DP04_0111PE
train score:  0.16295863170249103
test score:  -0.0048592962454345745




DP04_0112PE
train score:  0.3297337532800506
test score:  -0.011380247081876682




DP04_0113PE
train score:  0.4109070524588957
test score:  -0.00226239072849177




DP04_0114PE
train score:  0.42050599380409526
test score:  -0.0014201102720277081




DP04_0115PE
train score:  0.1969249039558305
test score:  -0.03462344758590197
average test score:  -0.03248585261319146


In [421]:
impute_var_df_list = []
test_scores = []
for i, col in enumerate(var_dict[2016].loc[0, ((var_dict[2016].isnull().sum()>0)&(var_dict[2016].isnull().sum()!=3142))].index):

    xgr_impute = XGBRegressor()
    df_temp = df.loc[df_target.iloc[:, i].notnull()]
    df_target_temp = df_target.iloc[:, i].dropna()

    X_train, X_test, y_train, y_test = train_test_split(df_temp, df_target_temp)
    xgr_impute.fit(X_train, y_train)
    print(col)
    print("train score: ", xgr_impute.score(X_train, y_train))
    print("test score: ", xgr_impute.score(X_test, y_test))
    test_scores.append(xgr_impute.score(X_test, y_test))

    impute_var_df_list.append(pd.DataFrame(xgr_impute.predict(df), columns=[col]))
print("average test score: ", np.mean(test_scores))

  if getattr(data, 'base', None) is not None and \


DP02_0036PE
train score:  0.9985899172637263
test score:  0.8950040261999618


  if getattr(data, 'base', None) is not None and \


DP02_0037PE
train score:  0.6873424490076532
test score:  0.3167814220934839


  if getattr(data, 'base', None) is not None and \


DP02_0044PE
train score:  0.8840984022239405
test score:  0.7236340052054314


  if getattr(data, 'base', None) is not None and \


DP02_0045PE
train score:  0.5756757545757967
test score:  0.02907107263999753


  if getattr(data, 'base', None) is not None and \


DP02_0046PE
train score:  0.5896905589669583
test score:  0.034352214057969066


  if getattr(data, 'base', None) is not None and \


DP02_0047PE
train score:  0.6005091434357656
test score:  0.0004330315692671061


  if getattr(data, 'base', None) is not None and \


DP02_0048PE
train score:  0.6569173394765049
test score:  0.10089712495494484


  if getattr(data, 'base', None) is not None and \


DP02_0050PE
train score:  0.5619256927535552
test score:  -0.04378946234527148


  if getattr(data, 'base', None) is not None and \


DP02_0051PE
train score:  0.5687737165476571
test score:  0.07730171917350193


  if getattr(data, 'base', None) is not None and \


DP02_0094PE
train score:  0.6683082479830129
test score:  0.2961450185814005


  if getattr(data, 'base', None) is not None and \


DP02_0095PE
train score:  0.6771456984270634
test score:  0.26962072591778563


  if getattr(data, 'base', None) is not None and \


DP02_0098PE
train score:  0.5748360666710173
test score:  -0.013608539222137672


  if getattr(data, 'base', None) is not None and \


DP02_0099PE
train score:  0.565859751157207
test score:  0.03546489863728264


  if getattr(data, 'base', None) is not None and \


DP02_0101PE
train score:  0.6713752336034631
test score:  0.1560202670410462


  if getattr(data, 'base', None) is not None and \


DP02_0102PE
train score:  0.6648432516227015
test score:  0.13364129151972837


  if getattr(data, 'base', None) is not None and \


DP02_0104PE
train score:  0.7824568641248382
test score:  0.3747461367023218


  if getattr(data, 'base', None) is not None and \


DP02_0105PE
train score:  0.8553830794495124
test score:  0.6366427252826503


  if getattr(data, 'base', None) is not None and \


DP02_0106PE
train score:  0.810026738110205
test score:  0.19961743067124327


  if getattr(data, 'base', None) is not None and \


DP02_0107PE
train score:  0.8697075886360566
test score:  -0.07676147101122055


  if getattr(data, 'base', None) is not None and \


DP02_0108PE
train score:  0.8998611081863945
test score:  0.76465489691253


  if getattr(data, 'base', None) is not None and \


DP02_0109PE
train score:  0.7577635816854817
test score:  0.18012646409156896


  if getattr(data, 'base', None) is not None and \


DP03_0015PE
train score:  0.7240280367174267
test score:  0.41766991514516827


  if getattr(data, 'base', None) is not None and \


DP03_0017PE
train score:  0.8017402742057091
test score:  0.5541562150090729


  if getattr(data, 'base', None) is not None and \


DP03_0110PE
train score:  0.7740284753810414
test score:  0.4765377855982387


  if getattr(data, 'base', None) is not None and \


DP03_0111PE
train score:  0.7732624967564499
test score:  0.41256643056793346


  if getattr(data, 'base', None) is not None and \


DP03_0112PE
train score:  0.7169160220606956
test score:  0.318165108802815


  if getattr(data, 'base', None) is not None and \


DP03_0113PE
train score:  0.7672283542081136
test score:  0.39420666899076584


  if getattr(data, 'base', None) is not None and \


DP03_0120PE
train score:  0.9740445507037174
test score:  0.9428772779233929


  if getattr(data, 'base', None) is not None and \


DP03_0121PE
train score:  0.7583992216951343
test score:  0.4831517871720825


  if getattr(data, 'base', None) is not None and \


DP03_0123PE
train score:  0.9252619601823829
test score:  0.791165658034232


  if getattr(data, 'base', None) is not None and \


DP03_0124PE
train score:  0.696518839030041
test score:  0.17704737233883816


  if getattr(data, 'base', None) is not None and \


DP03_0125PE
train score:  0.8774733040589991
test score:  0.6938505905075709


  if getattr(data, 'base', None) is not None and \


DP03_0126PE
train score:  0.8286387902683093
test score:  0.5733674776810511


  if getattr(data, 'base', None) is not None and \


DP03_0127PE
train score:  0.5915281210136558
test score:  0.1236246959184697


  if getattr(data, 'base', None) is not None and \


DP03_0129PE
train score:  0.9750273442750823
test score:  0.9448144532882993


  if getattr(data, 'base', None) is not None and \


DP03_0130PE
train score:  0.9765800239622454
test score:  0.9507196010633373


  if getattr(data, 'base', None) is not None and \


DP03_0131PE
train score:  0.878806492724189
test score:  0.6995700004767083


  if getattr(data, 'base', None) is not None and \


DP03_0132PE
train score:  0.9558926754866058
test score:  0.9100941897701622


  if getattr(data, 'base', None) is not None and \


DP04_0075PE
train score:  0.7010446180180456
test score:  0.15061567259044228


  if getattr(data, 'base', None) is not None and \


DP04_0094PE
train score:  0.8434648373649504
test score:  0.5345763567582111


  if getattr(data, 'base', None) is not None and \


DP04_0095PE
train score:  0.9505454498300455
test score:  0.8601419869521528


  if getattr(data, 'base', None) is not None and \


DP04_0096PE
train score:  0.8076348668464746
test score:  0.5984821829750653


  if getattr(data, 'base', None) is not None and \


DP04_0097PE
train score:  0.8997333657158292
test score:  0.7760959631694465


  if getattr(data, 'base', None) is not None and \


DP04_0098PE
train score:  0.9240361359042278
test score:  0.8242580020101621


  if getattr(data, 'base', None) is not None and \


DP04_0099PE
train score:  0.9277408243644975
test score:  0.8483540544338862


  if getattr(data, 'base', None) is not None and \


DP04_0100PE
train score:  0.975920881736547
test score:  0.8977509738843802


  if getattr(data, 'base', None) is not None and \


DP04_0111PE
train score:  0.8442229836424977
test score:  0.6739414551093841


  if getattr(data, 'base', None) is not None and \


DP04_0112PE
train score:  0.6367840945037604
test score:  0.1510275895689237


  if getattr(data, 'base', None) is not None and \


DP04_0113PE
train score:  0.6272027601737549
test score:  0.08473385775812514


  if getattr(data, 'base', None) is not None and \


DP04_0114PE
train score:  0.6369474632810372
test score:  0.1123555202039973


  if getattr(data, 'base', None) is not None and \


DP04_0115PE
train score:  0.8406738353677731
test score:  0.5407470785931667
average test score:  0.43150315531311706


In [422]:
df_impute = reduce(lambda left, right: pd.merge(left, right, left_index=True, right_index=True), impute_var_df_list)

In [423]:
df_impute.describe()

Unnamed: 0,DP02_0036PE,DP02_0037PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0050PE,DP02_0051PE,DP02_0094PE,DP02_0095PE,DP02_0098PE,DP02_0099PE,DP02_0101PE,DP02_0102PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP03_0015PE,DP03_0017PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0075PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE
count,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0
mean,1248.67,36.55,48.66,10.37,10.78,7.93,19.84,60.44,72.71,43.43,56.72,7.98,91.72,14.23,85.81,17.97,24.17,3.95,1.03,47.72,5.27,65.0,70.75,57.91,35.08,25.78,42.12,19.74,22.15,9.34,8.64,33.95,44.25,52.98,22.81,22.37,26.2,21.1,2.88,3.9,37.43,31.67,14.7,6.22,2.85,3.17,46.96,15.11,10.05,6.76,21.12
std,3725.28,12.16,13.6,5.06,4.85,4.16,7.28,5.62,8.96,11.73,11.81,5.67,5.88,7.51,7.36,11.7,15.12,5.55,3.61,24.6,5.93,7.17,6.65,12.09,11.49,8.95,12.22,8.54,9.45,5.31,6.36,9.34,11.07,12.77,9.92,9.95,10.95,9.65,1.16,2.63,14.61,6.0,6.12,4.63,3.09,5.47,7.1,1.94,1.54,1.34,5.16
min,-43.01,-0.57,-4.86,-1.51,-2.27,-0.95,0.09,9.62,5.88,12.43,-1.21,-2.72,10.34,-0.85,6.63,-5.68,-4.56,-2.25,-0.45,-2.55,-2.25,21.83,21.48,5.86,0.75,-5.93,0.7,0.46,-0.6,-2.18,-1.44,-2.51,-1.21,0.42,0.87,0.54,-0.65,0.35,0.39,-0.36,2.69,1.61,0.88,0.26,-0.05,-0.3,8.18,0.26,0.43,0.48,1.45
25%,128.3,29.2,40.63,8.71,9.14,6.53,15.51,57.97,70.37,34.71,48.3,4.91,89.59,10.0,83.74,9.41,11.82,1.41,0.39,26.8,2.19,60.74,66.95,49.39,27.06,19.56,32.38,13.41,15.66,5.44,4.76,28.06,37.41,45.75,15.43,14.95,18.3,13.96,2.37,2.01,27.49,28.68,9.88,3.05,1.11,0.97,42.55,14.28,9.27,6.15,17.31
50%,296.02,36.0,48.76,9.87,10.33,7.76,19.24,59.89,73.7,43.55,56.47,7.31,92.42,12.58,87.34,16.38,22.75,2.63,0.59,45.92,3.75,65.68,71.09,57.87,33.96,24.48,42.31,19.02,21.35,8.38,7.35,34.07,44.78,54.09,22.12,21.68,25.53,20.19,2.74,3.47,40.47,32.59,13.23,4.55,1.74,1.51,47.28,15.32,10.06,6.65,20.34
75%,802.34,41.85,56.66,10.95,11.52,8.81,23.31,62.34,76.95,51.61,65.59,10.37,94.9,16.15,90.04,24.76,34.5,4.64,0.82,67.1,5.92,69.66,74.88,67.59,41.59,31.72,50.88,24.64,27.55,12.14,10.66,39.73,51.27,60.62,28.49,28.04,32.69,26.42,3.12,5.21,49.26,35.83,18.76,7.65,3.22,2.86,51.48,16.24,10.92,7.29,24.21
max,69142.97,97.55,98.8,93.25,86.64,94.28,91.02,97.97,102.82,101.19,95.75,91.99,102.42,89.44,100.72,95.71,91.5,88.54,95.72,106.21,67.23,95.35,95.78,97.78,93.62,80.93,96.32,70.3,90.79,37.8,92.18,71.64,92.87,95.74,66.0,67.26,91.2,64.1,22.09,36.51,96.58,52.69,35.28,31.26,19.94,55.55,96.13,37.86,22.26,26.53,47.13


In [401]:
for i in range(df_target.shape[0]):
    for j in range(df_target.shape[1]):
        if df_target.iloc[i, j]:
            pass
        else:
            print (i, j, df_impute.iloc[i, j])

0 18 0.3701587915420532
0 20 1.4133073091506958
1 18 0.7443952560424805
2 11 9.553938865661621
3 11 7.765506267547607
3 18 0.635379433631897
4 11 7.926748752593994
5 11 4.166656970977783
5 17 4.342953681945801
5 18 0.5773282647132874
5 20 3.0973005294799805
6 11 4.771521091461182
6 15 3.195215940475464
6 17 3.061688184738159
6 18 1.1876146793365479
6 20 1.8477822542190552
6 30 10.951211929321289
6 43 1.5731524229049683
6 45 0.9919759035110474
7 15 0.9721551537513733
7 18 0.0
7 20 0.10659855604171753
7 43 0.6378676295280457
7 44 0.5935386419296265
7 45 0.5166997313499451
8 18 0.40636152029037476
8 20 1.9676765203475952
10 5 7.1631999015808105
10 11 10.722609519958496
10 17 0.6520010828971863
10 20 4.570133686065674
10 33 50.05937194824219
10 44 0.5414832830429077
11 16 13.390957832336426
11 17 1.757449984550476
11 18 0.9278309345245361
11 45 0.6257994174957275
12 18 0.5485392212867737
13 18 0.8752049207687378
13 20 3.698108196258545
13 45 0.6334158182144165
14 17 0.8806463479995728
15 1

153 45 1.972055435180664
154 17 2.0010881423950195
155 4 4.327592849731445
155 5 4.39334774017334
155 11 7.06756591796875
155 17 2.071934461593628
155 18 1.0594490766525269
155 29 2.716822624206543
155 30 3.224801540374756
156 1 17.65973472595215
156 3 0.8007535934448242
156 4 24.221887588500977
156 11 5.118497848510742
156 17 1.293412208557129
156 20 2.9382426738739014
156 30 1.4634850025177002
157 11 2.372089147567749
157 45 0.9069743156433105
161 11 7.50291633605957
163 11 1.7125344276428223
163 18 0.5000321865081787
163 44 1.7266324758529663
164 5 6.355036735534668
173 11 5.115328311920166
173 17 3.1897213459014893
173 18 0.535378098487854
173 20 2.4560208320617676
174 11 3.2885007858276367
174 16 2.441336154937744
174 17 0.7882468700408936
174 18 0.3388378322124481
174 44 0.6064651608467102
174 45 0.7857908606529236
175 11 5.432147979736328
175 17 0.8787326812744141
177 11 6.12630033493042
178 11 3.1526641845703125
178 16 0.0
178 17 1.1438289880752563
178 18 0.2914641797542572
178

323 18 0.2671124339103699
330 18 0.46270498633384705
332 30 8.097962379455566
335 11 2.84592342376709
335 17 0.6756461262702942
335 18 1.059617280960083
335 33 21.439882278442383
336 1 26.33089256286621
336 3 0.5563058853149414
336 4 0.0
336 5 1.3268733024597168
336 8 6.719797134399414
336 18 0.8043961524963379
336 20 10.7062349319458
336 30 2.1336019039154053
342 11 6.720210075378418
342 33 39.11818313598633
356 3 4.7154717445373535
356 4 7.766202449798584
356 5 1.8715993165969849
356 13 3.2569491863250732
356 17 3.2140395641326904
356 18 0.7484955191612244
356 20 4.756424903869629
356 28 6.330774307250977
356 30 9.166027069091797
356 33 12.269742012023926
363 4 26.46792221069336
363 11 6.463300704956055
363 18 1.9141260385513306
370 18 0.355934202671051
372 11 5.80756139755249
372 18 0.9718196988105774
373 11 0.6007257103919983
373 13 6.050117492675781
373 16 1.9431555271148682
373 18 0.843431293964386
373 20 2.642008066177368
374 11 3.599982261657715
374 17 0.09539687633514404
374 2

481 17 0.06029650568962097
481 18 0.42328110337257385
482 11 6.769412517547607
482 17 1.2135796546936035
482 18 0.30897748470306396
482 20 2.0424575805664062
482 30 7.196173191070557
483 4 11.0316162109375
483 17 2.898869514465332
483 18 0.0
483 45 0.8635625839233398
491 18 0.4755377769470215
498 17 0.3158609867095947
506 3 9.105947494506836
506 17 2.565081834793091
506 18 0.43159282207489014
507 18 0.610703706741333
509 5 6.819922924041748
509 11 5.8227949142456055
509 18 0.37409693002700806
511 11 6.735607624053955
512 11 1.5825098752975464
512 17 0.5350787043571472
512 18 0.0
512 20 1.2078843116760254
513 11 3.5800185203552246
513 17 0.0
513 18 0.0
513 20 0.8274810910224915
513 44 0.6709588766098022
513 45 0.8578386306762695
514 4 10.67416763305664
514 5 7.938085556030273
514 11 7.20894718170166
514 18 0.3951874077320099
514 20 0.0
514 44 0.8885560035705566
515 3 5.71953821182251
515 4 7.6190948486328125
515 5 6.349696636199951
515 11 1.3740477561950684
515 13 4.51629638671875
515 1

646 45 0.6870599985122681
648 18 0.40534424781799316
650 4 9.262084007263184
650 11 8.062162399291992
650 17 2.416588306427002
650 18 0.6918632388114929
651 11 2.8825809955596924
651 17 2.6716458797454834
651 18 0.12139272689819336
651 20 4.555563449859619
651 30 3.1339566707611084
652 18 0.5243015289306641
653 3 6.149576187133789
653 5 6.531958103179932
653 11 3.3701207637786865
653 18 0.06611493229866028
653 20 0.0916614830493927
654 9 26.316478729248047
654 17 0.0
654 18 0.23460659384727478
654 19 18.37005043029785
654 20 2.1736135482788086
654 39 1.7753815650939941
655 3 7.4613423347473145
655 11 5.613948822021484
655 17 0.4747675359249115
655 18 0.4794993996620178
655 30 8.176323890686035
656 11 12.020530700683594
656 17 2.2464346885681152
656 18 0.4754548966884613
656 20 1.6687487363815308
657 11 7.1149187088012695
659 18 0.7256447076797485
660 17 5.03596830368042
660 20 2.6211981773376465
660 45 1.1161186695098877
661 17 3.5015501976013184
661 18 0.3351193070411682
662 18 0.6446

829 11 6.752666473388672
829 18 0.5347495079040527
829 20 2.635963201522827
829 44 0.527917742729187
830 28 5.574069499969482
830 30 3.1544687747955322
830 33 31.130809783935547
831 3 9.773118019104004
831 10 36.0622673034668
831 11 4.835348129272461
831 13 6.127026081085205
831 15 44.86534118652344
831 16 13.087821006774902
831 17 2.104111909866333
831 18 1.5152192115783691
831 20 5.205197811126709
832 3 8.068483352661133
832 9 47.106388092041016
832 11 5.545784950256348
832 13 6.494694709777832
832 16 25.161911010742188
832 17 0.0
832 18 0.9634456634521484
832 19 22.46753692626953
832 20 1.0179827213287354
832 44 0.15100419521331787
832 45 0.1918206512928009
833 3 12.636033058166504
833 4 8.67078971862793
833 11 4.107400417327881
833 18 0.6567941308021545
833 20 5.05955171585083
833 30 7.5841827392578125
834 11 3.231924295425415
834 13 10.57543659210205
834 17 1.4134477376937866
834 18 0.9446650743484497
835 11 6.9934468269348145
835 18 0.8511033058166504
835 20 3.194009304046631
836

952 17 3.261493444442749
952 18 0.9722796678543091
953 6 15.486404418945312
953 11 4.175880432128906
953 17 1.7565964460372925
953 18 0.4995187520980835
953 20 3.4638752937316895
953 44 1.0110589265823364
954 17 0.6804521083831787
954 18 1.4191105365753174
955 11 8.486990928649902
955 17 5.069599628448486
956 17 4.575828552246094
956 18 1.2611289024353027
958 3 3.732746124267578
958 5 5.985199928283691
958 6 13.8770751953125
958 11 3.125857353210449
958 16 3.1283645629882812
958 17 2.3905420303344727
958 18 0.35675665736198425
959 10 34.898494720458984
959 13 5.986456394195557
959 16 9.301712036132812
959 17 0.685468316078186
959 18 0.44380611181259155
959 20 5.27012825012207
959 44 0.6419172883033752
959 45 0.7113205194473267
960 17 4.277256488800049
960 18 0.6992295980453491
961 3 8.025980949401855
961 5 3.863145351409912
961 11 5.650869369506836
961 17 0.9102157354354858
961 18 0.5598224401473999
961 30 2.527134656906128
961 44 0.9089738130569458
961 45 0.6621897220611572
962 5 6.05

1070 16 4.12808895111084
1070 17 0.4663458466529846
1070 18 0.5338303446769714
1070 20 2.6194908618927
1071 4 8.74075984954834
1071 5 7.008869171142578
1071 10 47.71636199951172
1071 11 3.1575310230255127
1071 13 8.871590614318848
1071 15 20.077722549438477
1071 16 8.350198745727539
1071 18 1.953660488128662
1071 19 23.84827423095703
1071 20 7.291874885559082
1071 44 0.7496976256370544
1071 45 1.364419937133789
1073 18 0.6719700694084167
1074 3 8.116433143615723
1074 11 2.8148999214172363
1074 13 9.3863525390625
1074 17 0.9681535363197327
1074 18 0.3476962149143219
1074 45 0.737676739692688
1075 3 9.58816909790039
1075 11 3.239469289779663
1075 18 0.4295002222061157
1076 11 6.912017822265625
1076 18 0.6215741038322449
1076 20 4.828258037567139
1076 45 0.49751219153404236
1077 11 4.563599109649658
1077 18 0.5599079728126526
1077 20 2.798008441925049
1079 11 9.177631378173828
1079 17 2.4966959953308105
1079 20 3.9392995834350586
1080 18 0.6586172580718994
1080 20 2.0128445625305176
1080 

1229 5 7.3897705078125
1229 6 12.940409660339355
1229 11 4.361485481262207
1229 13 9.29861068725586
1229 16 8.037469863891602
1229 17 0.3728591501712799
1229 18 0.5417892336845398
1229 20 3.7889299392700195
1229 44 0.029840946197509766
1230 17 1.4714195728302002
1230 18 0.7361443042755127
1232 11 5.844307899475098
1232 17 1.058532476425171
1232 18 0.8670313954353333
1232 33 49.01737594604492
1233 11 4.5870680809021
1233 17 1.7031484842300415
1233 18 0.6115866899490356
1233 44 1.2163312435150146
1234 11 2.5768933296203613
1234 16 8.012001991271973
1234 17 1.2060964107513428
1234 18 2.163980007171631
1235 4 31.20712661743164
1235 5 2.742495536804199
1235 6 5.117956161499023
1235 11 3.2550721168518066
1235 17 0.8720576167106628
1235 18 0.7884753942489624
1235 29 4.117914199829102
1235 30 4.377678871154785
1235 45 1.937153935432434
1236 11 5.308799743652344
1236 17 2.4904415607452393
1236 33 45.709564208984375
1237 1 4.045525550842285
1237 9 18.948911666870117
1237 13 6.296751499176025
123

1442 11 8.125211715698242
1442 18 0.5454410314559937
1443 2 0.0
1443 3 5.364133834838867
1443 4 3.2217204570770264
1443 5 5.398900032043457
1443 6 4.9462385177612305
1443 11 5.517126560211182
1443 16 0.8259553909301758
1443 17 0.7247558832168579
1443 18 0.37676218152046204
1443 30 5.836909770965576
1445 18 1.0086649656295776
1446 18 0.9264285564422607
1447 30 2.246558427810669
1449 11 8.76168155670166
1451 18 1.4087727069854736
1452 11 5.526834487915039
1452 18 1.1595652103424072
1453 33 45.12921142578125
1454 5 7.200155735015869
1454 17 2.772656202316284
1457 17 1.4792529344558716
1457 18 0.5574246048927307
1458 3 6.74613618850708
1458 30 2.7118377685546875
1459 3 11.920886039733887
1459 18 0.7313759326934814
1461 11 8.731858253479004
1463 4 9.065630912780762
1463 5 6.275228977203369
1463 13 9.819713592529297
1463 17 1.739004135131836
1463 18 0.5431452989578247
1463 30 4.57199764251709
1465 11 5.454967975616455
1466 18 0.9333875775337219
1467 18 0.8891963362693787
1468 18 0.9863397479

1564 18 0.18173712491989136
1564 20 0.6708300113677979
1564 30 8.637874603271484
1564 45 1.0672292709350586
1566 11 7.020574569702148
1566 18 0.4286448359489441
1567 5 8.626940727233887
1567 17 1.7985097169876099
1567 18 0.4451202154159546
1567 19 32.26707077026367
1567 20 1.9284532070159912
1570 11 4.624041557312012
1570 17 1.018375277519226
1570 18 0.18246695399284363
1570 20 2.3003039360046387
1571 18 0.5245304107666016
1571 20 2.7595956325531006
1572 11 4.665367126464844
1572 13 11.125896453857422
1572 17 3.1537349224090576
1572 18 0.4767815172672272
1573 5 8.377381324768066
1573 11 7.226446151733398
1573 17 3.6490039825439453
1573 18 0.7868753671646118
1573 19 15.892701148986816
1573 20 2.0920448303222656
1573 30 7.221642971038818
1573 44 0.8539273142814636
1573 45 0.6994501352310181
1574 11 5.558056831359863
1574 13 11.276532173156738
1574 18 0.684522271156311
1574 20 3.5815610885620117
1575 11 4.470649242401123
1575 18 0.4496798813343048
1575 20 3.242802619934082
1575 30 10.6316

1678 11 2.049438238143921
1678 17 0.43400654196739197
1678 18 0.952829122543335
1678 20 1.7600164413452148
1678 30 4.752553462982178
1678 44 0.9407512545585632
1678 45 1.2607046365737915
1679 17 0.5515986084938049
1679 18 0.5285612940788269
1679 20 1.8118654489517212
1680 5 8.495357513427734
1682 4 6.262299060821533
1682 5 2.9700801372528076
1682 6 6.921586990356445
1682 11 7.382165908813477
1682 16 1.4575345516204834
1682 17 0.2919940948486328
1682 18 1.2027949094772339
1682 20 3.6246860027313232
1682 24 15.325562477111816
1682 30 0.949406623840332
1682 42 4.666662693023682
1682 44 0.8509098291397095
1682 45 1.11741304397583
1683 4 9.023948669433594
1683 5 4.633869647979736
1683 6 9.34271240234375
1683 11 2.6199564933776855
1683 13 10.262761116027832
1683 18 0.9958593249320984
1683 20 2.100339412689209
1683 30 4.5531840324401855
1684 3 17.538192749023438
1684 5 5.7758708000183105
1684 11 0.0
1684 13 8.027566909790039
1684 18 0.3614894151687622
1685 11 0.9010282158851624
1685 18 0.2280

1771 30 3.7240540981292725
1771 44 3.364004373550415
1772 17 1.23689603805542
1772 18 0.4864991307258606
1772 30 4.215598106384277
1773 3 4.022968292236328
1773 6 26.528352737426758
1773 11 6.055176734924316
1773 13 13.72961139678955
1773 17 7.8818793296813965
1773 18 0.15544283390045166
1773 25 31.941926956176758
1773 28 12.21219539642334
1773 30 4.212217807769775
1773 33 37.1712532043457
1774 11 5.083601951599121
1774 17 7.8739447593688965
1774 18 2.8678154945373535
1775 11 5.092334270477295
1775 17 2.8667616844177246
1775 18 0.7196027040481567
1775 30 2.688671112060547
1776 17 1.5807058811187744
1776 18 0.6093664765357971
1776 25 10.67949390411377
1776 30 1.943686842918396
1777 18 0.6099966168403625
1778 18 1.8124940395355225
1779 11 2.641343593597412
1779 16 9.424714088439941
1779 17 3.4565091133117676
1779 18 0.03269806504249573
1779 25 7.934157371520996
1779 33 53.877540588378906
1779 45 0.5316246747970581
1780 1 6.560548782348633
1780 2 0.8847936987876892
1780 3 17.9068374633789

1883 44 0.6787713766098022
1883 45 0.6192731261253357
1884 3 6.779037952423096
1884 30 3.528522491455078
1884 45 1.2298848628997803
1885 11 6.565615177154541
1886 18 0.4639039933681488
1886 30 16.211257934570312
1887 3 7.866786003112793
1887 5 4.229424476623535
1887 11 0.8950790166854858
1887 17 0.7652043104171753
1887 18 0.5223528742790222
1887 43 2.8304436206817627
1887 44 0.9110606908798218
1890 18 0.6881505250930786
1893 18 0.6462628841400146
1895 18 0.6585156917572021
1900 11 9.043478012084961
1900 18 0.7588651180267334
1906 18 0.7696936726570129
1907 18 0.934770405292511
1909 3 7.547570705413818
1909 18 0.6808651089668274
1917 18 0.5091336369514465
1925 18 0.894673764705658
1936 11 6.420931816101074
1936 18 0.8578793406486511
1937 18 0.9909144639968872
1938 11 7.533904075622559
1938 18 0.4747706651687622
1945 18 1.183119773864746
1949 11 7.5519280433654785
1949 18 0.6073326468467712
1949 30 6.22399377822876
1950 11 10.953845024108887
1950 18 0.5007885098457336
1952 11 6.342258453

2158 1 9.074957847595215
2158 4 10.169054985046387
2158 6 20.947471618652344
2158 11 0.29671064019203186
2158 13 4.653339862823486
2158 18 1.696505069732666
2158 20 0.1958998441696167
2158 25 22.378286361694336
2158 26 12.775941848754883
2158 30 1.8084465265274048
2158 39 1.7815359830856323
2159 18 0.2815087139606476
2159 20 1.8024715185165405
2159 30 6.01555061340332
2160 11 5.236889362335205
2160 30 4.583788871765137
2161 5 8.757369995117188
2161 17 0.0
2161 18 0.04520976543426514
2161 20 0.32757681608200073
2161 23 11.813569068908691
2161 24 9.058874130249023
2161 25 14.027745246887207
2161 28 33.12187957763672
2161 30 11.306842803955078
2161 42 9.166959762573242
2161 44 0.5029750466346741
2161 45 0.369772344827652
2162 4 9.493644714355469
2162 5 7.358465671539307
2162 11 6.3839287757873535
2162 17 0.23281288146972656
2162 18 0.6848127245903015
2163 17 1.8410067558288574
2164 4 9.910297393798828
2164 11 3.4216599464416504
2164 13 6.968553066253662
2164 16 3.802978515625
2164 17 0.28

2351 4 9.730552673339844
2351 11 5.756471157073975
2351 17 0.4033704698085785
2351 18 0.7201114296913147
2351 44 1.2028224468231201
2351 45 1.6939644813537598
2357 11 6.706776142120361
2357 17 0.0
2360 5 4.394518852233887
2360 11 2.8440325260162354
2360 16 1.4500138759613037
2360 30 6.234748840332031
2360 44 1.0826536417007446
2360 45 1.1390254497528076
2361 11 5.611150741577148
2361 18 2.2384870052337646
2362 17 2.577237606048584
2362 18 0.512377142906189
2364 11 2.8629846572875977
2364 13 8.372398376464844
2364 18 2.6689958572387695
2365 5 6.791818618774414
2367 1 6.35250186920166
2367 3 16.54058837890625
2367 17 1.1356793642044067
2367 18 1.821824312210083
2367 19 5.472111225128174
2367 20 5.222722053527832
2367 33 24.098613739013672
2373 17 2.55952787399292
2373 18 0.5459482669830322
2375 18 0.9549075961112976
2380 11 4.103343963623047
2380 18 0.5818605422973633
2380 20 7.082735061645508
2381 5 7.956451416015625
2381 18 0.7458670139312744
2381 30 4.636076927185059
2384 18 0.7696936

2566 15 0.525773286819458
2566 17 0.8594701290130615
2566 18 0.0
2566 20 0.7026227116584778
2566 24 19.380693435668945
2566 45 1.1222429275512695
2567 17 0.0
2567 18 0.09000781178474426
2569 18 0.03265342116355896
2569 20 1.5937241315841675
2569 45 0.8489832282066345
2570 5 2.790135383605957
2570 6 4.398261070251465
2570 11 5.832521438598633
2570 15 2.55993914604187
2570 18 0.3214549422264099
2570 20 0.3646085262298584
2570 23 49.88137435913086
2570 24 32.037086486816406
2570 25 4.74732780456543
2570 33 14.80752182006836
2570 45 1.2279255390167236
2570 49 2.8070731163024902
2573 1 11.22728157043457
2573 4 4.9150848388671875
2573 9 38.58513641357422
2573 13 5.7476372718811035
2573 15 4.312306880950928
2573 16 0.0
2573 17 0.0
2573 18 0.0
2573 20 0.0
2573 28 13.613372802734375
2573 30 6.211304664611816
2573 43 0.7092598676681519
2573 44 0.9027078747749329
2573 45 0.20453789830207825
2574 6 10.971915245056152
2574 11 5.972768783569336
2574 16 0.0
2574 17 0.0
2574 18 0.0
2574 20 1.240337133

2664 25 7.178686618804932
2664 29 3.0879061222076416
2664 30 8.69847297668457
2664 43 2.606882095336914
2664 44 0.9773463606834412
2664 45 0.9252302050590515
2665 11 5.525789737701416
2665 17 0.0
2665 18 0.194671630859375
2666 18 0.2273324728012085
2666 20 2.7150895595550537
2666 30 7.187361240386963
2667 5 9.586177825927734
2667 11 3.70660400390625
2667 17 0.11847317218780518
2667 45 1.4886462688446045
2668 18 0.2536892294883728
2669 11 4.483405113220215
2669 18 0.2692197561264038
2669 20 0.35555046796798706
2670 4 16.33020782470703
2670 17 0.9269218444824219
2670 18 0.11881786584854126
2670 20 1.5236754417419434
2670 44 1.5964245796203613
2670 49 3.263913154602051
2672 11 17.01595115661621
2672 13 9.43132495880127
2672 18 0.11541992425918579
2672 30 9.748281478881836
2673 5 4.454233169555664
2673 31 10.823013305664062
2673 32 13.8688325881958
2673 33 13.901229858398438
2673 39 0.8588780164718628
2674 3 3.1971020698547363
2674 6 7.188446521759033
2674 28 2.51651668548584
2674 29 1.960

2781 35 1.759857416152954
2781 36 4.184550762176514
2781 37 1.4535514116287231
2781 43 2.654144048690796
2781 44 3.23933482170105
2781 45 1.1756644248962402
2782 18 0.32920369505882263
2784 17 0.0
2784 18 0.03265342116355896
2785 11 7.659069061279297
2785 18 0.2302895188331604
2786 4 7.31941556930542
2786 5 5.183172225952148
2786 11 4.7253923416137695
2786 13 8.689900398254395
2786 17 0.0
2786 18 0.2797697186470032
2786 20 1.7839316129684448
2786 30 19.527612686157227
2787 3 8.803174018859863
2787 5 7.516599655151367
2787 17 0.0
2787 18 0.0
2787 20 6.225618362426758
2787 30 10.830291748046875
2788 11 2.8135669231414795
2788 13 7.056054592132568
2788 18 0.2568604350090027
2790 3 8.114770889282227
2790 11 3.5824503898620605
2790 17 1.9127038717269897
2790 18 1.050499677658081
2790 20 2.5525147914886475
2790 44 1.9217525720596313
2791 5 4.291065216064453
2791 11 4.735662460327148
2791 15 0.14377498626708984
2791 16 0.8889296054840088
2791 17 0.0
2791 18 0.0
2791 20 0.8312958478927612
2791

2912 18 0.26451295614242554
2912 45 1.6288251876831055
2913 3 5.433533191680908
2913 11 7.442744731903076
2913 18 0.8670197129249573
2913 30 3.532160758972168
2914 11 5.7700653076171875
2916 11 7.84366512298584
2916 17 0.694261908531189
2916 18 0.7717366218566895
2916 20 6.528039455413818
2917 18 1.1439794301986694
2918 11 1.2513102293014526
2918 17 3.52891206741333
2918 30 4.664487361907959
2919 11 4.960488319396973
2919 18 1.025597095489502
2919 45 0.6496229767799377
2920 18 1.056679129600525
2921 11 5.444571018218994
2921 13 8.384830474853516
2921 17 5.6729326248168945
2921 18 0.32239654660224915
2921 20 1.9648038148880005
2921 28 14.439040184020996
2921 30 5.926425933837891
2921 33 28.004924774169922
2921 44 0.8007906079292297
2921 45 0.8040710687637329
2925 17 0.9153904914855957
2926 3 6.001279830932617
2926 4 2.224548816680908
2926 10 1.2076644897460938
2926 11 1.0269566774368286
2926 13 0.0
2926 16 3.7588939666748047
2926 17 12.60295295715332
2926 18 1.2204899787902832
2926 19 1

3086 13 12.362037658691406
3086 17 1.9918855428695679
3086 18 1.6734317541122437
3086 20 6.44291353225708
3086 30 9.190559387207031
3086 44 2.6929407119750977
3089 17 3.127615451812744
3089 18 0.718428373336792
3090 17 1.6882027387619019
3090 18 1.0230047702789307
3093 11 8.093751907348633
3093 17 2.7919631004333496
3093 18 0.5716738104820251
3093 30 5.78743314743042
3094 18 0.7807649374008179
3095 18 0.8174424767494202
3097 17 1.1610667705535889
3099 18 0.7673901319503784
3101 18 0.9263944625854492
3104 17 4.845636367797852
3104 18 1.3466856479644775
3105 18 0.8026683330535889
3107 18 0.7795785665512085
3108 18 0.4504849910736084
3109 17 1.469979166984558
3109 18 0.46412500739097595
3110 5 6.093451976776123
3110 11 5.340542793273926
3110 18 1.4695137739181519
3112 18 1.0960485935211182
3115 18 0.6426414251327515
3116 17 0.9346778988838196
3118 18 0.7729804515838623
3119 4 10.1378755569458
3119 11 10.82402515411377
3120 4 9.720306396484375
3120 11 5.513766288757324
3121 11 6.5053563117

In [400]:
df_impute = df_impute.applymap(lambda x: 0 if x<0 else x).applymap(lambda x: 100 if x>100 else x)

In [402]:
df_impute.describe()

Unnamed: 0,DP02_0036PE,DP02_0037PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0050PE,DP02_0051PE,DP02_0094PE,DP02_0095PE,DP02_0098PE,DP02_0099PE,DP02_0101PE,DP02_0102PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP03_0015PE,DP03_0017PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0075PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE
count,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0
mean,94.4,36.76,48.5,10.45,11.01,7.9,19.81,60.55,72.17,43.28,56.76,8.56,91.36,14.24,85.71,18.09,24.18,3.93,1.09,47.83,5.2,65.04,70.92,58.3,35.15,25.55,42.02,19.77,22.12,9.35,8.7,33.97,44.36,52.59,22.81,22.41,26.24,21.02,2.81,3.95,37.38,31.71,14.75,6.26,2.84,3.18,46.89,15.08,10.05,6.73,21.15
std,13.88,12.43,13.27,5.41,5.19,3.86,7.52,5.55,9.91,11.8,11.54,5.99,6.38,7.26,7.52,11.57,15.19,5.37,3.54,24.56,5.9,7.17,6.7,11.89,11.25,8.86,12.27,8.55,9.37,5.43,6.12,9.41,11.29,12.38,9.92,10.03,11.01,9.66,1.0,2.61,14.6,6.01,6.14,4.66,3.1,5.41,7.2,1.92,1.55,1.34,5.2
min,0.0,0.28,0.0,0.0,0.0,0.0,0.0,9.15,0.0,4.71,1.21,0.0,7.09,0.0,11.45,0.0,0.0,0.0,0.0,0.0,0.0,3.81,33.72,5.06,0.67,0.0,3.04,0.58,0.09,0.0,0.0,0.0,0.14,3.24,0.36,0.1,0.0,0.32,0.7,0.14,2.36,1.84,1.04,0.13,0.0,0.0,7.37,0.63,0.08,0.15,1.81
25%,100.0,28.97,40.74,8.57,9.33,6.47,15.57,58.14,70.1,34.52,48.18,5.42,89.47,10.29,83.58,9.63,11.92,1.38,0.42,26.86,2.32,60.95,67.21,49.52,27.07,19.39,32.19,13.47,15.65,5.43,4.92,28.02,37.57,45.81,15.52,15.05,18.58,14.0,2.36,2.0,27.39,28.85,9.85,3.14,1.1,0.96,42.19,14.23,9.3,6.12,17.21
50%,100.0,36.19,48.85,9.81,10.39,7.74,18.99,59.82,73.21,43.73,56.58,7.74,92.15,12.67,87.27,16.28,22.86,2.66,0.61,45.45,3.76,65.72,71.26,58.04,34.19,23.93,42.34,18.98,21.37,8.35,7.37,34.18,44.79,53.52,21.96,21.71,25.64,20.21,2.73,3.5,40.32,32.72,13.35,4.57,1.71,1.51,47.2,15.3,10.07,6.66,20.37
75%,100.0,42.26,56.44,11.07,11.62,8.77,23.18,62.29,76.37,51.71,65.6,10.62,94.56,16.08,89.93,24.82,34.47,4.75,0.92,67.97,5.57,69.79,75.16,67.72,41.73,31.31,50.45,24.66,27.59,12.12,10.8,40.02,51.61,59.87,28.44,28.03,32.4,26.46,3.07,5.28,49.21,35.82,18.87,7.73,3.14,2.92,51.56,16.23,10.88,7.34,24.31
max,100.0,94.07,97.52,96.62,88.21,90.59,92.27,100.0,99.48,97.76,91.71,88.35,100.0,89.42,100.0,92.54,90.99,95.61,97.68,100.0,67.78,96.05,96.86,95.97,97.27,82.53,98.14,70.97,87.86,56.13,87.29,68.0,92.57,97.72,66.44,66.85,92.18,63.42,22.25,21.2,98.28,52.05,42.72,29.99,20.19,54.32,92.24,30.11,28.47,26.59,45.75


In [367]:
df_target.describe()

Unnamed: 0,DP02_0036PE,DP02_0037PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0050PE,DP02_0051PE,DP02_0094PE,DP02_0095PE,DP02_0098PE,DP02_0099PE,DP02_0101PE,DP02_0102PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP03_0015PE,DP03_0017PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0075PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE
count,3117.0,3107.0,3124.0,3124.0,3124.0,3124.0,3124.0,3091.0,3091.0,3129.0,3129.0,3067.0,3067.0,3129.0,3129.0,3129.0,3129.0,3129.0,3129.0,3129.0,3129.0,3140.0,3141.0,3132.0,3132.0,3132.0,3132.0,3141.0,3135.0,3140.0,3131.0,3141.0,3140.0,3059.0,3141.0,3141.0,3140.0,3141.0,3138.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0,3141.0
mean,1242.09,36.75,48.88,10.36,10.84,7.86,19.82,60.42,73.13,43.21,56.79,8.26,91.74,14.16,85.84,17.87,24.2,3.89,1.1,47.75,5.19,65.02,70.8,57.9,34.96,25.73,42.1,19.76,22.17,9.36,8.62,33.93,44.3,52.92,22.81,22.4,26.2,21.06,2.85,3.94,37.36,31.72,14.71,6.24,2.85,3.17,46.95,15.06,10.06,6.75,21.19
std,4113.39,18.26,16.9,9.85,9.85,7.89,12.57,10.73,16.28,18.7,18.7,12.33,12.33,12.76,12.76,15.77,18.76,7.58,4.64,27.74,8.77,10.63,8.74,16.53,15.32,13.03,16.53,8.91,13.04,5.97,10.01,11.56,14.67,24.44,10.27,10.33,12.64,10.19,1.79,3.3,15.45,7.59,6.88,5.06,3.37,5.63,8.9,3.43,2.86,2.47,6.69
min,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,16.3,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25%,123.0,25.1,38.1,4.7,5.3,3.2,12.0,55.0,65.6,30.3,45.5,0.0,88.05,5.8,81.2,6.5,9.5,0.0,0.0,24.9,0.2,58.88,65.9,47.5,24.9,17.0,30.7,13.4,13.2,5.1,2.0,26.7,35.2,37.7,15.4,14.9,17.28,13.7,2.0,1.7,26.7,27.5,9.6,2.8,0.8,0.6,41.1,13.4,8.5,5.4,16.7
50%,298.0,35.9,47.7,8.5,9.0,6.4,18.2,60.3,73.9,42.1,57.9,4.5,95.5,11.5,88.5,14.3,21.1,1.4,0.0,46.6,2.3,65.8,71.5,58.9,34.2,24.65,41.1,18.8,20.5,8.3,5.9,33.8,44.3,52.3,21.9,21.5,25.2,20.0,2.5,3.1,39.7,32.6,13.5,4.8,1.8,1.6,47.2,15.4,10.2,6.7,20.3
75%,816.0,47.1,59.1,13.3,13.6,10.3,25.42,65.7,82.9,54.5,69.7,11.95,100.0,18.8,94.2,25.0,35.1,4.7,0.6,70.3,5.8,71.9,76.5,69.3,43.4,33.9,52.5,24.8,29.0,12.1,11.6,40.9,52.9,68.0,28.6,28.2,33.2,26.7,3.3,5.3,48.9,36.9,19.2,8.1,3.5,3.3,52.6,17.0,11.7,8.1,24.8
max,121611.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,83.3,100.0,100.0,100.0,100.0,100.0,100.0,75.1,100.0,61.6,100.0,87.0,100.0,100.0,70.9,70.9,100.0,67.2,25.9,40.5,100.0,65.2,50.1,33.7,21.7,57.7,100.0,43.3,31.8,30.0,100.0


In [403]:
df_impute.shape

(3142, 51)

In [404]:
df_target.shape

(3142, 51)

In [434]:
for i in range(df_target.shape[0]):
    for j in range(df_target.shape[1]):
        if df_target.iloc[i, j] != df_target.iloc[i, j]:
            df_target.iloc[i, j] = df_impute.iloc[i, j]

In [436]:
df_target.describe()

Unnamed: 0,DP02_0036PE,DP02_0037PE,DP02_0044PE,DP02_0045PE,DP02_0046PE,DP02_0047PE,DP02_0048PE,DP02_0050PE,DP02_0051PE,DP02_0094PE,DP02_0095PE,DP02_0098PE,DP02_0099PE,DP02_0101PE,DP02_0102PE,DP02_0104PE,DP02_0105PE,DP02_0106PE,DP02_0107PE,DP02_0108PE,DP02_0109PE,DP03_0015PE,DP03_0017PE,DP03_0110PE,DP03_0111PE,DP03_0112PE,DP03_0113PE,DP03_0120PE,DP03_0121PE,DP03_0123PE,DP03_0124PE,DP03_0125PE,DP03_0126PE,DP03_0127PE,DP03_0129PE,DP03_0130PE,DP03_0131PE,DP03_0132PE,DP04_0075PE,DP04_0094PE,DP04_0095PE,DP04_0096PE,DP04_0097PE,DP04_0098PE,DP04_0099PE,DP04_0100PE,DP04_0111PE,DP04_0112PE,DP04_0113PE,DP04_0114PE,DP04_0115PE
count,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0,3142.0
mean,1266.61,36.73,48.66,10.41,10.88,7.89,19.84,60.64,72.64,43.27,56.85,8.27,91.71,14.2,85.79,17.97,24.22,3.93,1.1,47.63,5.21,65.02,70.8,57.91,35.02,25.73,42.09,19.76,22.19,9.35,8.63,33.92,44.29,52.92,22.8,22.4,26.19,21.05,2.85,3.94,37.36,31.71,14.71,6.24,2.85,3.17,46.96,15.06,10.06,6.75,21.18
std,4158.1,18.21,17.11,9.97,9.87,7.9,12.57,10.82,16.69,18.69,18.7,12.26,12.32,12.79,12.78,15.83,18.76,7.65,4.63,27.75,8.75,10.63,8.74,16.52,15.36,13.03,16.53,8.91,13.03,5.97,10.0,11.57,14.68,24.22,10.27,10.33,12.64,10.19,1.79,3.3,15.45,7.61,6.88,5.06,3.37,5.64,8.91,3.43,2.86,2.47,6.69
min,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-1.45,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,16.3,0.0,0.0,0.0,0.0,0.0,0.0,-2.18,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25%,123.0,25.1,37.9,4.73,5.4,3.2,12.0,55.0,64.8,30.4,45.6,0.0,88.1,5.8,81.1,6.5,9.5,0.0,0.0,24.7,0.2,58.9,65.9,47.5,25.0,17.0,30.7,13.4,13.2,5.1,2.0,26.7,35.2,37.8,15.4,14.9,17.2,13.7,2.0,1.7,26.7,27.5,9.6,2.8,0.8,0.6,41.1,13.4,8.5,5.4,16.7
50%,299.0,35.9,47.65,8.5,9.1,6.4,18.3,60.5,73.7,42.1,57.9,4.5,95.4,11.6,88.4,14.4,21.2,1.4,0.0,46.4,2.4,65.8,71.5,58.95,34.3,24.65,41.0,18.8,20.5,8.25,5.9,33.8,44.3,52.35,21.9,21.5,25.2,20.0,2.5,3.1,39.7,32.6,13.5,4.8,1.8,1.6,47.2,15.4,10.2,6.7,20.3
75%,821.0,47.0,59.0,13.3,13.7,10.3,25.5,66.0,82.7,54.5,69.8,11.9,100.0,18.9,94.2,25.3,35.0,4.8,0.6,70.2,5.8,71.9,76.5,69.2,43.48,33.88,52.5,24.8,29.0,12.1,11.6,40.9,52.9,67.8,28.6,28.2,33.2,26.67,3.3,5.3,48.9,36.9,19.17,8.1,3.5,3.3,52.6,17.0,11.7,8.1,24.8
max,121611.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,100.0,101.16,100.0,100.0,100.0,100.0,100.0,100.0,100.0,83.3,100.0,100.0,100.0,100.0,100.0,100.0,75.1,100.0,61.6,100.0,87.0,100.0,100.0,70.9,70.9,100.0,67.2,25.9,40.5,100.0,65.2,50.1,33.7,21.7,57.7,100.0,43.3,31.8,30.0,100.0


In [463]:
for col in df_target.columns:
    var_dict[2016].loc[:, col] = df_target.loc[:, col]

In [None]:
missing_row = []
for col in var_dict[2010].:
    if col not in var_dict[2010].columns:
        missing_col.append(col)
missing_col

In [455]:
missing_col = []
for col in var_dict[2016].columns:
    if col not in var_dict[2010].columns:
        missing_col.append(col)
missing_col

['CD115',
 'DP02_0150PE',
 'DP02_0151PE',
 'DP02_0152PE',
 'DP04_0142PE',
 'DP04_0143PE',
 'DP05_0082PE',
 'DP05_0083PE',
 'DP05_0084PE',
 'ZCTA5']

In [461]:
for year in range(2010, 2018):
    var_dict[year] = var_dict[year].applymap(
        lambda x: np.nan if x==-666666666 or x==-888888888 or x==-999999999 else x
    )

In [None]:
for year in range(2010, 2018):
    df = var_dict[year].drop(
        columns=var_dict[year].loc[
            0, 
            ((var_dict[year].isnull().sum()>0)&(var_dict[year].isnull().sum()!=var_dict[year].shape[0]))
        ].index
    )
    df = df.loc[:, df.columns.str.contains(r"DP0")].dropna(axis=1)
    df_target = var_dict[year].loc[
        :, var_dict[year].loc[
            0,
            ((var_dict[year].isnull().sum()>0)&(var_dict[year].isnull().sum()!=var_dict[year].shape[0]))
        ].index
    ]
    impute_var_df_list = []
    test_scores = []
    for i, col in enumerate(var_dict[year].loc[0, 
                                               ((var_dict[year].isnull().sum()>0)&
                                                (var_dict[year].isnull().sum()!=var_dict[year].shape[0]))
                                              ].index):

        xgr_impute = XGBRegressor()
        df_temp = df.loc[df_target.iloc[:, i].notnull()]
        df_target_temp = df_target.iloc[:, i].dropna()

        X_train, X_test, y_train, y_test = train_test_split(df_temp, df_target_temp)
        xgr_impute.fit(X_train, y_train)
        print(col)
        test_scores.append(xgr_impute.score(X_test, y_test))

        impute_var_df_list.append(pd.DataFrame(xgr_impute.predict(df), columns=[col]))
    print(year, "average test score: ", np.mean(test_scores))
    df_impute = reduce(lambda left, right: pd.merge(
        left, right, left_index=True, right_index=True
    ), impute_var_df_list
                      )
    for i in range(df_target.shape[0]):
        for j in range(df_target.shape[1]):
            if df_target.iloc[i, j] != df_target.iloc[i, j]:
                df_target.iloc[i, j] = df_impute.iloc[i, j]
    for col in df_target.columns:
        var_dict[year].loc[:, col] = df_target.loc[:, col]

  if getattr(data, 'base', None) is not None and \


DP02_0037PE


  if getattr(data, 'base', None) is not None and \


DP02_0044PE


  if getattr(data, 'base', None) is not None and \


DP02_0045PE


  if getattr(data, 'base', None) is not None and \


DP02_0046PE


  if getattr(data, 'base', None) is not None and \


DP02_0047PE


  if getattr(data, 'base', None) is not None and \


DP02_0048PE


  if getattr(data, 'base', None) is not None and \


DP02_0050PE


  if getattr(data, 'base', None) is not None and \


DP02_0051PE


  if getattr(data, 'base', None) is not None and \


DP02_0094PE


  if getattr(data, 'base', None) is not None and \


DP02_0095PE


  if getattr(data, 'base', None) is not None and \


DP02_0098PE


  if getattr(data, 'base', None) is not None and \


DP02_0099PE


  if getattr(data, 'base', None) is not None and \


DP02_0101PE


  if getattr(data, 'base', None) is not None and \


DP02_0102PE


  if getattr(data, 'base', None) is not None and \


DP02_0104PE


  if getattr(data, 'base', None) is not None and \


DP02_0105PE


  if getattr(data, 'base', None) is not None and \


DP02_0106PE


  if getattr(data, 'base', None) is not None and \


DP02_0107PE


  if getattr(data, 'base', None) is not None and \


DP02_0108PE


  if getattr(data, 'base', None) is not None and \


DP02_0109PE


  if getattr(data, 'base', None) is not None and \


DP03_0015PE


  if getattr(data, 'base', None) is not None and \


DP03_0017PE


  if getattr(data, 'base', None) is not None and \


DP03_0089PE


  if getattr(data, 'base', None) is not None and \


DP03_0120PE


  if getattr(data, 'base', None) is not None and \


DP03_0121PE


  if getattr(data, 'base', None) is not None and \


DP03_0123PE


  if getattr(data, 'base', None) is not None and \


DP03_0124PE


  if getattr(data, 'base', None) is not None and \


DP03_0125PE


  if getattr(data, 'base', None) is not None and \


DP03_0126PE


  if getattr(data, 'base', None) is not None and \


DP03_0127PE


  if getattr(data, 'base', None) is not None and \


DP03_0129PE


  if getattr(data, 'base', None) is not None and \


DP03_0130PE


  if getattr(data, 'base', None) is not None and \


DP03_0131PE


  if getattr(data, 'base', None) is not None and \


DP03_0132PE


  if getattr(data, 'base', None) is not None and \


DP03_0135PE


  if getattr(data, 'base', None) is not None and \


DP04_0080PE


  if getattr(data, 'base', None) is not None and \


DP04_0081PE


  if getattr(data, 'base', None) is not None and \


DP04_0082PE


  if getattr(data, 'base', None) is not None and \


DP04_0083PE


  if getattr(data, 'base', None) is not None and \


DP04_0084PE


  if getattr(data, 'base', None) is not None and \


DP04_0085PE


  if getattr(data, 'base', None) is not None and \


DP04_0086PE


  if getattr(data, 'base', None) is not None and \


DP04_0087PE


  if getattr(data, 'base', None) is not None and \


DP04_0090PE


  if getattr(data, 'base', None) is not None and \


DP04_0091PE


  if getattr(data, 'base', None) is not None and \


DP04_0093PE


  if getattr(data, 'base', None) is not None and \


DP04_0094PE


  if getattr(data, 'base', None) is not None and \


DP04_0095PE


  if getattr(data, 'base', None) is not None and \


DP04_0096PE


  if getattr(data, 'base', None) is not None and \


DP04_0097PE


  if getattr(data, 'base', None) is not None and \


DP04_0098PE


  if getattr(data, 'base', None) is not None and \


DP04_0099PE


  if getattr(data, 'base', None) is not None and \


DP04_0102PE


  if getattr(data, 'base', None) is not None and \


DP04_0103PE


  if getattr(data, 'base', None) is not None and \


DP04_0104PE


  if getattr(data, 'base', None) is not None and \


DP04_0105PE


  if getattr(data, 'base', None) is not None and \


DP04_0106PE


  if getattr(data, 'base', None) is not None and \


DP04_0109PE


  if getattr(data, 'base', None) is not None and \


DP04_0110PE


  if getattr(data, 'base', None) is not None and \


DP04_0111PE


  if getattr(data, 'base', None) is not None and \


DP04_0112PE


  if getattr(data, 'base', None) is not None and \


DP04_0113PE


  if getattr(data, 'base', None) is not None and \


DP04_0116PE


  if getattr(data, 'base', None) is not None and \


DP04_0117PE


  if getattr(data, 'base', None) is not None and \


DP04_0118PE


  if getattr(data, 'base', None) is not None and \


DP04_0119PE


  if getattr(data, 'base', None) is not None and \


DP04_0120PE


  if getattr(data, 'base', None) is not None and \


DP04_0121PE


  if getattr(data, 'base', None) is not None and \


DP04_0122PE


  if getattr(data, 'base', None) is not None and \


DP05_0026PE


  if getattr(data, 'base', None) is not None and \


DP05_0027PE
2010 average test score:  0.4754814671318099


  if getattr(data, 'base', None) is not None and \


DP02_0036PE


  if getattr(data, 'base', None) is not None and \


DP02_0037PE


  if getattr(data, 'base', None) is not None and \


DP02_0044PE


  if getattr(data, 'base', None) is not None and \


DP02_0045PE


  if getattr(data, 'base', None) is not None and \


DP02_0046PE


  if getattr(data, 'base', None) is not None and \


DP02_0047PE


  if getattr(data, 'base', None) is not None and \


DP02_0048PE


  if getattr(data, 'base', None) is not None and \


DP02_0050PE


  if getattr(data, 'base', None) is not None and \


DP02_0051PE


  if getattr(data, 'base', None) is not None and \


DP02_0053PE


  if getattr(data, 'base', None) is not None and \


DP02_0054PE


  if getattr(data, 'base', None) is not None and \


DP02_0055PE


  if getattr(data, 'base', None) is not None and \


DP02_0056PE


  if getattr(data, 'base', None) is not None and \


DP02_0057PE


  if getattr(data, 'base', None) is not None and \


DP02_0094PE


  if getattr(data, 'base', None) is not None and \


DP02_0095PE


  if getattr(data, 'base', None) is not None and \


In [477]:
for year in range(2010, 2018):
    print(var_dict[year].shape[0])

3143
3143
3143
3143
3142
3142
3142
3142
