In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import matplotlib.dates as mdates
import matplotlib.colors as mcolors
from matplotlib.patches import Patch
from pathlib import Path
from multiprocessing.dummy import Pool as ThreadPool
from collections import defaultdict
from natsort import natsorted
import tsfresh as tf
import sklearn

In [2]:
# Show every column when a DataFrame is displayed (None removes the limit).
# Use the fully qualified option name: the short form 'max_columns' is matched
# as a pattern and is ambiguous on newer pandas (it also matches
# 'styler.render.max_columns'), which raises OptionError.
pd.set_option('display.max_columns', None)

In [3]:
import os
import glob

# Directory containing the CSV files to load.
dataset_path = 'data_feats_90_c/'

# glob returns paths in arbitrary, filesystem-dependent order; sort them so the
# row order of the concatenated frame is the same on every run and machine.
csv_files = sorted(glob.glob(dataset_path + '*.csv'))
if not csv_files:
    # pd.concat on an empty list fails with an opaque "No objects to concatenate";
    # fail early with a message that names the directory instead.
    raise FileNotFoundError(f"No CSV files found in {dataset_path!r}")

# Read each file into its own frame (first row is the header, no index column).
all_df = [pd.read_csv(filename, index_col=None, header=0) for filename in csv_files]

# Stack all frames row-wise and renumber the index 0..n-1.
df = pd.concat(all_df, axis=0, ignore_index=True)

In [4]:
# Drop every row labelled class 7, then relabel class 8 as 7.
# NOTE: this cell is not idempotent - running it a second time would drop the
# rows that were just relabelled to 7. Re-run the loading cell first.
#
# .copy() makes the filtered result an independent frame, and the replaced
# column is assigned back explicitly. The previous chained
# df['class_code'].replace(..., inplace=True) acted on an intermediate object:
# it triggers SettingWithCopyWarning and does not update df under Copy-on-Write.
df = df[df.class_code != 7].copy()
df['class_code'] = df['class_code'].replace({8: 7})


In [5]:
# List the distinct class labels remaining in the frame, in order of first appearance.
df['class_code'].unique()

array([5, 7, 3, 1, 4, 6, 0, 2])

In [6]:
# Count missing values per column.
nans = df.isna().sum()
# Lift the display limits so the printed listing is not truncated, and show
# only the columns that contain at least one missing value.
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
    print(nans.loc[nans.ne(0)])

P-PDG__fft_aggregated__aggtype_"centroid"                 8571
P-PDG__fft_aggregated__aggtype_"variance"                 8571
P-PDG__fft_aggregated__aggtype_"skew"                    37244
P-PDG__fft_aggregated__aggtype_"kurtosis"                37244
P-PDG__variation_coefficient                              8571
P-PDG__friedrich_coefficients__coeff_1__m_3__r_30        20675
P-PDG__friedrich_coefficients__coeff_3__m_3__r_30        20675
P-TPT__fft_aggregated__aggtype_"centroid"                   64
P-TPT__fft_aggregated__aggtype_"variance"                   64
P-TPT__fft_aggregated__aggtype_"skew"                    30450
P-TPT__fft_aggregated__aggtype_"kurtosis"                30450
P-TPT__variation_coefficient                                64
P-TPT__friedrich_coefficients__coeff_1__m_3__r_30        12623
P-TPT__friedrich_coefficients__coeff_3__m_3__r_30        12623
T-TPT__fft_aggregated__aggtype_"centroid"                 6514
T-TPT__fft_aggregated__aggtype_"variance"              

In [7]:
# Remove unwanted columns in a single, non-mutating call:
#   - 'Unnamed: 0': leftover index column after feature extraction, unnecessary
#   - 'QGL__variation_coefficient': too many NaN values
#   - every column whose name contains 'friedrich' or 'fft_aggregated'
columns_to_drop = ['Unnamed: 0', 'QGL__variation_coefficient']
columns_to_drop += list(df.filter(regex='friedrich|fft_aggregated'))
# errors='ignore' keeps the cell safe to re-run: columns that were already
# dropped are skipped instead of raising KeyError.
df = df.drop(columns=columns_to_drop, errors='ignore')

In [8]:
# Report the frame's (rows, columns), then preview its first row.
print(df.shape)
df.iloc[:1]

(51764, 108)


Unnamed: 0,P-PDG__mean,P-PDG__variance,P-PDG__skewness,P-PDG__kurtosis,P-PDG__maximum,P-PDG__minimum,P-PDG__median,P-PDG__quantile__q_0.1,P-PDG__quantile__q_0.2,P-PDG__quantile__q_0.3,P-PDG__quantile__q_0.4,P-PDG__quantile__q_0.6,P-PDG__quantile__q_0.7,P-PDG__quantile__q_0.8,P-PDG__quantile__q_0.9,P-PDG__variation_coefficient,P-PDG__mean_change,P-PDG__mean_second_derivative_central,P-TPT__mean,P-TPT__variance,P-TPT__skewness,P-TPT__kurtosis,P-TPT__maximum,P-TPT__minimum,P-TPT__median,P-TPT__quantile__q_0.1,P-TPT__quantile__q_0.2,P-TPT__quantile__q_0.3,P-TPT__quantile__q_0.4,P-TPT__quantile__q_0.6,P-TPT__quantile__q_0.7,P-TPT__quantile__q_0.8,P-TPT__quantile__q_0.9,P-TPT__variation_coefficient,P-TPT__mean_change,P-TPT__mean_second_derivative_central,T-TPT__mean,T-TPT__variance,T-TPT__skewness,T-TPT__kurtosis,T-TPT__maximum,T-TPT__minimum,T-TPT__median,T-TPT__quantile__q_0.1,T-TPT__quantile__q_0.2,T-TPT__quantile__q_0.3,T-TPT__quantile__q_0.4,T-TPT__quantile__q_0.6,T-TPT__quantile__q_0.7,T-TPT__quantile__q_0.8,T-TPT__quantile__q_0.9,T-TPT__variation_coefficient,T-TPT__mean_change,T-TPT__mean_second_derivative_central,P-MON-CKP__mean,P-MON-CKP__variance,P-MON-CKP__skewness,P-MON-CKP__kurtosis,P-MON-CKP__maximum,P-MON-CKP__minimum,P-MON-CKP__median,P-MON-CKP__quantile__q_0.1,P-MON-CKP__quantile__q_0.2,P-MON-CKP__quantile__q_0.3,P-MON-CKP__quantile__q_0.4,P-MON-CKP__quantile__q_0.6,P-MON-CKP__quantile__q_0.7,P-MON-CKP__quantile__q_0.8,P-MON-CKP__quantile__q_0.9,P-MON-CKP__variation_coefficient,P-MON-CKP__mean_change,P-MON-CKP__mean_second_derivative_central,T-JUS-CKP__mean,T-JUS-CKP__variance,T-JUS-CKP__skewness,T-JUS-CKP__kurtosis,T-JUS-CKP__maximum,T-JUS-CKP__minimum,T-JUS-CKP__median,T-JUS-CKP__quantile__q_0.1,T-JUS-CKP__quantile__q_0.2,T-JUS-CKP__quantile__q_0.3,T-JUS-CKP__quantile__q_0.4,T-JUS-CKP__quantile__q_0.6,T-JUS-CKP__quantile__q_0.7,T-JUS-CKP__quantile__q_0.8,T-JUS-CKP__quantile__q_0.9,T-JUS-CKP__variation_coefficient,T-JUS-CKP__mean_change,T-JUS-CKP__mean_s
econd_derivative_central,QGL__mean,QGL__variance,QGL__skewness,QGL__kurtosis,QGL__maximum,QGL__minimum,QGL__median,QGL__quantile__q_0.1,QGL__quantile__q_0.2,QGL__quantile__q_0.3,QGL__quantile__q_0.4,QGL__quantile__q_0.6,QGL__quantile__q_0.7,QGL__quantile__q_0.8,QGL__quantile__q_0.9,QGL__mean_change,QGL__mean_second_derivative_central,class_code
0,30452520.0,39.064321,-0.029904,-1.707532,30452532.0,30452512.0,30452523.0,30452514.0,30452515.0,30452516.0,30452518.0,30452526.0,30452527.3,30452528.0,30452529.0,2.052423e-07,-0.168539,0.0,21453280.0,12899.168025,0.19382,-0.722604,21453566.0,21453039.0,21453275.0,21453131.0,21453169.0,21453199.7,21453229.6,21453331.0,21453348.3,21453372.2,21453425.2,5e-06,3.022472,1.579545,125.35756,7.086469e-09,0.054108,-0.473179,125.35778,125.35736,125.35756,125.35745,125.35748,125.357517,125.357536,125.35758,125.35761,125.357632,125.357661,6.715285e-07,-7.865169e-07,6.25e-07,1519597.66,3.915511,-0.008192,-1.022432,1519601.0,1519594.0,1519597.7,1519595.0,1519595.98,1519596.37,1519597.0,1519598.0,1519599.0,1519599.82,1519600.31,1e-06,-0.078652,0.0,92.644159,2e-06,0.059343,-1.201477,92.646534,92.641924,92.64413,92.642336,92.64277,92.643215,92.64367,92.644594,92.645066,92.645547,92.646035,1.5e-05,-5.2e-05,6.25e-08,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5


In [9]:
# Re-count missing values per column now that columns have been dropped.
nans = df.isna().sum()
# Lift the display limits so the printed listing is not truncated, and show
# only the columns that still contain missing values.
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
    print(nans.loc[nans.ne(0)])

P-PDG__variation_coefficient        8571
P-TPT__variation_coefficient          64
T-TPT__variation_coefficient        6514
P-MON-CKP__variation_coefficient    1200
T-JUS-CKP__variation_coefficient    1819
dtype: int64


In [10]:
# Impute missing values separately for each class label, then stitch the
# per-class frames back together (original index labels are kept).
# NOTE(review): imputing per class uses the label itself; if this frame is later
# split into train/test sets, that may leak label information - confirm intent.
imputed_df_list = []
for code in df['class_code'].unique():
    print(f'class_code == {code}')
    # tsfresh's impute modifies the frame it receives in place. Hand it an
    # explicit copy of the class subset so it never writes into a slice of df
    # (the source of the SettingWithCopyWarning this cell used to emit).
    class_rows = df.loc[df['class_code'] == code].copy()
    imputed = tf.utilities.dataframe_functions.impute(class_rows)
    print(imputed.shape)
    imputed_df_list.append(imputed)
imputed_df = pd.concat(imputed_df_list)
imputed_df

class_code == 5


A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  return self._where(cond, other, inplace, axis, level, errors=errors)


(14443, 108)
class_code == 7
(2529, 108)
class_code == 3
(5284, 108)
class_code == 1
(9299, 108)
class_code == 4
(2468, 108)
class_code == 6
(6508, 108)
class_code == 0
(10556, 108)
class_code == 2
(677, 108)


Unnamed: 0,P-PDG__mean,P-PDG__variance,P-PDG__skewness,P-PDG__kurtosis,P-PDG__maximum,P-PDG__minimum,P-PDG__median,P-PDG__quantile__q_0.1,P-PDG__quantile__q_0.2,P-PDG__quantile__q_0.3,P-PDG__quantile__q_0.4,P-PDG__quantile__q_0.6,P-PDG__quantile__q_0.7,P-PDG__quantile__q_0.8,P-PDG__quantile__q_0.9,P-PDG__variation_coefficient,P-PDG__mean_change,P-PDG__mean_second_derivative_central,P-TPT__mean,P-TPT__variance,P-TPT__skewness,P-TPT__kurtosis,P-TPT__maximum,P-TPT__minimum,P-TPT__median,P-TPT__quantile__q_0.1,P-TPT__quantile__q_0.2,P-TPT__quantile__q_0.3,P-TPT__quantile__q_0.4,P-TPT__quantile__q_0.6,P-TPT__quantile__q_0.7,P-TPT__quantile__q_0.8,P-TPT__quantile__q_0.9,P-TPT__variation_coefficient,P-TPT__mean_change,P-TPT__mean_second_derivative_central,T-TPT__mean,T-TPT__variance,T-TPT__skewness,T-TPT__kurtosis,T-TPT__maximum,T-TPT__minimum,T-TPT__median,T-TPT__quantile__q_0.1,T-TPT__quantile__q_0.2,T-TPT__quantile__q_0.3,T-TPT__quantile__q_0.4,T-TPT__quantile__q_0.6,T-TPT__quantile__q_0.7,T-TPT__quantile__q_0.8,T-TPT__quantile__q_0.9,T-TPT__variation_coefficient,T-TPT__mean_change,T-TPT__mean_second_derivative_central,P-MON-CKP__mean,P-MON-CKP__variance,P-MON-CKP__skewness,P-MON-CKP__kurtosis,P-MON-CKP__maximum,P-MON-CKP__minimum,P-MON-CKP__median,P-MON-CKP__quantile__q_0.1,P-MON-CKP__quantile__q_0.2,P-MON-CKP__quantile__q_0.3,P-MON-CKP__quantile__q_0.4,P-MON-CKP__quantile__q_0.6,P-MON-CKP__quantile__q_0.7,P-MON-CKP__quantile__q_0.8,P-MON-CKP__quantile__q_0.9,P-MON-CKP__variation_coefficient,P-MON-CKP__mean_change,P-MON-CKP__mean_second_derivative_central,T-JUS-CKP__mean,T-JUS-CKP__variance,T-JUS-CKP__skewness,T-JUS-CKP__kurtosis,T-JUS-CKP__maximum,T-JUS-CKP__minimum,T-JUS-CKP__median,T-JUS-CKP__quantile__q_0.1,T-JUS-CKP__quantile__q_0.2,T-JUS-CKP__quantile__q_0.3,T-JUS-CKP__quantile__q_0.4,T-JUS-CKP__quantile__q_0.6,T-JUS-CKP__quantile__q_0.7,T-JUS-CKP__quantile__q_0.8,T-JUS-CKP__quantile__q_0.9,T-JUS-CKP__variation_coefficient,T-JUS-CKP__mean_change,T-JUS-CKP__mean_s
econd_derivative_central,QGL__mean,QGL__variance,QGL__skewness,QGL__kurtosis,QGL__maximum,QGL__minimum,QGL__median,QGL__quantile__q_0.1,QGL__quantile__q_0.2,QGL__quantile__q_0.3,QGL__quantile__q_0.4,QGL__quantile__q_0.6,QGL__quantile__q_0.7,QGL__quantile__q_0.8,QGL__quantile__q_0.9,QGL__mean_change,QGL__mean_second_derivative_central,class_code
0,3.045252e+07,39.064321,-0.029904,-1.707532,30452532.0,30452512.0,30452523.0,30452514.0,30452515.0,30452516.0,30452518.0,30452526.0,30452527.3,30452528.0,30452529.0,2.052423e-07,-0.168539,0.000000,2.145328e+07,1.289917e+04,0.193820,-0.722604,21453566.0,21453039.0,21453275.0,21453131.0,21453169.0,21453199.7,21453229.6,21453331.0,21453348.3,21453372.2,21453425.2,0.000005,3.022472,1.579545,125.357560,7.086469e-09,0.054108,-0.473179,125.357780,125.357360,125.357560,125.357450,125.357480,125.357517,125.357536,125.357580,125.357610,125.357632,125.357661,6.715285e-07,-7.865169e-07,6.250000e-07,1.519598e+06,3.915511,-0.008192,-1.022432,1519601.0,1519594.0,1519597.7,1519595.00,1519595.98,1519596.37,1519597.00,1519598.00,1519599.00,1519599.82,1519600.31,1.302164e-06,-0.078652,0.000000,92.644159,1.821403e-06,0.059343,-1.201477,92.646534,92.641924,92.644130,92.642336,92.642770,92.643215,92.643670,92.644594,92.645066,92.645547,92.646035,0.000015,-0.000052,6.250000e-08,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5
1,3.045252e+07,30.762469,-0.101150,-1.311308,30452527.0,30452507.0,30452518.0,30452509.9,30452512.0,30452513.0,30452514.0,30452521.0,30452522.0,30452523.0,30452524.0,1.821325e-07,-0.022472,0.125000,2.145324e+07,1.013079e+04,0.447268,-0.311287,21453511.0,21453025.0,21453230.5,21453126.0,21453146.0,21453174.1,21453201.6,21453261.0,21453302.6,21453342.6,21453366.7,0.000005,-2.269663,-0.045455,125.357354,6.379062e-09,0.245186,-0.644995,125.357550,125.357220,125.357350,125.357249,125.357270,125.357300,125.357336,125.357370,125.357390,125.357420,125.357470,6.371308e-07,-2.921348e-06,-3.977273e-07,1.519591e+06,3.380914,-0.061082,-1.281843,1519594.0,1519588.0,1519591.0,1519588.29,1519589.00,1519589.34,1519590.06,1519591.94,1519592.00,1519592.70,1519593.00,1.210014e-06,-0.067416,0.000000,92.639988,1.140812e-06,0.097792,-1.214437,92.641880,92.638236,92.639935,92.638572,92.638900,92.639227,92.639569,92.640320,92.640713,92.641100,92.641486,0.000012,-0.000041,3.409091e-08,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5
2,3.045251e+07,43.143333,-0.125560,-1.227478,30452523.0,30452499.0,30452514.0,30452503.9,30452505.0,30452507.0,30452509.0,30452515.0,30452517.0,30452518.0,30452520.0,2.156918e-07,0.022472,0.022727,2.145323e+07,1.215263e+04,0.183955,-0.179435,21453502.0,21452952.0,21453214.0,21453110.2,21453125.8,21453171.7,21453190.0,21453265.6,21453289.9,21453327.2,21453377.8,0.000005,0.595506,-0.420455,125.357183,5.564802e-09,0.291710,-0.215432,125.357380,125.357040,125.357180,125.357080,125.357120,125.357140,125.357160,125.357200,125.357220,125.357250,125.357281,5.950804e-07,-1.011236e-06,5.681818e-08,1.519586e+06,2.658069,-0.278000,-1.164092,1519588.0,1519583.0,1519586.0,1519583.00,1519584.00,1519584.77,1519585.36,1519586.34,1519587.00,1519587.00,1519588.00,1.072897e-06,-0.056180,0.000000,92.636607,7.914609e-07,0.119171,-1.220648,92.638199,92.635183,92.636565,92.635434,92.635689,92.635959,92.636252,92.636883,92.637205,92.637527,92.637860,0.000010,-0.000034,6.250000e-08,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5
3,3.045251e+07,28.889506,0.109718,-1.159913,30452518.0,30452497.0,30452507.0,30452501.0,30452503.0,30452504.0,30452505.0,30452510.0,30452511.0,30452513.0,30452515.0,1.765009e-07,0.089888,-0.017045,2.145324e+07,1.328920e+04,0.418454,-0.510260,21453524.0,21453020.0,21453216.5,21453113.7,21453130.4,21453152.7,21453183.8,21453266.4,21453305.7,21453340.2,21453372.9,0.000005,0.213483,1.090909,125.357036,4.845988e-09,0.479575,-0.045849,125.357230,125.356900,125.357030,125.356959,125.356980,125.356990,125.357010,125.357044,125.357070,125.357100,125.357122,5.553189e-07,-1.573034e-06,9.659091e-07,1.519581e+06,1.253111,-0.154681,-1.408403,1519583.0,1519579.0,1519581.0,1519579.49,1519580.00,1519580.00,1519580.62,1519581.94,1519582.00,1519582.00,1519582.40,7.366665e-07,-0.044944,0.001136,92.633901,5.018663e-07,0.105621,-1.202358,92.635155,92.632738,92.633859,92.632963,92.633183,92.633403,92.633625,92.634113,92.634378,92.634643,92.634900,0.000008,-0.000027,2.272727e-08,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5
4,3.045250e+07,40.849506,-0.137049,-1.338467,30452516.0,30452491.0,30452504.5,30452495.9,30452497.0,30452498.7,30452501.0,30452508.0,30452508.0,30452510.0,30452511.1,2.098797e-07,-0.123596,-0.147727,2.145324e+07,1.408433e+04,0.634264,-0.590769,21453518.0,21453059.0,21453204.5,21453104.6,21453133.4,21453151.1,21453172.6,21453260.4,21453292.1,21453344.2,21453423.3,0.000006,-1.528090,0.295455,125.356903,5.005444e-09,0.351398,-0.564235,125.357070,125.356760,125.356895,125.356810,125.356830,125.356860,125.356880,125.356910,125.356930,125.356970,125.357001,5.643819e-07,-2.247191e-06,-2.272727e-07,1.519578e+06,0.925388,-0.035209,-1.130741,1519579.0,1519576.0,1519577.7,1519576.38,1519577.00,1519577.00,1519577.10,1519578.00,1519578.06,1519578.84,1519579.00,6.330514e-07,-0.033708,0.000000,92.631672,3.420509e-07,0.073749,-1.184283,92.632712,92.630705,92.631656,92.630884,92.631071,92.631264,92.631461,92.631855,92.632059,92.632272,92.632490,0.000006,-0.000023,2.840909e-08,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
42832,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.304471e-06,0.000000,0.000000,1.176150e+07,3.142752e+10,0.257888,-1.107254,12095948.0,11481689.0,11752046.5,11534052.4,11588441.0,11634722.1,11686018.2,11799651.2,11865082.2,11937354.0,12027432.8,0.015073,-6901.786517,8.375000,27.106353,7.400559e+00,0.142556,-1.153039,32.138268,22.777638,26.978129,23.501861,24.325450,25.204007,26.056338,27.902453,28.853173,29.868864,30.940622,1.003601e-01,-1.051756e-01,4.001818e-04,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.00,0.00,0.00,0.00,0.00,0.00,0.00,0.00,2.250416e-05,0.000000,0.000000,0.000000,0.000000e+00,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.006601,0.000000,0.000000e+00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2
42833,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.304471e-06,0.000000,0.000000,1.129674e+07,1.035892e+10,0.121973,-1.182532,11473998.0,11132767.0,11289533.0,11156287.0,11196237.6,11224390.6,11265359.0,11315303.8,11362406.9,11407501.0,11449804.9,0.009010,-3834.056180,3.971591,19.622236,2.768549e+00,0.169575,-1.176410,22.715385,16.954149,19.495137,17.443330,17.954055,18.447210,18.903729,20.066074,20.724461,21.345438,21.968241,8.479644e-02,-6.473299e-02,1.420852e-04,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.00,0.00,0.00,0.00,0.00,0.00,0.00,0.00,2.250416e-05,0.000000,0.000000,0.000000,0.000000e+00,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.006601,0.000000,0.000000e+00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2
42834,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.304471e-06,0.000000,0.000000,1.102114e+07,3.618600e+09,0.214290,-1.139532,11129219.0,10922550.0,11016814.0,10945430.4,10968393.0,10971921.9,10995071.0,11034880.0,11053275.0,11087308.8,11106260.4,0.005458,-2322.123596,3.914773,14.832567,1.184232e+00,0.187357,-1.133147,16.894829,13.132257,14.761802,13.431825,13.733859,14.044177,14.409780,15.153347,15.518339,15.938264,16.409789,7.336721e-02,-4.227609e-02,2.785284e-04,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.00,0.00,0.00,0.00,0.00,0.00,0.00,0.00,2.250416e-05,0.000000,0.000000,0.000000,0.000000e+00,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.006601,0.000000,0.000000e+00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2
42835,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,8.304471e-06,0.000000,0.000000,1.084509e+07,1.719589e+09,0.179996,-1.203879,10921942.0,10784457.0,10834982.5,10785565.2,10807678.6,10811796.1,10829088.2,10854119.4,10875945.2,10898318.6,10899558.3,0.003824,-1539.573034,10.511364,11.763843,5.053098e-01,0.192496,-1.086058,13.112607,10.604067,11.704885,10.828476,11.049226,11.271157,11.490971,11.929457,12.195421,12.505503,12.776490,6.042680e-02,-2.818584e-02,3.627273e-05,0.000000e+00,0.000000,0.000000,0.000000,0.0,0.0,0.0,0.00,0.00,0.00,0.00,0.00,0.00,0.00,0.00,2.250416e-05,0.000000,0.000000,0.000000,0.000000e+00,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.000000,0.006601,0.000000,0.000000e+00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2


In [11]:
# Count missing values per column in the imputed frame.
nans = imputed_df.isna().sum()
# Lift the display limits so the printed listing is not truncated, and show
# only the columns that still contain missing values (none are expected).
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
    print(nans.loc[nans.ne(0)])

Series([], dtype: int64)


In [12]:
# Display the (rows, columns) of the imputed frame.
imputed_df.shape

(51764, 108)