In [1]:
# Import data analytics libraries
import numpy as np
import pandas as pd
from pandas_profiling import ProfileReport

# Import data visualization libraries
import matplotlib.pyplot as plt
import plotly.graph_objects as go

# Import machine learning libraries
from sklearn.cluster import KMeans
from sklearn.decomposition import PCA

# Silence warnings for the rest of the session.
# NOTE(review): with no category/module argument this filter ignores *every*
# Python warning (not only IPython's), so warnings emitted by later cells --
# e.g. from pandas or scikit-learn -- will not be shown either. Consider
# narrowing the filter once the specific noisy warnings are known.
import warnings
warnings.filterwarnings('ignore')

In [2]:
# Read the general-population and customer tables from their
# semicolon-separated CSV files.
azdias = pd.read_csv('data/azdias.csv', sep=';')
customers = pd.read_csv('data/customers.csv', sep=';')

# Remove the 'Unnamed: 0' column from both frames
# (presumably a row index saved along with the CSVs -- TODO confirm).
azdias = azdias.drop(columns=['Unnamed: 0'])
customers = customers.drop(columns=['Unnamed: 0'])

# Preprocessing

## Data Overview

In [3]:
# Preview the first five rows of the general-population table
azdias.head(n=5)

Unnamed: 0,LNR,AGER_TYP,AKT_DAT_KL,ALTER_HH,ALTER_KIND1,ALTER_KIND2,ALTER_KIND3,ALTER_KIND4,ALTERSKATEGORIE_FEIN,ANZ_HAUSHALTE_AKTIV,...,VHN,VK_DHT4A,VK_DISTANZ,VK_ZG11,W_KEIT_KIND_HH,WOHNDAUER_2008,WOHNLAGE,ZABEOTYP,ANREDE_KZ,ALTERSKATEGORIE_GROB
0,910215,-1,,,,,,,,,...,,,,,,,,3,1,2
1,910220,-1,9.0,0.0,,,,,21.0,11.0,...,4.0,8.0,11.0,10.0,3.0,9.0,4.0,5,2,1
2,910225,-1,9.0,17.0,,,,,17.0,10.0,...,2.0,9.0,9.0,6.0,3.0,9.0,2.0,5,2,3
3,910226,2,1.0,13.0,,,,,13.0,1.0,...,0.0,7.0,10.0,11.0,,9.0,7.0,3,2,4
4,910241,-1,1.0,20.0,,,,,14.0,3.0,...,2.0,3.0,5.0,4.0,2.0,9.0,3.0,4,1,3


In [4]:
# Preview the first five rows of the customers table
customers.head(n=5)

Unnamed: 0,LNR,AGER_TYP,AKT_DAT_KL,ALTER_HH,ALTER_KIND1,ALTER_KIND2,ALTER_KIND3,ALTER_KIND4,ALTERSKATEGORIE_FEIN,ANZ_HAUSHALTE_AKTIV,...,VK_ZG11,W_KEIT_KIND_HH,WOHNDAUER_2008,WOHNLAGE,ZABEOTYP,PRODUCT_GROUP,CUSTOMER_GROUP,ONLINE_PURCHASE,ANREDE_KZ,ALTERSKATEGORIE_GROB
0,9626,2,1.0,10.0,,,,,10.0,1.0,...,2.0,6.0,9.0,7.0,3,COSMETIC_AND_FOOD,MULTI_BUYER,0,1,4
1,9628,-1,9.0,11.0,,,,,,,...,3.0,0.0,9.0,,3,FOOD,SINGLE_BUYER,0,1,4
2,143872,-1,1.0,6.0,,,,,0.0,1.0,...,11.0,6.0,9.0,2.0,3,COSMETIC_AND_FOOD,MULTI_BUYER,0,2,4
3,143873,1,1.0,8.0,,,,,8.0,0.0,...,2.0,,9.0,7.0,1,COSMETIC,MULTI_BUYER,0,1,4
4,143874,-1,1.0,20.0,,,,,14.0,7.0,...,4.0,2.0,9.0,3.0,1,FOOD,MULTI_BUYER,0,1,3


In [6]:
# Build a profiling report restricted to the first 50 columns of azdias
# (all rows, column positions 0 through 49).
ProfileReport(azdias.iloc[:, 0:50])

0,1
Number of variables,50
Number of observations,891221
Total Missing (%),11.3%
Total size in memory,340.0 MiB
Average record size in memory,400.0 B

0,1
Numeric,45
Categorical,1
Boolean,0
Date,0
Text (Unique),0
Rejected,2
Unsupported,2

0,1
Distinct count,891221
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,637260
Minimum,191653
Maximum,1082873
Zeros (%),0.0%

0,1
Minimum,191653
5-th percentile,236210
Q1,414460
Median,637260
Q3,860070
95-th percentile,1038300
Maximum,1082873
Range,891220
Interquartile range,445610

0,1
Standard deviation,257270
Coef of variation,0.40372
Kurtosis,-1.2
Mean,637260
MAD,222810
Skewness,-1.5519e-18
Sum,567942168123
Variance,66190000000
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
192418,1,0.0%,
611455,1,0.0%,
982154,1,0.0%,
976009,1,0.0%,
978056,1,0.0%,
955527,1,0.0%,
957574,1,0.0%,
951429,1,0.0%,
953476,1,0.0%,
963715,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
191653,1,0.0%,
191654,1,0.0%,
191655,1,0.0%,
191656,1,0.0%,
191657,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1082869,1,0.0%,
1082870,1,0.0%,
1082871,1,0.0%,
1082872,1,0.0%,
1082873,1,0.0%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,-0.35844
Minimum,-1
Maximum,3
Zeros (%),0.9%

0,1
Minimum,-1
5-th percentile,-1
Q1,-1
Median,-1
Q3,-1
95-th percentile,2
Maximum,3
Range,4
Interquartile range,0

0,1
Standard deviation,1.1987
Coef of variation,-3.3443
Kurtosis,0.73949
Mean,-0.35844
MAD,0.97543
Skewness,1.5243
Sum,-319445
Variance,1.4369
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
-1,677503,76.0%,
2,98472,11.0%,
1,79802,9.0%,
3,27104,3.0%,
0,8340,0.9%,

Value,Count,Frequency (%),Unnamed: 3
-1,677503,76.0%,
0,8340,0.9%,
1,79802,9.0%,
2,98472,11.0%,
3,27104,3.0%,

Value,Count,Frequency (%),Unnamed: 3
-1,677503,76.0%,
0,8340,0.9%,
1,79802,9.0%,
2,98472,11.0%,
3,27104,3.0%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),8.2%
Missing (n),73499
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,4.4219
Minimum,1
Maximum,9
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,1
Median,3
Q3,9
95-th percentile,9
Maximum,9
Range,8
Interquartile range,8

0,1
Standard deviation,3.6388
Coef of variation,0.8229
Kurtosis,-1.7654
Mean,4.4219
MAD,3.4643
Skewness,0.28735
Sum,3615900
Variance,13.241
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
1.0,390258,43.8%,
9.0,270663,30.4%,
5.0,29203,3.3%,
6.0,27655,3.1%,
3.0,24880,2.8%,
4.0,21466,2.4%,
7.0,21026,2.4%,
8.0,17485,2.0%,
2.0,15086,1.7%,
(Missing),73499,8.2%,

Value,Count,Frequency (%),Unnamed: 3
1.0,390258,43.8%,
2.0,15086,1.7%,
3.0,24880,2.8%,
4.0,21466,2.4%,
5.0,29203,3.3%,

Value,Count,Frequency (%),Unnamed: 3
5.0,29203,3.3%,
6.0,27655,3.1%,
7.0,21026,2.4%,
8.0,17485,2.0%,
9.0,270663,30.4%,

0,1
Distinct count,23
Unique (%),0.0%
Missing (%),8.2%
Missing (n),73499
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,10.864
Minimum,0
Maximum,21
Zeros (%),26.6%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,13
Q3,17
95-th percentile,21
Maximum,21
Range,21
Interquartile range,17

0,1
Standard deviation,7.6397
Coef of variation,0.7032
Kurtosis,-1.3649
Mean,10.864
MAD,6.7086
Skewness,-0.42586
Sum,8883800
Variance,58.365
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0.0,236768,26.6%,
18.0,60852,6.8%,
17.0,55665,6.2%,
19.0,52890,5.9%,
15.0,51867,5.8%,
16.0,51857,5.8%,
14.0,44275,5.0%,
21.0,41610,4.7%,
20.0,40671,4.6%,
13.0,37612,4.2%,

Value,Count,Frequency (%),Unnamed: 3
0.0,236768,26.6%,
1.0,1,0.0%,
2.0,47,0.0%,
3.0,200,0.0%,
4.0,603,0.1%,

Value,Count,Frequency (%),Unnamed: 3
17.0,55665,6.2%,
18.0,60852,6.8%,
19.0,52890,5.9%,
20.0,40671,4.6%,
21.0,41610,4.7%,

0,1
Distinct count,18
Unique (%),0.0%
Missing (%),90.9%
Missing (n),810163
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,11.745
Minimum,2
Maximum,18
Zeros (%),0.0%

0,1
Minimum,2
5-th percentile,6
Q1,8
Median,12
Q3,15
95-th percentile,18
Maximum,18
Range,16
Interquartile range,7

0,1
Standard deviation,4.0977
Coef of variation,0.34887
Kurtosis,-1.0326
Mean,11.745
MAD,3.534
Skewness,-0.1436
Sum,952060
Variance,16.791
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
18.0,6703,0.8%,
17.0,6394,0.7%,
8.0,6343,0.7%,
7.0,6249,0.7%,
16.0,6124,0.7%,
15.0,6008,0.7%,
14.0,5992,0.7%,
9.0,5846,0.7%,
13.0,5713,0.6%,
10.0,5678,0.6%,

Value,Count,Frequency (%),Unnamed: 3
2.0,403,0.0%,
3.0,1063,0.1%,
4.0,1084,0.1%,
5.0,1501,0.2%,
6.0,4875,0.5%,

Value,Count,Frequency (%),Unnamed: 3
14.0,5992,0.7%,
15.0,6008,0.7%,
16.0,6124,0.7%,
17.0,6394,0.7%,
18.0,6703,0.8%,

0,1
Distinct count,18
Unique (%),0.0%
Missing (%),96.7%
Missing (n),861722
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,13.403
Minimum,2
Maximum,18
Zeros (%),0.0%

0,1
Minimum,2
5-th percentile,8
Q1,11
Median,14
Q3,16
95-th percentile,18
Maximum,18
Range,16
Interquartile range,5

0,1
Standard deviation,3.2433
Coef of variation,0.24199
Kurtosis,-0.60281
Mean,13.403
MAD,2.7173
Skewness,-0.42323
Sum,395360
Variance,10.519
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
18.0,3128,0.4%,
14.0,3111,0.3%,
17.0,3085,0.3%,
15.0,3083,0.3%,
16.0,3010,0.3%,
13.0,2968,0.3%,
12.0,2628,0.3%,
11.0,2450,0.3%,
10.0,1953,0.2%,
9.0,1641,0.2%,

Value,Count,Frequency (%),Unnamed: 3
2.0,4,0.0%,
3.0,15,0.0%,
4.0,67,0.0%,
5.0,154,0.0%,
6.0,396,0.0%,

Value,Count,Frequency (%),Unnamed: 3
14.0,3111,0.3%,
15.0,3083,0.3%,
16.0,3010,0.3%,
17.0,3085,0.3%,
18.0,3128,0.4%,

0,1
Distinct count,16
Unique (%),0.0%
Missing (%),99.3%
Missing (n),885051
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,14.476
Minimum,4
Maximum,18
Zeros (%),0.0%

0,1
Minimum,4
5-th percentile,9
Q1,13
Median,15
Q3,17
95-th percentile,18
Maximum,18
Range,14
Interquartile range,4

0,1
Standard deviation,2.7124
Coef of variation,0.18737
Kurtosis,-0.052381
Mean,14.476
MAD,2.2243
Skewness,-0.67878
Sum,89317
Variance,7.3573
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
18.0,866,0.1%,
15.0,847,0.1%,
16.0,841,0.1%,
17.0,826,0.1%,
14.0,746,0.1%,
13.0,674,0.1%,
12.0,438,0.0%,
11.0,363,0.0%,
10.0,237,0.0%,
9.0,159,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4.0,2,0.0%,
5.0,8,0.0%,
6.0,21,0.0%,
7.0,40,0.0%,
8.0,102,0.0%,

Value,Count,Frequency (%),Unnamed: 3
14.0,746,0.1%,
15.0,847,0.1%,
16.0,841,0.1%,
17.0,826,0.1%,
18.0,866,0.1%,

0,1
Distinct count,13
Unique (%),0.0%
Missing (%),99.9%
Missing (n),890016
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,15.09
Minimum,7
Maximum,18
Zeros (%),0.0%

0,1
Minimum,7
5-th percentile,10
Q1,14
Median,15
Q3,17
95-th percentile,18
Maximum,18
Range,11
Interquartile range,3

0,1
Standard deviation,2.4529
Coef of variation,0.16256
Kurtosis,-0.048645
Mean,15.09
MAD,1.9971
Skewness,-0.77308
Sum,18183
Variance,6.0169
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
17.0,225,0.0%,
18.0,216,0.0%,
15.0,171,0.0%,
16.0,159,0.0%,
14.0,136,0.0%,
13.0,119,0.0%,
12.0,59,0.0%,
11.0,48,0.0%,
10.0,42,0.0%,
9.0,15,0.0%,

Value,Count,Frequency (%),Unnamed: 3
7.0,1,0.0%,
8.0,14,0.0%,
9.0,15,0.0%,
10.0,42,0.0%,
11.0,48,0.0%,

Value,Count,Frequency (%),Unnamed: 3
14.0,136,0.0%,
15.0,171,0.0%,
16.0,159,0.0%,
17.0,225,0.0%,
18.0,216,0.0%,

0,1
Distinct count,27
Unique (%),0.0%
Missing (%),29.5%
Missing (n),262947
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,13.701
Minimum,0
Maximum,25
Zeros (%),4.6%

0,1
Minimum,0
5-th percentile,0
Q1,11
Median,14
Q3,17
95-th percentile,20
Maximum,25
Range,25
Interquartile range,6

0,1
Standard deviation,5.0798
Coef of variation,0.37077
Kurtosis,1.1989
Mean,13.701
MAD,3.8224
Skewness,-1.0472
Sum,8607800
Variance,25.805
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
15.0,63486,7.1%,
14.0,59709,6.7%,
16.0,53384,6.0%,
18.0,51365,5.8%,
17.0,50011,5.6%,
13.0,49556,5.6%,
12.0,42951,4.8%,
19.0,42340,4.8%,
0.0,41188,4.6%,
10.0,34903,3.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,41188,4.6%,
1.0,1,0.0%,
2.0,64,0.0%,
3.0,218,0.0%,
4.0,636,0.1%,

Value,Count,Frequency (%),Unnamed: 3
21.0,13658,1.5%,
22.0,3669,0.4%,
23.0,2838,0.3%,
24.0,2340,0.3%,
25.0,1017,0.1%,

0,1
Distinct count,293
Unique (%),0.0%
Missing (%),10.5%
Missing (n),93148
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,8.2873
Minimum,0
Maximum,595
Zeros (%),0.7%

0,1
Minimum,0
5-th percentile,1
Q1,1
Median,4
Q3,9
95-th percentile,28
Maximum,595
Range,595
Interquartile range,8

0,1
Standard deviation,15.628
Coef of variation,1.8858
Kurtosis,142.62
Mean,8.2873
MAD,7.565
Skewness,8.78
Sum,6613800
Variance,244.24
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
1.0,195957,22.0%,
2.0,120982,13.6%,
3.0,62575,7.0%,
4.0,43213,4.8%,
5.0,37815,4.2%,
6.0,36020,4.0%,
7.0,34526,3.9%,
8.0,32293,3.6%,
9.0,29002,3.3%,
10.0,25428,2.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,6463,0.7%,
1.0,195957,22.0%,
2.0,120982,13.6%,
3.0,62575,7.0%,
4.0,43213,4.8%,

Value,Count,Frequency (%),Unnamed: 3
445.0,7,0.0%,
515.0,4,0.0%,
523.0,4,0.0%,
536.0,1,0.0%,
595.0,8,0.0%,

0,1
Distinct count,22
Unique (%),0.0%
Missing (%),10.9%
Missing (n),97008
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.040647
Minimum,0
Maximum,23
Zeros (%),86.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,23
Range,23
Interquartile range,0

0,1
Standard deviation,0.32403
Coef of variation,7.9719
Kurtosis,894.89
Mean,0.040647
MAD,0.07884
Skewness,22.719
Sum,32282
Variance,0.10499
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0.0,770244,86.4%,
1.0,20157,2.3%,
2.0,2459,0.3%,
3.0,585,0.1%,
4.0,232,0.0%,
5.0,117,0.0%,
6.0,106,0.0%,
8.0,68,0.0%,
7.0,65,0.0%,
9.0,34,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,770244,86.4%,
1.0,20157,2.3%,
2.0,2459,0.3%,
3.0,585,0.1%,
4.0,232,0.0%,

Value,Count,Frequency (%),Unnamed: 3
16.0,3,0.0%,
17.0,13,0.0%,
18.0,6,0.0%,
20.0,9,0.0%,
23.0,3,0.0%,

0,1
Distinct count,12
Unique (%),0.0%
Missing (%),8.2%
Missing (n),73499
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.15402
Minimum,0
Maximum,11
Zeros (%),82.0%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,1
Maximum,11
Range,11
Interquartile range,0

0,1
Standard deviation,0.50239
Coef of variation,3.2619
Kurtosis,18.39
Mean,0.15402
MAD,0.27546
Skewness,3.9226
Sum,125940
Variance,0.25239
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0.0,731242,82.0%,
1.0,55350,6.2%,
2.0,24445,2.7%,
3.0,5376,0.6%,
4.0,1057,0.1%,
5.0,190,0.0%,
6.0,47,0.0%,
7.0,10,0.0%,
9.0,3,0.0%,
11.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,731242,82.0%,
1.0,55350,6.2%,
2.0,24445,2.7%,
3.0,5376,0.6%,
4.0,1057,0.1%,

Value,Count,Frequency (%),Unnamed: 3
6.0,47,0.0%,
7.0,10,0.0%,
8.0,1,0.0%,
9.0,3,0.0%,
11.0,1,0.0%,

0,1
Distinct count,31
Unique (%),0.0%
Missing (%),8.2%
Missing (n),73499
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.7276
Minimum,0
Maximum,45
Zeros (%),3.8%

0,1
Minimum,0
5-th percentile,1
Q1,1
Median,1
Q3,2
95-th percentile,4
Maximum,45
Range,45
Interquartile range,1

0,1
Standard deviation,1.1558
Coef of variation,0.66903
Kurtosis,14.449
Mean,1.7276
MAD,0.89758
Skewness,1.8753
Sum,1412700
Variance,1.336
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
1.0,423383,47.5%,
2.0,195470,21.9%,
3.0,94905,10.6%,
4.0,47126,5.3%,
0.0,34103,3.8%,
5.0,15503,1.7%,
6.0,4842,0.5%,
7.0,1525,0.2%,
8.0,523,0.1%,
9.0,180,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,34103,3.8%,
1.0,423383,47.5%,
2.0,195470,21.9%,
3.0,94905,10.6%,
4.0,47126,5.3%,

Value,Count,Frequency (%),Unnamed: 3
35.0,1,0.0%,
37.0,2,0.0%,
38.0,2,0.0%,
40.0,1,0.0%,
45.0,1,0.0%,

0,1
Correlation,0.9769

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),8.2%
Missing (n),73499
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.0041616
Minimum,0
Maximum,6
Zeros (%),91.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,6
Range,6
Interquartile range,0

0,1
Standard deviation,0.068855
Coef of variation,16.546
Kurtosis,450.27
Mean,0.0041616
MAD,0.0082908
Skewness,18.793
Sum,3403
Variance,0.004741
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0.0,814542,91.4%,
1.0,2970,0.3%,
2.0,202,0.0%,
3.0,5,0.0%,
4.0,2,0.0%,
6.0,1,0.0%,
(Missing),73499,8.2%,

Value,Count,Frequency (%),Unnamed: 3
0.0,814542,91.4%,
1.0,2970,0.3%,
2.0,202,0.0%,
3.0,5,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,2970,0.3%,
2.0,202,0.0%,
3.0,5,0.0%,
4.0,2,0.0%,
6.0,1,0.0%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),10.9%
Missing (n),97216
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.1679
Minimum,1
Maximum,9
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,3
Median,3
Q3,4
95-th percentile,4
Maximum,9
Range,8
Interquartile range,1

0,1
Standard deviation,1.0024
Coef of variation,0.31642
Kurtosis,-0.21179
Mean,3.1679
MAD,0.81686
Skewness,-0.46129
Sum,2515300
Variance,1.0048
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
4.0,311339,34.9%,
3.0,254988,28.6%,
2.0,135662,15.2%,
1.0,56767,6.4%,
5.0,35090,3.9%,
9.0,159,0.0%,
(Missing),97216,10.9%,

Value,Count,Frequency (%),Unnamed: 3
1.0,56767,6.4%,
2.0,135662,15.2%,
3.0,254988,28.6%,
4.0,311339,34.9%,
5.0,35090,3.9%,

Value,Count,Frequency (%),Unnamed: 3
2.0,135662,15.2%,
3.0,254988,28.6%,
4.0,311339,34.9%,
5.0,35090,3.9%,
9.0,159,0.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),10.5%
Missing (n),93740
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,4.153
Minimum,1
Maximum,7
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,5
Q3,6
95-th percentile,7
Maximum,7
Range,6
Interquartile range,4

0,1
Standard deviation,2.1837
Coef of variation,0.52581
Kurtosis,-1.5178
Mean,4.153
MAD,2
Skewness,-0.23954
Sum,3312000
Variance,4.7686
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
6.0,255093,28.6%,
1.0,151782,17.0%,
2.0,104521,11.7%,
7.0,99039,11.1%,
3.0,73277,8.2%,
4.0,61358,6.9%,
5.0,52411,5.9%,
(Missing),93740,10.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,151782,17.0%,
2.0,104521,11.7%,
3.0,73277,8.2%,
4.0,61358,6.9%,
5.0,52411,5.9%,

Value,Count,Frequency (%),Unnamed: 3
3.0,73277,8.2%,
4.0,61358,6.9%,
5.0,52411,5.9%,
6.0,255093,28.6%,
7.0,99039,11.1%,

0,1
Distinct count,46
Unique (%),0.0%
Missing (%),11.1%
Missing (n),98979

0,1
6B,56672
8A,52438
4C,47819
Other values (42),635313
(Missing),98979

Value,Count,Frequency (%),Unnamed: 3
6B,56672,6.4%,
8A,52438,5.9%,
4C,47819,5.4%,
2D,35074,3.9%,
3C,34769,3.9%,
7A,34399,3.9%,
3D,34307,3.8%,
8B,33434,3.8%,
4A,33155,3.7%,
8C,30993,3.5%,

Unsupported value

Unsupported value

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.6328
Minimum,1
Maximum,6
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,4
Q3,5
95-th percentile,6
Maximum,6
Range,5
Interquartile range,3

0,1
Standard deviation,1.595
Coef of variation,0.43906
Kurtosis,-1.0686
Mean,3.6328
MAD,1.359
Skewness,-0.038885
Sum,3220000
Variance,2.5441
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
4.0,210963,23.7%,
3.0,156449,17.6%,
6.0,153915,17.3%,
2.0,148795,16.7%,
5.0,117376,13.2%,
1.0,98869,11.1%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,98869,11.1%,
2.0,148795,16.7%,
3.0,156449,17.6%,
4.0,210963,23.7%,
5.0,117376,13.2%,

Value,Count,Frequency (%),Unnamed: 3
2.0,148795,16.7%,
3.0,156449,17.6%,
4.0,210963,23.7%,
5.0,117376,13.2%,
6.0,153915,17.3%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.3353
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,4
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.4936
Coef of variation,0.44783
Kurtosis,-1.2962
Mean,3.3353
MAD,1.3199
Skewness,-0.35173
Sum,2956300
Variance,2.2309
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,281804,31.6%,
4.0,174275,19.6%,
1.0,167426,18.8%,
3.0,156998,17.6%,
2.0,105864,11.9%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,167426,18.8%,
2.0,105864,11.9%,
3.0,156998,17.6%,
4.0,174275,19.6%,
5.0,281804,31.6%,

Value,Count,Frequency (%),Unnamed: 3
1.0,167426,18.8%,
2.0,105864,11.9%,
3.0,156998,17.6%,
4.0,174275,19.6%,
5.0,281804,31.6%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.3681
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,3
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.3683
Coef of variation,0.40626
Kurtosis,-1.2724
Mean,3.3681
MAD,1.2173
Skewness,-0.20739
Sum,2985400
Variance,1.8723
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,267488,30.0%,
2.0,196545,22.1%,
3.0,171838,19.3%,
4.0,162940,18.3%,
1.0,87556,9.8%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,87556,9.8%,
2.0,196545,22.1%,
3.0,171838,19.3%,
4.0,162940,18.3%,
5.0,267488,30.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,87556,9.8%,
2.0,196545,22.1%,
3.0,171838,19.3%,
4.0,162940,18.3%,
5.0,267488,30.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.195
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,3
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.4014
Coef of variation,0.43862
Kurtosis,-1.3147
Mean,3.195
MAD,1.2282
Skewness,-0.072315
Sum,2832000
Variance,1.9639
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,233302,26.2%,
2.0,205425,23.0%,
3.0,173910,19.5%,
4.0,153045,17.2%,
1.0,120685,13.5%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,120685,13.5%,
2.0,205425,23.0%,
3.0,173910,19.5%,
4.0,153045,17.2%,
5.0,233302,26.2%,

Value,Count,Frequency (%),Unnamed: 3
1.0,120685,13.5%,
2.0,205425,23.0%,
3.0,173910,19.5%,
4.0,153045,17.2%,
5.0,233302,26.2%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.3513
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,3
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.3965
Coef of variation,0.41671
Kurtosis,-1.2779
Mean,3.3513
MAD,1.2399
Skewness,-0.22812
Sum,2970500
Variance,1.9502
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,270143,30.3%,
2.0,181803,20.4%,
3.0,170162,19.1%,
4.0,160469,18.0%,
1.0,103790,11.6%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,103790,11.6%,
2.0,181803,20.4%,
3.0,170162,19.1%,
4.0,160469,18.0%,
5.0,270143,30.3%,

Value,Count,Frequency (%),Unnamed: 3
1.0,103790,11.6%,
2.0,181803,20.4%,
3.0,170162,19.1%,
4.0,160469,18.0%,
5.0,270143,30.3%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.3362
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,3
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.3731
Coef of variation,0.41158
Kurtosis,-1.2363
Mean,3.3362
MAD,1.2108
Skewness,-0.21596
Sum,2957100
Variance,1.8853
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,254763,28.6%,
3.0,180975,20.3%,
2.0,180312,20.2%,
4.0,169791,19.1%,
1.0,100526,11.3%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,100526,11.3%,
2.0,180312,20.2%,
3.0,180975,20.3%,
4.0,169791,19.1%,
5.0,254763,28.6%,

Value,Count,Frequency (%),Unnamed: 3
1.0,100526,11.3%,
2.0,180312,20.2%,
3.0,180975,20.3%,
4.0,169791,19.1%,
5.0,254763,28.6%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.3607
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,3
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.379
Coef of variation,0.41033
Kurtosis,-1.2424
Mean,3.3607
MAD,1.2173
Skewness,-0.21678
Sum,2978800
Variance,1.9016
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,271673,30.5%,
3.0,194636,21.8%,
2.0,174808,19.6%,
4.0,147220,16.5%,
1.0,98030,11.0%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,98030,11.0%,
2.0,174808,19.6%,
3.0,194636,21.8%,
4.0,147220,16.5%,
5.0,271673,30.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,98030,11.0%,
2.0,174808,19.6%,
3.0,194636,21.8%,
4.0,147220,16.5%,
5.0,271673,30.5%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.5%
Missing (n),4854
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.466
Minimum,1
Maximum,5
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,1
Q1,2
Median,4
Q3,5
95-th percentile,5
Maximum,5
Range,4
Interquartile range,3

0,1
Standard deviation,1.3285
Coef of variation,0.38328
Kurtosis,-1.15
Mean,3.466
MAD,1.1753
Skewness,-0.32678
Sum,3072100
Variance,1.7648
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
5.0,272208,30.5%,
4.0,193430,21.7%,
2.0,175179,19.7%,
3.0,170731,19.2%,
1.0,74819,8.4%,
(Missing),4854,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,74819,8.4%,
2.0,175179,19.7%,
3.0,170731,19.2%,
4.0,193430,21.7%,
5.0,272208,30.5%,

Value,Count,Frequency (%),Unnamed: 3
1.0,74819,8.4%,
2.0,175179,19.7%,
3.0,170731,19.2%,
4.0,193430,21.7%,
5.0,272208,30.5%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.12234
Minimum,0
Maximum,6
Zeros (%),93.3%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,1
Maximum,6
Range,6
Interquartile range,0

0,1
Standard deviation,0.53595
Coef of variation,4.381
Kurtosis,35.69
Mean,0.12234
MAD,0.22834
Skewness,5.5443
Sum,109028
Variance,0.28724
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,831734,93.3%,
1,29771,3.3%,
2,18067,2.0%,
3,5708,0.6%,
4,4082,0.5%,
5,1483,0.2%,
6,376,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,831734,93.3%,
1,29771,3.3%,
2,18067,2.0%,
3,5708,0.6%,
4,4082,0.5%,

Value,Count,Frequency (%),Unnamed: 3
2,18067,2.0%,
3,5708,0.6%,
4,4082,0.5%,
5,1483,0.2%,
6,376,0.0%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.21991
Minimum,0
Maximum,6
Zeros (%),89.1%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,2
Maximum,6
Range,6
Interquartile range,0

0,1
Standard deviation,0.7479
Coef of variation,3.401
Kurtosis,19.494
Mean,0.21991
MAD,0.39189
Skewness,4.1974
Sum,195986
Variance,0.55936
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,794100,89.1%,
1,43554,4.9%,
2,29079,3.3%,
3,10214,1.1%,
4,9041,1.0%,
5,3930,0.4%,
6,1303,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,794100,89.1%,
1,43554,4.9%,
2,29079,3.3%,
3,10214,1.1%,
4,9041,1.0%,

Value,Count,Frequency (%),Unnamed: 3
2,29079,3.3%,
3,10214,1.1%,
4,9041,1.0%,
5,3930,0.4%,
6,1303,0.1%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,9.2674
Minimum,1
Maximum,10
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,5
Q1,10
Median,10
Q3,10
95-th percentile,10
Maximum,10
Range,9
Interquartile range,0

0,1
Standard deviation,1.7357
Coef of variation,0.18729
Kurtosis,7.9887
Mean,9.2674
MAD,1.1152
Skewness,-2.8505
Sum,8259319
Variance,3.0127
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
10,678331,76.1%,
9,82707,9.3%,
8,33062,3.7%,
5,29494,3.3%,
7,20482,2.3%,
6,17152,1.9%,
1,8495,1.0%,
4,8406,0.9%,
2,8001,0.9%,
3,5091,0.6%,

Value,Count,Frequency (%),Unnamed: 3
1,8495,1.0%,
2,8001,0.9%,
3,5091,0.6%,
4,8406,0.9%,
5,29494,3.3%,

Value,Count,Frequency (%),Unnamed: 3
6,17152,1.9%,
7,20482,2.3%,
8,33062,3.7%,
9,82707,9.3%,
10,678331,76.1%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.89273
Minimum,0
Maximum,7
Zeros (%),81.8%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,2.0118
Coef of variation,2.2536
Kurtosis,2.1681
Mean,0.89273
MAD,1.4601
Skewness,1.9755
Sum,795624
Variance,4.0475
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,728811,81.8%,
6,84798,9.5%,
3,27350,3.1%,
5,18539,2.1%,
4,8771,1.0%,
2,8119,0.9%,
7,7656,0.9%,
1,7177,0.8%,

Value,Count,Frequency (%),Unnamed: 3
0,728811,81.8%,
1,7177,0.8%,
2,8119,0.9%,
3,27350,3.1%,
4,8771,1.0%,

Value,Count,Frequency (%),Unnamed: 3
3,27350,3.1%,
4,8771,1.0%,
5,18539,2.1%,
6,84798,9.5%,
7,7656,0.9%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.56858
Minimum,0
Maximum,6
Zeros (%),88.1%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,6
Range,6
Interquartile range,0

0,1
Standard deviation,1.6438
Coef of variation,2.891
Kurtosis,5.7324
Mean,0.56858
MAD,1.0021
Skewness,2.7224
Sum,506730
Variance,2.702
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,785351,88.1%,
6,57103,6.4%,
3,14862,1.7%,
5,13911,1.6%,
4,8165,0.9%,
1,6347,0.7%,
2,5482,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,785351,88.1%,
1,6347,0.7%,
2,5482,0.6%,
3,14862,1.7%,
4,8165,0.9%,

Value,Count,Frequency (%),Unnamed: 3
2,5482,0.6%,
3,14862,1.7%,
4,8165,0.9%,
5,13911,1.6%,
6,57103,6.4%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.10677
Minimum,0
Maximum,7
Zeros (%),98.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,0.80818
Coef of variation,7.5694
Kurtosis,60.045
Mean,0.10677
MAD,0.20959
Skewness,7.777
Sum,95155
Variance,0.65315
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,874745,98.2%,
7,8522,1.0%,
3,3500,0.4%,
6,3202,0.4%,
5,1053,0.1%,
2,118,0.0%,
4,69,0.0%,
1,12,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,874745,98.2%,
1,12,0.0%,
2,118,0.0%,
3,3500,0.4%,
4,69,0.0%,

Value,Count,Frequency (%),Unnamed: 3
3,3500,0.4%,
4,69,0.0%,
5,1053,0.1%,
6,3202,0.4%,
7,8522,1.0%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,9.9268
Minimum,1
Maximum,10
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,10
Q1,10
Median,10
Q3,10
95-th percentile,10
Maximum,10
Range,9
Interquartile range,0

0,1
Standard deviation,0.60564
Coef of variation,0.061011
Kurtosis,117.07
Mean,9.9268
MAD,0.14318
Skewness,-10.309
Sum,8846967
Variance,0.3668
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
10,871535,97.8%,
8,6451,0.7%,
9,5297,0.6%,
5,4177,0.5%,
2,2058,0.2%,
6,509,0.1%,
1,476,0.1%,
7,335,0.0%,
4,311,0.0%,
3,72,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,476,0.1%,
2,2058,0.2%,
3,72,0.0%,
4,311,0.0%,
5,4177,0.5%,

Value,Count,Frequency (%),Unnamed: 3
6,509,0.1%,
7,335,0.0%,
8,6451,0.7%,
9,5297,0.6%,
10,871535,97.8%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,9.4391
Minimum,1
Maximum,10
Zeros (%),0.0%

0,1
Minimum,1
5-th percentile,5
Q1,10
Median,10
Q3,10
95-th percentile,10
Maximum,10
Range,9
Interquartile range,0

0,1
Standard deviation,1.5478
Coef of variation,0.16398
Kurtosis,11.673
Mean,9.4391
MAD,0.91511
Skewness,-3.3723
Sum,8412300
Variance,2.3956
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
10,726982,81.6%,
9,66077,7.4%,
8,22939,2.6%,
5,22124,2.5%,
7,16321,1.8%,
6,13668,1.5%,
1,6917,0.8%,
4,6869,0.8%,
2,4965,0.6%,
3,4359,0.5%,

Value,Count,Frequency (%),Unnamed: 3
1,6917,0.8%,
2,4965,0.6%,
3,4359,0.5%,
4,6869,0.8%,
5,22124,2.5%,

Value,Count,Frequency (%),Unnamed: 3
6,13668,1.5%,
7,16321,1.8%,
8,22939,2.6%,
9,66077,7.4%,
10,726982,81.6%,

0,1
Distinct count,12
Unique (%),0.0%
Missing (%),28.8%
Missing (n),257113
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.70522
Minimum,0
Maximum,10
Zeros (%),66.1%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,10
Maximum,10
Range,10
Interquartile range,0

0,1
Standard deviation,2.5527
Coef of variation,3.6197
Kurtosis,9.2693
Mean,0.70522
MAD,1.3098
Skewness,3.354
Sum,447190
Variance,6.5163
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0.0,588874,66.1%,
10.0,44065,4.9%,
5.0,391,0.0%,
3.0,220,0.0%,
7.0,214,0.0%,
8.0,172,0.0%,
9.0,67,0.0%,
6.0,50,0.0%,
2.0,35,0.0%,
4.0,18,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,588874,66.1%,
1.0,2,0.0%,
2.0,35,0.0%,
3.0,220,0.0%,
4.0,18,0.0%,

Value,Count,Frequency (%),Unnamed: 3
6.0,50,0.0%,
7.0,214,0.0%,
8.0,172,0.0%,
9.0,67,0.0%,
10.0,44065,4.9%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.42565
Minimum,0
Maximum,7
Zeros (%),92.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.5108
Coef of variation,3.5494
Kurtosis,9.7723
Mean,0.42565
MAD,0.78494
Skewness,3.3891
Sum,379344
Variance,2.2825
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,821760,92.2%,
6,43143,4.8%,
5,7744,0.9%,
7,7339,0.8%,
3,5943,0.7%,
2,2928,0.3%,
4,1448,0.2%,
1,916,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,821760,92.2%,
1,916,0.1%,
2,2928,0.3%,
3,5943,0.7%,
4,1448,0.2%,

Value,Count,Frequency (%),Unnamed: 3
3,5943,0.7%,
4,1448,0.2%,
5,7744,0.9%,
6,43143,4.8%,
7,7339,0.8%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.46787
Minimum,0
Maximum,7
Zeros (%),90.8%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.5422
Coef of variation,3.2961
Kurtosis,8.5752
Mean,0.46787
MAD,0.84973
Skewness,3.1832
Sum,416975
Variance,2.3782
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,809304,90.8%,
6,39392,4.4%,
3,15239,1.7%,
5,11899,1.3%,
7,8478,1.0%,
2,3117,0.3%,
4,2013,0.2%,
1,1779,0.2%,

Value,Count,Frequency (%),Unnamed: 3
0,809304,90.8%,
1,1779,0.2%,
2,3117,0.3%,
3,15239,1.7%,
4,2013,0.2%,

Value,Count,Frequency (%),Unnamed: 3
3,15239,1.7%,
4,2013,0.2%,
5,11899,1.3%,
6,39392,4.4%,
7,8478,1.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.1455
Minimum,0
Maximum,7
Zeros (%),77.7%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,2.267
Coef of variation,1.979
Kurtosis,0.80721
Mean,1.1455
MAD,1.7826
Skewness,1.6137
Sum,1020908
Variance,5.1393
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,692502,77.7%,
6,109025,12.2%,
3,30201,3.4%,
7,19637,2.2%,
5,18554,2.1%,
2,8748,1.0%,
1,7262,0.8%,
4,5292,0.6%,

Value,Count,Frequency (%),Unnamed: 3
0,692502,77.7%,
1,7262,0.8%,
2,8748,1.0%,
3,30201,3.4%,
4,5292,0.6%,

Value,Count,Frequency (%),Unnamed: 3
3,30201,3.4%,
4,5292,0.6%,
5,18554,2.1%,
6,109025,12.2%,
7,19637,2.2%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.48551
Minimum,0
Maximum,7
Zeros (%),91.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.6393
Coef of variation,3.3765
Kurtosis,8.789
Mean,0.48551
MAD,0.88596
Skewness,3.2364
Sum,432695
Variance,2.6874
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,813156,91.2%,
6,37502,4.2%,
7,21828,2.4%,
2,8582,1.0%,
3,5127,0.6%,
5,3363,0.4%,
4,1288,0.1%,
1,375,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,813156,91.2%,
1,375,0.0%,
2,8582,1.0%,
3,5127,0.6%,
4,1288,0.1%,

Value,Count,Frequency (%),Unnamed: 3
3,5127,0.6%,
4,1288,0.1%,
5,3363,0.4%,
6,37502,4.2%,
7,21828,2.4%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.25794
Minimum,0
Maximum,7
Zeros (%),95.8%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.2523
Coef of variation,4.8551
Kurtosis,20.708
Mean,0.25794
MAD,0.49437
Skewness,4.7324
Sum,229880
Variance,1.5683
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,854074,95.8%,
6,17732,2.0%,
7,15241,1.7%,
5,2121,0.2%,
3,1926,0.2%,
4,83,0.0%,
2,42,0.0%,
1,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,854074,95.8%,
1,2,0.0%,
2,42,0.0%,
3,1926,0.2%,
4,83,0.0%,

Value,Count,Frequency (%),Unnamed: 3
3,1926,0.2%,
4,83,0.0%,
5,2121,0.2%,
6,17732,2.0%,
7,15241,1.7%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.5854
Minimum,0
Maximum,7
Zeros (%),69.9%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,3
95-th percentile,6
Maximum,7
Range,7
Interquartile range,3

0,1
Standard deviation,2.5479
Coef of variation,1.6071
Kurtosis,-0.72106
Mean,1.5854
MAD,2.2312
Skewness,1.0815
Sum,1412946
Variance,6.4919
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,622788,69.9%,
6,188263,21.1%,
3,26192,2.9%,
5,15900,1.8%,
1,11735,1.3%,
2,9187,1.0%,
7,8853,1.0%,
4,8303,0.9%,

Value,Count,Frequency (%),Unnamed: 3
0,622788,69.9%,
1,11735,1.3%,
2,9187,1.0%,
3,26192,2.9%,
4,8303,0.9%,

Value,Count,Frequency (%),Unnamed: 3
3,26192,2.9%,
4,8303,0.9%,
5,15900,1.8%,
6,188263,21.1%,
7,8853,1.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.19675
Minimum,0
Maximum,7
Zeros (%),96.2%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.0368
Coef of variation,5.2695
Kurtosis,27.293
Mean,0.19675
MAD,0.37867
Skewness,5.3318
Sum,175344
Variance,1.0749
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,857661,96.2%,
6,17942,2.0%,
3,6153,0.7%,
7,4030,0.5%,
5,3225,0.4%,
2,1293,0.1%,
4,465,0.1%,
1,452,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,857661,96.2%,
1,452,0.1%,
2,1293,0.1%,
3,6153,0.7%,
4,465,0.1%,

Value,Count,Frequency (%),Unnamed: 3
3,6153,0.7%,
4,465,0.1%,
5,3225,0.4%,
6,17942,2.0%,
7,4030,0.5%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.67329
Minimum,0
Maximum,7
Zeros (%),85.4%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.7528
Coef of variation,2.6033
Kurtosis,4.4754
Mean,0.67329
MAD,1.1498
Skewness,2.455
Sum,600052
Variance,3.0722
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,761014,85.4%,
6,52060,5.8%,
3,24763,2.8%,
5,17548,2.0%,
4,10951,1.2%,
2,9928,1.1%,
7,7841,0.9%,
1,7116,0.8%,

Value,Count,Frequency (%),Unnamed: 3
0,761014,85.4%,
1,7116,0.8%,
2,9928,1.1%,
3,24763,2.8%,
4,10951,1.2%,

Value,Count,Frequency (%),Unnamed: 3
3,24763,2.8%,
4,10951,1.2%,
5,17548,2.0%,
6,52060,5.8%,
7,7841,0.9%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.34685
Minimum,0
Maximum,7
Zeros (%),93.1%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,3
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.3373
Coef of variation,3.8554
Kurtosis,13.412
Mean,0.34685
MAD,0.64594
Skewness,3.8383
Sum,309124
Variance,1.7883
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,829857,93.1%,
6,25788,2.9%,
3,14572,1.6%,
5,9556,1.1%,
7,7655,0.9%,
2,1967,0.2%,
4,1185,0.1%,
1,641,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0,829857,93.1%,
1,641,0.1%,
2,1967,0.2%,
3,14572,1.6%,
4,1185,0.1%,

Value,Count,Frequency (%),Unnamed: 3
3,14572,1.6%,
4,1185,0.1%,
5,9556,1.1%,
6,25788,2.9%,
7,7655,0.9%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.59068
Minimum,0
Maximum,7
Zeros (%),88.7%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,6
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.7216
Coef of variation,2.9146
Kurtosis,5.6604
Mean,0.59068
MAD,1.0482
Skewness,2.713
Sum,526425
Variance,2.9639
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,790748,88.7%,
6,55056,6.2%,
3,15297,1.7%,
5,13587,1.5%,
7,8514,1.0%,
4,3990,0.4%,
2,2676,0.3%,
1,1353,0.2%,

Value,Count,Frequency (%),Unnamed: 3
0,790748,88.7%,
1,1353,0.2%,
2,2676,0.3%,
3,15297,1.7%,
4,3990,0.4%,

Value,Count,Frequency (%),Unnamed: 3
3,15297,1.7%,
4,3990,0.4%,
5,13587,1.5%,
6,55056,6.2%,
7,8514,1.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.25599
Minimum,0
Maximum,7
Zeros (%),95.6%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,0
95-th percentile,0
Maximum,7
Range,7
Interquartile range,0

0,1
Standard deviation,1.213
Coef of variation,4.7386
Kurtosis,20.217
Mean,0.25599
MAD,0.48924
Skewness,4.6627
Sum,228146
Variance,1.4715
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,851626,95.6%,
6,20410,2.3%,
7,9555,1.1%,
5,4979,0.6%,
3,4003,0.4%,
4,328,0.0%,
2,265,0.0%,
1,55,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0,851626,95.6%,
1,55,0.0%,
2,265,0.0%,
3,4003,0.4%,
4,328,0.0%,

Value,Count,Frequency (%),Unnamed: 3
3,4003,0.4%,
4,328,0.0%,
5,4979,0.6%,
6,20410,2.3%,
7,9555,1.1%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.79768
Minimum,0
Maximum,6
Zeros (%),65.6%

0,1
Minimum,0
5-th percentile,0
Q1,0
Median,0
Q3,1
95-th percentile,4
Maximum,6
Range,6
Interquartile range,1

0,1
Standard deviation,1.3307
Coef of variation,1.6682
Kurtosis,1.9786
Mean,0.79768
MAD,1.0468
Skewness,1.684
Sum,710912
Variance,1.7708
Memory size,6.8 MiB

Value,Count,Frequency (%),Unnamed: 3
0,584797,65.6%,
1,99465,11.2%,
2,97282,10.9%,
3,45685,5.1%,
4,43579,4.9%,
5,16966,1.9%,
6,3447,0.4%,

Value,Count,Frequency (%),Unnamed: 3
0,584797,65.6%,
1,99465,11.2%,
2,97282,10.9%,
3,45685,5.1%,
4,43579,4.9%,

Value,Count,Frequency (%),Unnamed: 3
2,97282,10.9%,
3,45685,5.1%,
4,43579,4.9%,
5,16966,1.9%,
6,3447,0.4%,

0,1
Correlation,0.90686

Unnamed: 0,LNR,AGER_TYP,AKT_DAT_KL,ALTER_HH,ALTER_KIND1,ALTER_KIND2,ALTER_KIND3,ALTER_KIND4,ALTERSKATEGORIE_FEIN,ANZ_HAUSHALTE_AKTIV,ANZ_HH_TITEL,ANZ_KINDER,ANZ_PERSONEN,ANZ_STATISTISCHE_HAUSHALTE,ANZ_TITEL,ARBEIT,BALLRAUM,CAMEO_DEU_2015,CAMEO_DEUG_2015,CAMEO_INTL_2015,CJT_GESAMTTYP,CJT_KATALOGNUTZER,CJT_TYP_1,CJT_TYP_2,CJT_TYP_3,CJT_TYP_4,CJT_TYP_5,CJT_TYP_6,D19_BANKEN_ANZ_12,D19_BANKEN_ANZ_24,D19_BANKEN_DATUM,D19_BANKEN_DIREKT,D19_BANKEN_GROSS,D19_BANKEN_LOKAL,D19_BANKEN_OFFLINE_DATUM,D19_BANKEN_ONLINE_DATUM,D19_BANKEN_ONLINE_QUOTE_12,D19_BANKEN_REST,D19_BEKLEIDUNG_GEH,D19_BEKLEIDUNG_REST,D19_BILDUNG,D19_BIO_OEKO,D19_BUCH_CD,D19_DIGIT_SERV,D19_DROGERIEARTIKEL,D19_ENERGIE,D19_FREIZEIT,D19_GARTEN,D19_GESAMT_ANZ_12,D19_GESAMT_ANZ_24
0,910215,-1,,,,,,,,,,,,,,,,,,,2.0,5.0,1.0,1.0,5.0,5.0,5.0,5.0,0,0,10,0,0,0,10,10,,0,0,0,0,0,0,0,0,0,0,0,0,0
1,910220,-1,9.0,0.0,,,,,21.0,11.0,0.0,0.0,2.0,12.0,0.0,3.0,6.0,8A,8.0,51.0,5.0,1.0,5.0,5.0,2.0,3.0,1.0,1.0,0,0,10,0,0,0,10,10,,0,0,0,0,0,0,0,0,0,0,0,0,0
2,910225,-1,9.0,17.0,,,,,17.0,10.0,0.0,0.0,1.0,7.0,0.0,3.0,2.0,4C,4.0,24.0,3.0,2.0,4.0,4.0,1.0,3.0,2.0,2.0,0,0,10,0,0,0,10,10,0.0,0,0,0,6,0,0,0,0,0,0,0,0,0
3,910226,2,1.0,13.0,,,,,13.0,1.0,0.0,0.0,0.0,2.0,0.0,2.0,4.0,2A,2.0,12.0,2.0,3.0,2.0,2.0,4.0,4.0,5.0,3.0,0,0,10,0,0,0,10,10,0.0,0,0,0,0,0,6,0,0,0,0,0,0,0
4,910241,-1,1.0,20.0,,,,,14.0,3.0,0.0,0.0,4.0,3.0,0.0,4.0,2.0,6B,6.0,43.0,5.0,3.0,3.0,3.0,3.0,4.0,3.0,3.0,3,5,5,1,2,0,10,5,10.0,6,6,1,6,0,6,0,1,5,0,0,6,6
