# Mortalidade Infantil: Extração de Conhecimento - Etapa de Seleção

## Tabela de Conteúdo

- [Profiling](#Profiling)
  - [SIM: DOES2012](#SIM:-DOES2012)
  - [SIM: DOES2013](#SIM:-DOES2013)
  - [SIM: DOES2014](#SIM:-DOES2014)
  - [SIM: DOES2015](#SIM:-DOES2015)
  - [SIM: DOES2016](#SIM:-DOES2016)

## Dependências e Inicialização

In [19]:
%matplotlib inline
import pandas as pd
import pandas_profiling
import matplotlib.pyplot as plt
from pandas.plotting import register_matplotlib_converters
from IPython.display import display, display_png

# Register pandas' datetime converters with matplotlib.
register_matplotlib_converters()


# Flat sequence of pandas display option names and values; None is the value
# given for both 'display.max_rows' and 'display.max_columns'.
# NOTE(review): presumably meant to be unpacked into
# pd.option_context(*CONTEXT_MAX_ROWS_COLS); it is not used in the visible
# cells -- confirm before relying on it.
CONTEXT_MAX_ROWS_COLS = ('display.max_rows', None, 'display.max_columns', None)

## Recursos

In [2]:
# Logical resource name -> relative path of the raw SIM "DOES<year>" CSV
# extract, one entry per year from 2012 through 2016 (in that order).
resources = {
    'sim-does{0}-raw-csv'.format(year):
        '../../../datasets/datasus/raw-csv/DOES{0}.csv'.format(year)
    for year in range(2012, 2017)
}

# Expose the resource map under a dataset-specific name and persist it with
# IPython's %store so it can be restored with `%store -r` in another kernel.
datasus_sim_resources = resources
%store datasus_sim_resources

Stored 'datasus_sim_resources' (dict)


## Funções

In [3]:
def date_parser_dmy(x):
    """Parse ``ddmmYYYY`` date strings (e.g. ``'08032012'``) into datetimes.

    Parsing is strict: a value that does not match the format raises instead
    of being coerced, so malformed dates surface at load time.
    """
    return pd.to_datetime(x, format='%d%m%Y', errors='raise', cache=True)


def load_resource_df_pf(resource, dtype, parse_dates,
                        date_parser=date_parser_dmy, format='csv'):
    """Load a registered resource and build its pandas-profiling report.

    Parameters
    ----------
    resource : str
        Key into the module-level ``resources`` mapping; the mapped value is
        the path handed to ``pd.read_csv``.
    dtype : dict
        Column dtypes, forwarded to ``pd.read_csv``.
    parse_dates : list
        Columns to parse as dates, forwarded to ``pd.read_csv``.
    date_parser : callable, optional
        Date parser forwarded to ``pd.read_csv``; defaults to
        ``date_parser_dmy``.
    format : str, optional
        Storage format of the resource. Only ``'csv'`` is implemented.
        (The name shadows the ``format`` builtin inside this function; it is
        kept because it is part of the call signature.)

    Returns
    -------
    tuple
        ``(df, pf)``: the DataFrame with its columns reordered alphabetically,
        and the ``pandas_profiling.ProfileReport`` computed from it.

    Raises
    ------
    NotImplementedError
        If ``format`` is anything other than ``'csv'``.
    """
    # Reject unsupported formats before touching the resource map or disk.
    if format != 'csv':
        raise NotImplementedError

    frame = pd.read_csv(
        resources[resource],
        dtype=dtype,
        parse_dates=parse_dates,
        date_parser=date_parser,
    )

    # Alphabetical column order keeps the yearly extracts visually aligned.
    ordered_columns = sorted(frame.columns)
    frame = frame.reindex(ordered_columns, axis=1)

    report = pandas_profiling.ProfileReport(frame)
    return frame, report

# Conjuntos de Dados

## Sistema de Informações de Mortalidade (SIM), Declarações de Óbitos (DO), Espírito Santo (ES)

### Dicionário de Dados

In [4]:
# Date columns shared by all three layouts below.
_simdo_raw_date_cols_common = [
    'DTATESTADO',
    'DTCADASTRO',
    'DTCADINF',
    'DTCADINV',
    'DTCONCASO',
    'DTINVESTIG',
    'DTNASC',
    'DTOBITO',
    'DTRECEBIM',
]

# Each layout is the shared base plus its own extras, kept in alphabetical
# order. v2 differs from v1/v3 by using 'DTRECORIG' (no trailing 'A') and by
# adding 'DTREGCART'; v3 is v1 plus 'DTCONINV'.
resources_simdo_raw_date_cols_v1 = sorted(
    _simdo_raw_date_cols_common + ['DTRECORIGA'])
resources_simdo_raw_date_cols_v2 = sorted(
    _simdo_raw_date_cols_common + ['DTCONINV', 'DTRECORIG', 'DTREGCART'])
resources_simdo_raw_date_cols_v3 = sorted(
    _simdo_raw_date_cols_common + ['DTCONINV', 'DTRECORIGA'])

# Column name -> dtype for reading the raw SIM CSV extracts.
# Three dtypes are used: 'category', 'float32' and 'str'.
# NOTE(review): numeric fields are presumably float32 rather than an integer
# type so that missing values can be represented as NaN -- confirm.
resources_simdo_raw_dtypes = {
    'ACIDTRAB': 'category',
    'ALTCAUSA': 'category',
    'ASSISTMED': 'category',
    'ATESTADO': 'category',
    'ATESTANTE': 'category',
    'CAUSABAS': 'category',
    'CAUSABAS_O': 'category',
    'CAUSAMAT': 'category',
    'CB_PRE': 'category',
    'CIRCOBITO': 'category',
    'CIRURGIA': 'category',
    'CODCART': 'category',
    'CODESTAB': 'category',
    'CODIFICADO': 'category',
    'CODINST': 'category',
    'CODMUNCART': 'category',
    'CODMUNNATU': 'category',
    'CODMUNOCOR': 'category',
    'CODMUNRES': 'category',
    'COMUNSVOIM': 'category',
    'CRM': 'category',
    'DIFDATA': 'float32',
    'ESC': 'category',
    'ESC2010': 'category',
    'ESCFALAGR1': 'category',
    'ESCMAE': 'category',
    'ESCMAE2010': 'category',
    'ESCMAEAGR1': 'category',
    'ESTABDESCR': 'str',
    'ESTCIV': 'category',
    'EXAME': 'category',
    'FONTE': 'category',
    'FONTEINV': 'category',
    'FONTES': 'category',
    'FONTESINF': 'category',
    'GESTACAO': 'category',
    'GRAVIDEZ': 'category',
    'HORAOBITO': 'float32',
    'IDADE': 'float32',
    'IDADEMAE': 'float32',
    'LINHAA': 'category',
    # Was a second 'LINHAA' key, which left the LINHAB column without an
    # explicit dtype.
    'LINHAB': 'category',
    'LINHAC': 'category',
    'LINHAD': 'category',
    'LINHAII': 'category',
    'LOCOCOR': 'category',
    'MORTEPARTO': 'category',
    'NATURAL': 'category',
    'NECROPSIA': 'category',
    'NUDIASINF': 'float32',
    'NUDIASOBCO': 'float32',
    'NUDIASOBIN': 'float32',
    'NUMERODN': 'str',
    'NUMERODO': 'str',
    'NUMERODV': 'str',
    'NUMEROLOTE': 'str',
    'NUMREGCART': 'str',
    'NUMSUS': 'str',
    'OBITOGRAV': 'category',
    'OBITOPARTO': 'category',
    'OBITOPUERP': 'category',
    'OCUP': 'category',
    'OCUPMAE': 'category',
    'ORIGEM': 'category',
    'PARTO': 'category',
    'PESO': 'float32',
    'QTDFILMORT': 'float32',
    'QTDFILVIVO': 'float32',
    'RACACOR': 'category',
    'SEMAGESTAC': 'float32',
    'SERIESCFAL': 'category',
    'SERIESCMAE': 'category',
    'SEXO': 'category',
    'STCODIFICA': 'category',
    'STDOEPIDEM': 'float32',
    'STDONOVA': 'float32',
    'TIPOBITO': 'category',
    'TPMORTEOCO': 'category',
    'TPNIVELINV': 'category',
    'TPOBITOCOR': 'category',
    'TPPOS': 'category',
    'TPRESGINFO': 'category',
    'VERSAOSCB': 'str',
    'VERSAOSIST': 'str',
}

### SIM DOES2012 `df_sim_does2012_raw`

In [11]:
df_sim_does2012_raw, pf_sim_does2012_raw = load_resource_df_pf('sim-does2012-raw-csv',
                                                               resources_simdo_raw_dtypes,
                                                               resources_simdo_raw_date_cols_v1)
%store df_sim_does2012_raw

Stored 'df_sim_does2012_raw' (DataFrame)


### SIM DOES2013 `df_sim_does2013_raw`

In [12]:
df_sim_does2013_raw, pf_sim_does2013_raw = load_resource_df_pf('sim-does2013-raw-csv',
                                                               resources_simdo_raw_dtypes,
                                                               resources_simdo_raw_date_cols_v2)
%store df_sim_does2013_raw

Stored 'df_sim_does2013_raw' (DataFrame)


### SIM DOES2014 `df_sim_does2014_raw`

In [13]:
df_sim_does2014_raw, pf_sim_does2014_raw = load_resource_df_pf('sim-does2014-raw-csv',
                                                               resources_simdo_raw_dtypes,
                                                               resources_simdo_raw_date_cols_v3)
%store df_sim_does2014_raw

Stored 'df_sim_does2014_raw' (DataFrame)


### SIM DOES2015 `df_sim_does2015_raw`

In [14]:
df_sim_does2015_raw, pf_sim_does2015_raw = load_resource_df_pf('sim-does2015-raw-csv',
                                                               resources_simdo_raw_dtypes,
                                                               resources_simdo_raw_date_cols_v3)
%store df_sim_does2015_raw

Stored 'df_sim_does2015_raw' (DataFrame)


### SIM DOES2016 `df_sim_does2016_raw`

In [15]:
df_sim_does2016_raw, pf_sim_does2016_raw = load_resource_df_pf('sim-does2016-raw-csv',
                                                               resources_simdo_raw_dtypes,
                                                               resources_simdo_raw_date_cols_v3)
%store df_sim_does2016_raw

Stored 'df_sim_does2016_raw' (DataFrame)


### SIM DOES 2012..2016 `df_sim_does20122016_raw`

In [16]:
df_sim_does20122016_raw = pd.concat([
        df_sim_does2012_raw,
        df_sim_does2013_raw,
        df_sim_does2014_raw,
        df_sim_does2015_raw,
        df_sim_does2016_raw,
    ], 
    ignore_index=True, 
    sort=False,
    verify_integrity=True,)

%store df_sim_does20122016_raw

Stored 'df_sim_does20122016_raw' (DataFrame)


# Profiling

### SIM DOES2012 `df_sim_does2012_raw`

In [5]:
# Render the profiling report produced when the 2012 extract was loaded.
display(pf_sim_does2012_raw)

Stored 'df_sim_does2012_raw' (DataFrame)


0,1
Number of variables,73
Number of observations,21616
Total Missing (%),50.0%
Total size in memory,5.1 MiB
Average record size in memory,246.3 B

0,1
Numeric,10
Categorical,49
Boolean,1
Date,10
Text (Unique),0
Rejected,3
Unsupported,0

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),93.2%
Missing (n),20154

0,1
9,919
2,466
1,77
(Missing),20154

Value,Count,Frequency (%),Unnamed: 3
9,919,4.3%,
2,466,2.2%,
1,77,0.4%,
(Missing),20154,93.2%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),7.2%
Missing (n),1554

0,1
1,13553
2,3317
9,3192
(Missing),1554

Value,Count,Frequency (%),Unnamed: 3
1,13553,62.7%,
2,3317,15.3%,
9,3192,14.8%,
(Missing),1554,7.2%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),2.1%
Missing (n),444

0,1
1,6660
2,5093
3,3897
Other values (2),5522

Value,Count,Frequency (%),Unnamed: 3
1,6660,30.8%,
2,5093,23.6%,
3,3897,18.0%,
5,3125,14.5%,
4,2397,11.1%,
(Missing),444,2.1%,

0,1
Distinct count,1443
Unique (%),6.7%
Missing (%),0.0%
Missing (n),0

0,1
I219,1678
I64,779
J189,701
Other values (1440),18458

Value,Count,Frequency (%),Unnamed: 3
I219,1678,7.8%,
I64,779,3.6%,
J189,701,3.2%,
X954,690,3.2%,
E149,525,2.4%,
G309,390,1.8%,
C349,388,1.8%,
I694,378,1.7%,
I678,375,1.7%,
I110,349,1.6%,

0,1
Distinct count,1387
Unique (%),6.4%
Missing (%),0.0%
Missing (n),2

0,1
I219,1664
J189,782
I64,776
Other values (1383),18392

Value,Count,Frequency (%),Unnamed: 3
I219,1664,7.7%,
J189,782,3.6%,
I64,776,3.6%,
X954,647,3.0%,
E149,514,2.4%,
C349,382,1.8%,
I678,367,1.7%,
G309,362,1.7%,
X959,354,1.6%,
R99,344,1.6%,

0,1
Constant value,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),81.5%
Missing (n),17623

0,1
1,1859
3,1605
9,338
Other values (2),191
(Missing),17623

Value,Count,Frequency (%),Unnamed: 3
1,1859,8.6%,
3,1605,7.4%,
9,338,1.6%,
2,168,0.8%,
4,23,0.1%,
(Missing),17623,81.5%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),21591

0,1
2,20
9,3
1,2
(Missing),21591

Value,Count,Frequency (%),Unnamed: 3
2,20,0.1%,
9,3,0.0%,
1,2,0.0%,
(Missing),21591,99.9%,

0,1
Distinct count,287
Unique (%),1.3%
Missing (%),28.3%
Missing (n),6128

0,1
2486199,968
0011738,956
2550687,854
Other values (283),12710
(Missing),6128

Value,Count,Frequency (%),Unnamed: 3
2486199,968,4.5%,
0011738,956,4.4%,
2550687,854,4.0%,
2485680,797,3.7%,
2547821,646,3.0%,
2494442,638,3.0%,
2546957,603,2.8%,
0011746,541,2.5%,
0011819,537,2.5%,
2446030,497,2.3%,

0,1
Distinct count,84
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
RES3205300001,9518
MES3205300001,3748
MES3205200001,2944
Other values (81),5406

Value,Count,Frequency (%),Unnamed: 3
RES3205300001,9518,44.0%,
MES3205300001,3748,17.3%,
MES3205200001,2944,13.6%,
MES3205000001,2247,10.4%,
MES3201300001,1255,5.8%,
MES3201500001,1175,5.4%,
MES3200600001,325,1.5%,
MES3205100001,90,0.4%,
MRJ3300600001,46,0.2%,
MRJ3302200001,25,0.1%,

0,1
Distinct count,162
Unique (%),0.7%
Missing (%),0.0%
Missing (n),0

0,1
320530,3770
320520,2954
320500,2252
Other values (159),12640

Value,Count,Frequency (%),Unnamed: 3
320530,3770,17.4%,
320520,2954,13.7%,
320500,2252,10.4%,
320120,1908,8.8%,
320150,1267,5.9%,
320130,1258,5.8%,
320490,1043,4.8%,
320320,913,4.2%,
320240,361,1.7%,
320060,326,1.5%,

0,1
Distinct count,79
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
320520,2466
320500,2317
320130,2183
Other values (76),14650

Value,Count,Frequency (%),Unnamed: 3
320520,2466,11.4%,
320500,2317,10.7%,
320130,2183,10.1%,
320530,1893,8.8%,
320120,1300,6.0%,
320320,793,3.7%,
320150,753,3.5%,
320240,657,3.0%,
320490,621,2.9%,
320060,436,2.0%,

0,1
Distinct count,58
Unique (%),0.3%
Missing (%),71.1%
Missing (n),15376

0,1
320530,4636
320120,538
320320,496
Other values (54),570
(Missing),15376

Value,Count,Frequency (%),Unnamed: 3
320530,4636,21.4%,
320120,538,2.5%,
320320,496,2.3%,
320150,403,1.9%,
320390,26,0.1%,
320500,26,0.1%,
293135,11,0.1%,
330100,8,0.0%,
312770,8,0.0%,
330220,6,0.0%,

0,1
Distinct count,278
Unique (%),1.3%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,51.4307
Minimum,0.0
Maximum,725.0
Zeros (%),0.1%

0,1
Minimum,0.0
5-th percentile,23.0
Q1,37.0
Median,48.0
Q3,60.0
95-th percentile,83.0
Maximum,725.0
Range,725.0
Interquartile range,23.0

0,1
Standard deviation,31.947268
Coef of variation,0.6211712
Kurtosis,95.84133
Mean,51.4307
MAD,16.245462
Skewness,7.6797805
Sum,1111726.0
Variance,1020.6279
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
46.0,553,2.6%,
54.0,525,2.4%,
39.0,524,2.4%,
45.0,522,2.4%,
38.0,504,2.3%,
43.0,501,2.3%,
55.0,498,2.3%,
47.0,496,2.3%,
37.0,494,2.3%,
44.0,491,2.3%,

Value,Count,Frequency (%),Unnamed: 3
0.0,12,0.1%,
1.0,1,0.0%,
2.0,4,0.0%,
3.0,3,0.0%,
4.0,7,0.0%,

Value,Count,Frequency (%),Unnamed: 3
566.0,1,0.0%,
632.0,1,0.0%,
642.0,1,0.0%,
677.0,1,0.0%,
725.0,1,0.0%,

0,1
Distinct count,389
Unique (%),1.8%
Missing (%),0.2%
Missing (n),41
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-01 00:00:00
Maximum,2013-08-13 00:00:00

0,1
Distinct count,323
Unique (%),1.5%
Missing (%),0.6%
Missing (n),124
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-09 00:00:00
Maximum,2014-02-18 00:00:00

0,1
Distinct count,215
Unique (%),1.0%
Missing (%),97.2%
Missing (n),21019
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-02-15 00:00:00
Maximum,2014-01-28 00:00:00

0,1
Distinct count,282
Unique (%),1.3%
Missing (%),94.5%
Missing (n),20420
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-02-17 00:00:00
Maximum,2013-11-06 00:00:00

0,1
Distinct count,217
Unique (%),1.0%
Missing (%),97.4%
Missing (n),21057
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-13 00:00:00
Maximum,2014-01-28 00:00:00

0,1
Distinct count,398
Unique (%),1.8%
Missing (%),87.1%
Missing (n),18825
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-13 00:00:00
Maximum,2014-01-10 00:00:00

0,1
Distinct count,14828
Unique (%),68.6%
Missing (%),0.2%
Missing (n),48
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1901-02-15 00:00:00
Maximum,2012-12-30 00:00:00

0,1
Distinct count,366
Unique (%),1.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-01 00:00:00
Maximum,2012-12-31 00:00:00

0,1
Distinct count,217
Unique (%),1.0%
Missing (%),0.1%
Missing (n),12
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-10 00:00:00
Maximum,2014-02-14 00:00:00

0,1
Distinct count,191
Unique (%),0.9%
Missing (%),0.1%
Missing (n),12
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-10 00:00:00
Maximum,2014-02-14 00:00:00

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),11.7%
Missing (n),2534

0,1
9,5014
2,4256
1,2824
Other values (4),6988
(Missing),2534

Value,Count,Frequency (%),Unnamed: 3
9,5014,23.2%,
2,4256,19.7%,
1,2824,13.1%,
3,2528,11.7%,
0,2299,10.6%,
4,1644,7.6%,
5,517,2.4%,
(Missing),2534,11.7%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),22.5%
Missing (n),4864

0,1
9,5007
1,4874
0,2818
Other values (4),4053
(Missing),4864

Value,Count,Frequency (%),Unnamed: 3
9,5007,23.2%,
1,4874,22.5%,
0,2818,13.0%,
2,2089,9.7%,
3,1449,6.7%,
5,410,1.9%,
4,105,0.5%,
(Missing),4864,22.5%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.6%
Missing (n),21095

0,1
4,208
3,119
9,79
Other values (4),115
(Missing),21095

Value,Count,Frequency (%),Unnamed: 3
4,208,1.0%,
3,119,0.6%,
9,79,0.4%,
5,42,0.2%,
2,30,0.1%,
0,22,0.1%,
1,21,0.1%,
(Missing),21095,97.6%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.7%
Missing (n),21119

0,1
3,183
2,135
9,79
Other values (4),100
(Missing),21119

Value,Count,Frequency (%),Unnamed: 3
3,183,0.8%,
2,135,0.6%,
9,79,0.4%,
1,38,0.2%,
5,23,0.1%,
0,21,0.1%,
4,18,0.1%,
(Missing),21119,97.7%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),11.1%
Missing (n),2403

0,1
2,6698
1,5132
3,4047
Other values (3),3336
(Missing),2403

Value,Count,Frequency (%),Unnamed: 3
2,6698,31.0%,
1,5132,23.7%,
3,4047,18.7%,
9,1882,8.7%,
4,1093,5.1%,
5,361,1.7%,
(Missing),2403,11.1%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),21591

0,1
2,11
1,9
9,5
(Missing),21591

Value,Count,Frequency (%),Unnamed: 3
2,11,0.1%,
1,9,0.0%,
9,5,0.0%,
(Missing),21591,99.9%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),82.8%
Missing (n),17904

0,1
1,2528
2,392
9,376
Other values (2),416
(Missing),17904

Value,Count,Frequency (%),Unnamed: 3
1,2528,11.7%,
2,392,1.8%,
9,376,1.7%,
4,257,1.2%,
3,159,0.7%,
(Missing),17904,82.8%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),84.5%
Missing (n),18268

0,1
3,1208
1,579
6,508
Other values (5),1053
(Missing),18268

Value,Count,Frequency (%),Unnamed: 3
3,1208,5.6%,
1,579,2.7%,
6,508,2.4%,
4,362,1.7%,
2,316,1.5%,
8,315,1.5%,
5,32,0.1%,
7,28,0.1%,
(Missing),18268,84.5%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.8%
Missing (n),21148

0,1
5,141
4,99
3,96
Other values (4),132
(Missing),21148

Value,Count,Frequency (%),Unnamed: 3
5,141,0.7%,
4,99,0.5%,
3,96,0.4%,
2,93,0.4%,
1,32,0.1%,
9,4,0.0%,
6,3,0.0%,
(Missing),21148,97.8%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21082

0,1
1,448
2,53
9,33
(Missing),21082

Value,Count,Frequency (%),Unnamed: 3
1,448,2.1%,
2,53,0.2%,
9,33,0.2%,
(Missing),21082,97.5%,

0,1
Distinct count,1117
Unique (%),5.2%
Missing (%),11.5%
Missing (n),2493
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1191.3717
Minimum,0.0
Maximum,2359.0
Zeros (%),0.2%

0,1
Minimum,0.0
5-th percentile,125.0
Q1,620.0
Median,1200.0
Q3,1800.0
95-th percentile,2240.0
Maximum,2359.0
Range,2359.0
Interquartile range,1180.0

0,1
Standard deviation,675.5093
Coef of variation,0.5670013
Kurtosis,-1.1723601
Mean,1191.3717
MAD,584.46564
Skewness,0.0052499035
Sum,22782600.0
Variance,456312.8
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
500.0,283,1.3%,
600.0,279,1.3%,
1700.0,236,1.1%,
700.0,231,1.1%,
1000.0,220,1.0%,
800.0,220,1.0%,
900.0,210,1.0%,
400.0,210,1.0%,
1500.0,207,1.0%,
2200.0,204,0.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,51,0.2%,
1.0,6,0.0%,
2.0,6,0.0%,
3.0,3,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2354.0,1,0.0%,
2355.0,35,0.2%,
2357.0,2,0.0%,
2358.0,3,0.0%,
2359.0,3,0.0%,

0,1
Distinct count,186
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,456.1278
Minimum,1.0
Maximum,999.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,417.0
Q1,447.0
Median,466.0
Q3,480.0
95-th percentile,491.0
Maximum,999.0
Range,998.0
Interquartile range,33.0

0,1
Standard deviation,51.70393
Coef of variation,0.11335404
Kurtosis,34.759533
Mean,456.1278
MAD,26.2652
Skewness,-3.0588236
Sum,9859659.0
Variance,2673.2964
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
483.0,478,2.2%,
481.0,463,2.1%,
476.0,455,2.1%,
477.0,450,2.1%,
484.0,447,2.1%,
479.0,445,2.1%,
482.0,443,2.0%,
485.0,434,2.0%,
478.0,422,2.0%,
480.0,400,1.9%,

Value,Count,Frequency (%),Unnamed: 3
1.0,3,0.0%,
2.0,2,0.0%,
3.0,2,0.0%,
5.0,4,0.0%,
8.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
507.0,2,0.0%,
508.0,2,0.0%,
509.0,1,0.0%,
511.0,1,0.0%,
999.0,20,0.1%,

0,1
Distinct count,35
Unique (%),0.2%
Missing (%),97.8%
Missing (n),21147
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,25.976545
Minimum,9.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,9.0
5-th percentile,16.0
Q1,20.0
Median,25.0
Q3,31.0
95-th percentile,38.0
Maximum,99.0
Range,90.0
Interquartile range,11.0

0,1
Standard deviation,7.6012735
Coef of variation,0.29262066
Kurtosis,16.975986
Mean,25.976545
MAD,5.8005557
Skewness,2.136634
Sum,12183.0
Variance,57.77936
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
22.0,33,0.2%,
25.0,30,0.1%,
19.0,29,0.1%,
18.0,27,0.1%,
26.0,25,0.1%,
28.0,25,0.1%,
21.0,24,0.1%,
20.0,23,0.1%,
30.0,21,0.1%,
24.0,20,0.1%,

Value,Count,Frequency (%),Unnamed: 3
9.0,1,0.0%,
13.0,2,0.0%,
14.0,3,0.0%,
15.0,8,0.0%,
16.0,14,0.1%,

Value,Count,Frequency (%),Unnamed: 3
41.0,4,0.0%,
42.0,4,0.0%,
44.0,1,0.0%,
45.0,1,0.0%,
99.0,1,0.0%,

0,1
Distinct count,1014
Unique (%),4.7%
Missing (%),1.4%
Missing (n),309

0,1
*A419,3166
*R092,1382
*J969,1214
Other values (1010),15545

Value,Count,Frequency (%),Unnamed: 3
*A419,3166,14.6%,
*R092,1382,6.4%,
*J969,1214,5.6%,
*R688,1149,5.3%,
*I219,1090,5.0%,
*J960,947,4.4%,
*J81X,826,3.8%,
*R570,603,2.8%,
*J189,470,2.2%,
*T792,342,1.6%,

0,1
Distinct count,1442
Unique (%),6.7%
Missing (%),20.4%
Missing (n),4419

0,1
*J189,1560
*A419,914
*I10X,766
Other values (1438),13957
(Missing),4419

Value,Count,Frequency (%),Unnamed: 3
*J189,1560,7.2%,
*A419,914,4.2%,
*I10X,766,3.5%,
*I219,638,3.0%,
*S069,417,1.9%,
*I500,404,1.9%,
*J180,298,1.4%,
*I509,267,1.2%,
*J159,262,1.2%,
*N390,261,1.2%,

0,1
Distinct count,1435
Unique (%),6.6%
Missing (%),44.8%
Missing (n),9678

0,1
*I10X,956
*J189,572
*E149,305
Other values (1431),10105
(Missing),9678

Value,Count,Frequency (%),Unnamed: 3
*I10X,956,4.4%,
*J189,572,2.6%,
*E149,305,1.4%,
*J449,288,1.3%,
*X954,238,1.1%,
*I219,228,1.1%,
*I64X,226,1.0%,
*N189,213,1.0%,
*I500,210,1.0%,
*I251,194,0.9%,

0,1
Distinct count,958
Unique (%),4.4%
Missing (%),75.1%
Missing (n),16232

0,1
*I10X,778
*E149,245
*F102,184
Other values (954),4177
(Missing),16232

Value,Count,Frequency (%),Unnamed: 3
*I10X,778,3.6%,
*E149,245,1.1%,
*F102,184,0.9%,
*N189,110,0.5%,
*J449,106,0.5%,
*I694,105,0.5%,
*J189,99,0.5%,
*G309,93,0.4%,
*F172,83,0.4%,
*I64X,82,0.4%,

0,1
Distinct count,2098
Unique (%),9.7%
Missing (%),69.7%
Missing (n),15068

0,1
*I10X,651
*E149,318
*I10X*E149,203
Other values (2094),5376
(Missing),15068

Value,Count,Frequency (%),Unnamed: 3
*I10X,651,3.0%,
*E149,318,1.5%,
*I10X*E149,203,0.9%,
*F102,151,0.7%,
*E149*I10,147,0.7%,
*N189,143,0.7%,
*F172,140,0.6%,
*R54X,131,0.6%,
*G309,112,0.5%,
*N179,101,0.5%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,14861
3,3705
4,1691
Other values (3),1359

Value,Count,Frequency (%),Unnamed: 3
1,14861,68.8%,
3,3705,17.1%,
4,1691,7.8%,
5,671,3.1%,
2,627,2.9%,
9,61,0.3%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.2%
Missing (n),21019

0,1
3,580
9,13
1,3
(Missing),21019

Value,Count,Frequency (%),Unnamed: 3
3,580,2.7%,
9,13,0.1%,
1,3,0.0%,
2,1,0.0%,
(Missing),21019,97.2%,

0,1
Distinct count,34
Unique (%),0.2%
Missing (%),94.2%
Missing (n),20360

0,1
800,1147
190,22
832,15
Other values (30),72
(Missing),20360

Value,Count,Frequency (%),Unnamed: 3
800,1147,5.3%,
190,22,0.1%,
832,15,0.1%,
125,11,0.1%,
999,7,0.0%,
831,7,0.0%,
135,4,0.0%,
77,4,0.0%,
78,4,0.0%,
188,3,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),6.7%
Missing (n),1445

0,1
2,13265
1,6065
9,841
(Missing),1445

Value,Count,Frequency (%),Unnamed: 3
2,13265,61.4%,
1,6065,28.1%,
9,841,3.9%,
(Missing),1445,6.7%,

0,1
Distinct count,296
Unique (%),1.4%
Missing (%),91.7%
Missing (n),19823
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,112.4908
Minimum,14.0
Maximum,599.0
Zeros (%),0.0%

0,1
Minimum,14.0
5-th percentile,37.0
Q1,63.0
Median,92.0
Q3,136.0
95-th percentile,274.4
Maximum,599.0
Range,585.0
Interquartile range,73.0

0,1
Standard deviation,74.221535
Coef of variation,0.65980095
Kurtosis,5.1696024
Mean,112.4908
MAD,52.975758
Skewness,1.9878831
Sum,201696.0
Variance,5508.836
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
64.0,29,0.1%,
65.0,25,0.1%,
57.0,25,0.1%,
63.0,24,0.1%,
53.0,23,0.1%,
74.0,21,0.1%,
72.0,20,0.1%,
59.0,20,0.1%,
90.0,18,0.1%,
77.0,18,0.1%,

Value,Count,Frequency (%),Unnamed: 3
14.0,1,0.0%,
17.0,1,0.0%,
18.0,1,0.0%,
19.0,1,0.0%,
21.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
448.0,1,0.0%,
469.0,1,0.0%,
472.0,1,0.0%,
512.0,1,0.0%,
599.0,1,0.0%,

0,1
Distinct count,220
Unique (%),1.0%
Missing (%),99.0%
Missing (n),21393

0,1
59410319,2
62103604,2
59410472,2
Other values (216),217
(Missing),21393

Value,Count,Frequency (%),Unnamed: 3
59410319,2,0.0%,
62103604,2,0.0%,
59410472,2,0.0%,
59425948,2,0.0%,
59398396,1,0.0%,
57482481,1,0.0%,
57784040,1,0.0%,
59425810,1,0.0%,
57393846,1,0.0%,
59418264,1,0.0%,

0,1
Distinct count,21615
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0

0,1
18178000,2
16748497,1
16592402,1
Other values (21612),21612

Value,Count,Frequency (%),Unnamed: 3
18178000,2,0.0%,
16748497,1,0.0%,
16592402,1,0.0%,
18721951,1,0.0%,
18174251,1,0.0%,
16531626,1,0.0%,
18173641,1,0.0%,
16017570,1,0.0%,
16745573,1,0.0%,
18178714,1,0.0%,

0,1
Distinct count,11
Unique (%),0.1%
Missing (%),0.1%
Missing (n),13

0,1
0,3905
7,1988
1,1982
Other values (7),13728

Value,Count,Frequency (%),Unnamed: 3
0,3905,18.1%,
7,1988,9.2%,
1,1982,9.2%,
9,1978,9.2%,
6,1977,9.1%,
4,1974,9.1%,
3,1959,9.1%,
2,1950,9.0%,
5,1947,9.0%,
8,1943,9.0%,

0,1
Distinct count,1095
Unique (%),5.1%
Missing (%),94.9%
Missing (n),20522

0,1
204094984880002,1
898001204578364,1
898050073442889,1
Other values (1091),1091
(Missing),20522

Value,Count,Frequency (%),Unnamed: 3
204094984880002,1,0.0%,
898001204578364,1,0.0%,
898050073442889,1,0.0%,
898000141224217,1,0.0%,
898050085218008,1,0.0%,
898002771837163,1,0.0%,
898001038441511,1,0.0%,
209981477580008,1,0.0%,
898003016520879,1,0.0%,
980016284699978,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),91.9%
Missing (n),19865

0,1
2,1268
9,457
1,26
(Missing),19865

Value,Count,Frequency (%),Unnamed: 3
2,1268,5.9%,
9,457,2.1%,
1,26,0.1%,
(Missing),19865,91.9%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21084

0,1
3,528
9,4
(Missing),21084

Value,Count,Frequency (%),Unnamed: 3
3,528,2.4%,
9,4,0.0%,
(Missing),21084,97.5%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),91.9%
Missing (n),19866

0,1
3,1250
9,457
1,22
(Missing),19866

Value,Count,Frequency (%),Unnamed: 3
3,1250,5.8%,
9,457,2.1%,
1,22,0.1%,
2,21,0.1%,
(Missing),19866,91.9%,

0,1
Distinct count,563
Unique (%),2.6%
Missing (%),22.1%
Missing (n),4776

0,1
999993,5864
999992,2895
621005,2498
Other values (559),5583
(Missing),4776

Value,Count,Frequency (%),Unnamed: 3
999993,5864,27.1%,
999992,2895,13.4%,
621005,2498,11.6%,
715210,685,3.2%,
999991,332,1.5%,
141410,221,1.0%,
782305,202,0.9%,
512105,201,0.9%,
354705,194,0.9%,
622020,140,0.6%,

0,1
Distinct count,67
Unique (%),0.3%
Missing (%),98.3%
Missing (n),21242

0,1
999992,204
999991,35
621005,17
Other values (63),118
(Missing),21242

Value,Count,Frequency (%),Unnamed: 3
999992,204,0.9%,
999991,35,0.2%,
621005,17,0.1%,
521110,7,0.0%,
421125,7,0.0%,
512105,6,0.0%,
516110,5,0.0%,
512120,5,0.0%,
141410,5,0.0%,
622020,5,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,21604
2,12

Value,Count,Frequency (%),Unnamed: 3
1,21604,99.9%,
2,12,0.1%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21083

0,1
2,298
1,202
9,33
(Missing),21083

Value,Count,Frequency (%),Unnamed: 3
2,298,1.4%,
1,202,0.9%,
9,33,0.2%,
(Missing),21083,97.5%,

0,1
Distinct count,331
Unique (%),1.5%
Missing (%),97.8%
Missing (n),21136
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1820.55
Minimum,99.0
Maximum,4965.0
Zeros (%),0.0%

0,1
Minimum,99.0
5-th percentile,500.0
Q1,910.0
Median,1518.0
Q3,2750.0
95-th percentile,3716.2
Maximum,4965.0
Range,4866.0
Interquartile range,1840.0

0,1
Standard deviation,1077.4243
Coef of variation,0.59181255
Kurtosis,-0.8372689
Mean,1820.55
MAD,940.54565
Skewness,0.5284141
Sum,873864.0
Variance,1160843.2
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,8,0.0%,
2800.0,6,0.0%,
3200.0,4,0.0%,
710.0,4,0.0%,
620.0,4,0.0%,
1120.0,4,0.0%,
3500.0,4,0.0%,
935.0,3,0.0%,
680.0,3,0.0%,
500.0,3,0.0%,

Value,Count,Frequency (%),Unnamed: 3
99.0,1,0.0%,
268.0,1,0.0%,
324.0,1,0.0%,
360.0,1,0.0%,
370.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4360.0,1,0.0%,
4400.0,1,0.0%,
4430.0,1,0.0%,
4890.0,1,0.0%,
4965.0,1,0.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),98.1%
Missing (n),21210
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.2413793
Minimum,0.0
Maximum,99.0
Zeros (%),1.4%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,0.0
Median,0.0
Q3,1.0
95-th percentile,1.75
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,13.748386
Coef of variation,6.1338954
Kurtosis,46.161846
Mean,2.2413793
MAD,3.8466108
Skewness,6.916435
Sum,910.0
Variance,189.01813
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
0.0,301,1.4%,
1.0,84,0.4%,
99.0,8,0.0%,
2.0,8,0.0%,
3.0,3,0.0%,
5.0,1,0.0%,
4.0,1,0.0%,
(Missing),21210,98.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,301,1.4%,
1.0,84,0.4%,
2.0,8,0.0%,
3.0,3,0.0%,
4.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2.0,8,0.0%,
3.0,3,0.0%,
4.0,1,0.0%,
5.0,1,0.0%,
99.0,8,0.0%,

0,1
Distinct count,12
Unique (%),0.1%
Missing (%),97.9%
Missing (n),21158
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.886463
Minimum,0.0
Maximum,99.0
Zeros (%),0.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,1.0
Median,1.0
Q3,2.0
95-th percentile,5.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,11.1855345
Coef of variation,3.87517
Kurtosis,69.50092
Mean,2.886463
MAD,2.9418967
Skewness,8.362496
Sum,1322.0
Variance,125.11619
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
1.0,163,0.8%,
0.0,98,0.5%,
2.0,94,0.4%,
3.0,52,0.2%,
4.0,25,0.1%,
5.0,11,0.1%,
99.0,6,0.0%,
7.0,4,0.0%,
6.0,3,0.0%,
11.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,98,0.5%,
1.0,163,0.8%,
2.0,94,0.4%,
3.0,52,0.2%,
4.0,25,0.1%,

Value,Count,Frequency (%),Unnamed: 3
6.0,3,0.0%,
7.0,4,0.0%,
9.0,1,0.0%,
11.0,1,0.0%,
99.0,6,0.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),12.5%
Missing (n),2700

0,1
1,8722
4,8264
2,1854
Other values (2),76
(Missing),2700

Value,Count,Frequency (%),Unnamed: 3
1,8722,40.3%,
4,8264,38.2%,
2,1854,8.6%,
3,46,0.2%,
5,30,0.1%,
(Missing),2700,12.5%,

0,1
Distinct count,32
Unique (%),0.1%
Missing (%),97.8%
Missing (n),21150
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,31.785408
Minimum,0.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,22.0
Q1,27.0
Median,32.0
Q3,38.0
95-th percentile,40.0
Maximum,99.0
Range,99.0
Interquartile range,11.0

0,1
Standard deviation,9.978099
Coef of variation,0.31392074
Kurtosis,17.74902
Mean,31.785408
MAD,6.3415246
Skewness,1.7775881
Sum,14812.0
Variance,99.562454
Memory size,84.5 KiB

Value,Count,Frequency (%),Unnamed: 3
39.0,43,0.2%,
38.0,31,0.1%,
28.0,31,0.1%,
30.0,30,0.1%,
40.0,28,0.1%,
32.0,26,0.1%,
37.0,26,0.1%,
26.0,24,0.1%,
27.0,22,0.1%,
29.0,21,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,2,0.0%,
1.0,4,0.0%,
2.0,3,0.0%,
3.0,4,0.0%,
5.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
39.0,43,0.2%,
40.0,28,0.1%,
41.0,12,0.1%,
42.0,3,0.0%,
99.0,4,0.0%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),92.6%
Missing (n),20018

0,1
4,622
3,255
8,190
Other values (5),531
(Missing),20018

Value,Count,Frequency (%),Unnamed: 3
4,622,2.9%,
3,255,1.2%,
8,190,0.9%,
5,156,0.7%,
2,134,0.6%,
1,91,0.4%,
7,82,0.4%,
6,68,0.3%,
(Missing),20018,92.6%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),99.4%
Missing (n),21493

0,1
3,26
8,25
7,15
Other values (5),57
(Missing),21493

Value,Count,Frequency (%),Unnamed: 3
3,26,0.1%,
8,25,0.1%,
7,15,0.1%,
2,15,0.1%,
1,14,0.1%,
5,10,0.0%,
6,9,0.0%,
4,9,0.0%,
(Missing),21493,99.4%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,12818
2,8796
0,2

Value,Count,Frequency (%),Unnamed: 3
1,12818,59.3%,
2,8796,40.7%,
0,2,0.0%,

0,1
Constant value,0.0

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
Mean,0.99810326

0,1
1.0,21575
0.0,41

Value,Count,Frequency (%),Unnamed: 3
1.0,21575,99.8%,
0.0,41,0.2%,

0,1
Constant value,2

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),91.9%
Missing (n),19867

0,1
8,1223
9,457
4,22
Other values (3),47
(Missing),19867

Value,Count,Frequency (%),Unnamed: 3
8,1223,5.7%,
9,457,2.1%,
4,22,0.1%,
1,22,0.1%,
5,21,0.1%,
2,4,0.0%,
(Missing),19867,91.9%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),94.5%
Missing (n),20420

0,1
9,885
8,254
5,23
Other values (5),34
(Missing),20420

Value,Count,Frequency (%),Unnamed: 3
9,885,4.1%,
8,254,1.2%,
5,23,0.1%,
1,16,0.1%,
6,12,0.1%,
4,4,0.0%,
7,1,0.0%,
3,1,0.0%,
(Missing),20420,94.5%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.7%
Missing (n),154

0,1
N,18055
S,3407
(Missing),154

Value,Count,Frequency (%),Unnamed: 3
N,18055,83.5%,
S,3407,15.8%,
(Missing),154,0.7%,

0,1
Distinct count,21616
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,10808
Minimum,1
Maximum,21616
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,1081.8
Q1,5404.8
Median,10808.0
Q3,16212.0
95-th percentile,20535.0
Maximum,21616.0
Range,21615.0
Interquartile range,10808.0

0,1
Standard deviation,6240.1
Coef of variation,0.57734
Kurtosis,-1.2
Mean,10808
MAD,5404
Skewness,0
Sum,233636536
Variance,38939000
Memory size,169.0 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,1,0.0%,
14994,1,0.0%,
645,1,0.0%,
6790,1,0.0%,
4743,1,0.0%,
19084,1,0.0%,
17037,1,0.0%,
21135,1,0.0%,
10896,1,0.0%,
8849,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,1,0.0%,
2,1,0.0%,
3,1,0.0%,
4,1,0.0%,
5,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
21612,1,0.0%,
21613,1,0.0%,
21614,1,0.0%,
21615,1,0.0%,
21616,1,0.0%,

Unnamed: 0.1,ACIDTRAB,ASSISTMED,ATESTANTE,CAUSABAS,CAUSABAS_O,CAUSAMAT,CIRCOBITO,CIRURGIA,CODESTAB,CODINST,CODMUNOCOR,CODMUNRES,COMUNSVOIM,DIFDATA,DTATESTADO,DTCADASTRO,DTCADINF,DTCADINV,DTCONCASO,DTINVESTIG,DTNASC,DTOBITO,DTRECEBIM,DTRECORIGA,ESC,ESC2010,ESCMAE,ESCMAE2010,ESTCIV,EXAME,FONTE,FONTEINV,GESTACAO,GRAVIDEZ,HORAOBITO,IDADE,IDADEMAE,LINHAA,LINHAB,LINHAC,LINHAD,LINHAII,LOCOCOR,MORTEPARTO,NATURAL,NECROPSIA,NUDIASOBIN,NUMERODN,NUMERODO,NUMERODV,NUMSUS,OBITOGRAV,OBITOPARTO,OBITOPUERP,OCUP,OCUPMAE,ORIGEM,PARTO,PESO,QTDFILMORT,QTDFILVIVO,RACACOR,SEMAGESTAC,SERIESCFAL,SERIESCMAE,SEXO,STDOEPIDEM,STDONOVA,TIPOBITO,TPMORTEOCO,TPOBITOCOR,TPPOS,Unnamed: 0
0,,1,5,I10,I10,,,,,MES3205200001,320520,320520,,69.0,2012-03-08,2012-04-26,NaT,NaT,NaT,NaT,1935-01-10,2012-03-08,2012-05-16,2012-05-16,4,,,,1,,,,,,1930.0,477.0,,*R092,*I10X,,,,3,,832,,,,4282305,,,,,,999993,,1,,,,,1,,,,1,0.0,0.0,2,,,N,1
1,,9,2,N390,N390,,,9.0,,MES3205300001,320530,320530,,57.0,2012-02-23,2012-03-13,NaT,NaT,NaT,NaT,1939-08-03,2012-02-23,2012-04-20,2012-04-20,4,,,,9,2.0,,,,,850.0,472.0,,*R688,*A419,*N390,,*C719,3,,832,9.0,,,6366366,,,,,,999993,,1,,,,,1,,,,2,0.0,0.0,2,,,N,2
2,,1,1,I132,I132,,,2.0,,MES3205200001,320520,320520,,59.0,2012-01-25,2012-03-14,NaT,NaT,NaT,NaT,1931-10-25,2012-01-24,2012-03-23,2012-03-23,1,,,,2,9.0,,,,,2040.0,480.0,,*I500,*I351,*I10X,*N189,,3,,832,2.0,,,7154314,,,,,,715210,,1,,,,,1,,,,1,0.0,0.0,2,,,N,3
3,,1,1,I219,I219,,,2.0,,MES3205200001,320520,320520,,60.0,2012-01-23,2012-03-14,NaT,NaT,NaT,NaT,1921-03-03,2012-01-23,2012-03-23,2012-03-23,3,,,,1,2.0,,,,,1300.0,490.0,,*I219,*J969,,,,3,,832,2.0,,,7473127,,,,,,351505,,1,,,,,1,,,,2,0.0,0.0,2,,,N,4
4,,9,1,J440,J440,,,9.0,11835.0,MES3205300001,320530,320510,,59.0,2012-08-13,2012-09-18,NaT,NaT,NaT,NaT,1935-04-19,2012-08-13,2012-10-11,2012-10-11,1,,,,2,9.0,,,,,900.0,477.0,,*J969,*J189,*I219,*J449,*I10X*I252,2,,832,9.0,,,9947827,,,,,,999993,,1,,,,,1,,,,1,0.0,0.0,2,,,N,5


### SIM DOES2013 `df_sim_does2013_raw`

In [6]:
# Show the 2013 SIM profile object with IPython's rich display.
# NOTE(review): `pf_sim_does2013_raw` is not defined in this visible cell source;
# presumably it is the ProfileReport returned by `load_resource_df_pf` -- confirm
# it is created (and `df_sim_does2013_raw` stored) before this call on a fresh kernel.
display(pf_sim_does2013_raw)

Stored 'df_sim_does2013_raw' (DataFrame)


0,1
Number of variables,78
Number of observations,21651
Total Missing (%),48.1%
Total size in memory,5.7 MiB
Average record size in memory,274.2 B

0,1
Numeric,10
Categorical,50
Boolean,1
Date,12
Text (Unique),1
Rejected,4
Unsupported,0

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),93.8%
Missing (n),20301

0,1
9,761
2,511
1,78
(Missing),20301

Value,Count,Frequency (%),Unnamed: 3
9,761,3.5%,
2,511,2.4%,
1,78,0.4%,
(Missing),20301,93.8%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),4.5%
Missing (n),984

0,1
1,14173
2,3393
9,3101
(Missing),984

Value,Count,Frequency (%),Unnamed: 3
1,14173,65.5%,
2,3393,15.7%,
9,3101,14.3%,
(Missing),984,4.5%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),1.8%
Missing (n),385

0,1
1,6534
2,4943
3,3797
Other values (2),5992

Value,Count,Frequency (%),Unnamed: 3
1,6534,30.2%,
2,4943,22.8%,
3,3797,17.5%,
5,3361,15.5%,
4,2631,12.2%,
(Missing),385,1.8%,

0,1
Distinct count,1408
Unique (%),6.5%
Missing (%),0.0%
Missing (n),0

0,1
I219,1777
X954,704
I64,693
Other values (1405),18477

Value,Count,Frequency (%),Unnamed: 3
I219,1777,8.2%,
X954,704,3.3%,
I64,693,3.2%,
J189,688,3.2%,
E149,518,2.4%,
C349,461,2.1%,
I694,415,1.9%,
I678,394,1.8%,
I110,376,1.7%,
G309,367,1.7%,

0,1
Distinct count,1358
Unique (%),6.3%
Missing (%),0.0%
Missing (n),5

0,1
I219,1769
J189,770
I64,685
Other values (1354),18422

Value,Count,Frequency (%),Unnamed: 3
I219,1769,8.2%,
J189,770,3.6%,
I64,685,3.2%,
X954,658,3.0%,
E149,504,2.3%,
C349,459,2.1%,
I678,383,1.8%,
I694,359,1.7%,
J440,345,1.6%,
G309,344,1.6%,

0,1
Constant value,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),82.0%
Missing (n),17760

0,1
1,1839
3,1569
9,321
Other values (2),162
(Missing),17760

Value,Count,Frequency (%),Unnamed: 3
1,1839,8.5%,
3,1569,7.2%,
9,321,1.5%,
2,156,0.7%,
4,6,0.0%,
(Missing),17760,82.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),21623

0,1
2,16
9,6
1,6
(Missing),21623

Value,Count,Frequency (%),Unnamed: 3
2,16,0.1%,
9,6,0.0%,
1,6,0.0%,
(Missing),21623,99.9%,

0,1
Distinct count,258
Unique (%),1.2%
Missing (%),0.8%
Missing (n),176

0,1
1,3459
5220,2272
4909,1180
Other values (254),14564

Value,Count,Frequency (%),Unnamed: 3
1,3459,16.0%,
5220,2272,10.5%,
4909,1180,5.5%,
6104,1151,5.3%,
1617,1044,4.8%,
4085,1022,4.7%,
3441,828,3.8%,
2275,821,3.8%,
4911,764,3.5%,
1616,642,3.0%,

0,1
Distinct count,302
Unique (%),1.4%
Missing (%),29.1%
Missing (n),6291

0,1
0011738,920
2550687,889
2485680,837
Other values (298),12714
(Missing),6291

Value,Count,Frequency (%),Unnamed: 3
0011738,920,4.2%,
2550687,889,4.1%,
2485680,837,3.9%,
2547821,682,3.1%,
7257406,655,3.0%,
2494442,605,2.8%,
2546957,562,2.6%,
2446030,528,2.4%,
0011746,516,2.4%,
2486199,475,2.2%,

0,1
Distinct count,91
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
RES3205300001,9535
MES3205300001,3797
MES3205200001,2703
Other values (88),5616

Value,Count,Frequency (%),Unnamed: 3
RES3205300001,9535,44.0%,
MES3205300001,3797,17.5%,
MES3205200001,2703,12.5%,
MES3205000001,2647,12.2%,
MES3201500001,1189,5.5%,
MES3201300001,1151,5.3%,
MES3200600001,335,1.5%,
MRJ3300600001,30,0.1%,
MBA2931350001,26,0.1%,
MRJ3302200001,23,0.1%,

0,1
Distinct count,112
Unique (%),0.5%
Missing (%),0.8%
Missing (n),170

0,1
320530,3796
320520,2698
320500,2646
Other values (108),12341

Value,Count,Frequency (%),Unnamed: 3
320530,3796,17.5%,
320520,2698,12.5%,
320500,2646,12.2%,
320120,1985,9.2%,
320150,1188,5.5%,
320130,1153,5.3%,
320490,1063,4.9%,
320320,857,4.0%,
320240,339,1.6%,
320060,334,1.5%,

0,1
Distinct count,174
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0

0,1
320530,3825
320520,2710
320500,2655
Other values (171),12461

Value,Count,Frequency (%),Unnamed: 3
320530,3825,17.7%,
320520,2710,12.5%,
320500,2655,12.3%,
320120,1991,9.2%,
320150,1254,5.8%,
320130,1156,5.3%,
320490,1079,5.0%,
320320,860,4.0%,
320240,339,1.6%,
320060,337,1.6%,

0,1
Distinct count,79
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
320520,2454
320500,2299
320130,2187
Other values (76),14711

Value,Count,Frequency (%),Unnamed: 3
320520,2454,11.3%,
320500,2299,10.6%,
320130,2187,10.1%,
320530,2033,9.4%,
320120,1307,6.0%,
320320,756,3.5%,
320150,730,3.4%,
320240,657,3.0%,
320490,648,3.0%,
320060,421,1.9%,

0,1
Distinct count,52
Unique (%),0.2%
Missing (%),70.7%
Missing (n),15297

0,1
320530,4851
320320,533
320120,509
Other values (48),461
(Missing),15297

Value,Count,Frequency (%),Unnamed: 3
320530,4851,22.4%,
320320,533,2.5%,
320120,509,2.4%,
320150,330,1.5%,
293135,25,0.1%,
320500,22,0.1%,
330240,6,0.0%,
312770,6,0.0%,
313940,6,0.0%,
330220,4,0.0%,

0,1
Distinct count,278
Unique (%),1.3%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,55.72874
Minimum,0.0
Maximum,666.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,24.0
Q1,39.0
Median,51.0
Q3,66.0
95-th percentile,94.0
Maximum,666.0
Range,666.0
Interquartile range,27.0

0,1
Standard deviation,32.90761
Coef of variation,0.59049624
Kurtosis,87.45659
Mean,55.72874
MAD,18.619123
Skewness,7.023249
Sum,1206583.0
Variance,1082.911
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
46.0,520,2.4%,
49.0,487,2.2%,
47.0,484,2.2%,
40.0,472,2.2%,
45.0,471,2.2%,
41.0,469,2.2%,
50.0,463,2.1%,
42.0,448,2.1%,
43.0,441,2.0%,
48.0,438,2.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,5,0.0%,
2.0,5,0.0%,
3.0,1,0.0%,
4.0,6,0.0%,
5.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
596.0,1,0.0%,
598.0,1,0.0%,
608.0,1,0.0%,
648.0,1,0.0%,
666.0,1,0.0%,

0,1
Distinct count,386
Unique (%),1.8%
Missing (%),0.2%
Missing (n),43
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-01 00:00:00
Maximum,2014-12-15 00:00:00

0,1
Distinct count,342
Unique (%),1.6%
Missing (%),5.5%
Missing (n),1185
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-08 00:00:00
Maximum,2015-02-19 00:00:00

0,1
Distinct count,232
Unique (%),1.1%
Missing (%),97.5%
Missing (n),21103
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-02-01 00:00:00
Maximum,2015-01-27 00:00:00

0,1
Distinct count,305
Unique (%),1.4%
Missing (%),94.5%
Missing (n),20459
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-02-01 00:00:00
Maximum,2015-03-04 00:00:00

0,1
Distinct count,243
Unique (%),1.1%
Missing (%),97.7%
Missing (n),21163
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-05 00:00:00
Maximum,2015-01-14 00:00:00

0,1
Distinct count,314
Unique (%),1.5%
Missing (%),94.6%
Missing (n),20480
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-25 00:00:00
Maximum,2015-01-08 00:00:00

0,1
Distinct count,462
Unique (%),2.1%
Missing (%),83.9%
Missing (n),18169
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-14 00:00:00
Maximum,2014-12-22 00:00:00

0,1
Distinct count,14854
Unique (%),68.6%
Missing (%),0.2%
Missing (n),49
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1902-08-21 00:00:00
Maximum,2013-12-30 00:00:00

0,1
Distinct count,365
Unique (%),1.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-01 00:00:00
Maximum,2013-12-31 00:00:00

0,1
Distinct count,191
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-08 00:00:00
Maximum,2015-03-04 00:00:00

0,1
Distinct count,175
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-08 00:00:00
Maximum,2015-02-24 00:00:00

0,1
Distinct count,436
Unique (%),2.0%
Missing (%),3.9%
Missing (n),848
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-01 00:00:00
Maximum,2015-02-05 00:00:00

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),23.2%
Missing (n),5030

0,1
9,4856
2,4141
1,2876
Other values (3),4748
(Missing),5030

Value,Count,Frequency (%),Unnamed: 3
9,4856,22.4%,
2,4141,19.1%,
1,2876,13.3%,
3,2576,11.9%,
4,1669,7.7%,
5,503,2.3%,
(Missing),5030,23.2%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),23.4%
Missing (n),5060

0,1
1,4891
9,4840
0,2874
Other values (4),3986
(Missing),5060

Value,Count,Frequency (%),Unnamed: 3
1,4891,22.6%,
9,4840,22.4%,
0,2874,13.3%,
2,2027,9.4%,
3,1457,6.7%,
5,420,1.9%,
4,82,0.4%,
(Missing),5060,23.4%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.7%
Missing (n),21158

0,1
4,187
3,117
5,63
Other values (4),126
(Missing),21158

Value,Count,Frequency (%),Unnamed: 3
4,187,0.9%,
3,117,0.5%,
5,63,0.3%,
9,56,0.3%,
0,27,0.1%,
2,26,0.1%,
1,17,0.1%,
(Missing),21158,97.7%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.9%
Missing (n),21189

0,1
3,166
2,130
9,55
Other values (4),111
(Missing),21189

Value,Count,Frequency (%),Unnamed: 3
3,166,0.8%,
2,130,0.6%,
9,55,0.3%,
5,48,0.2%,
1,32,0.1%,
0,17,0.1%,
4,14,0.1%,
(Missing),21189,97.9%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),12.1%
Missing (n),2615

0,1
2,6773
1,5095
3,4205
Other values (3),2963
(Missing),2615

Value,Count,Frequency (%),Unnamed: 3
2,6773,31.3%,
1,5095,23.5%,
3,4205,19.4%,
9,1504,6.9%,
4,1091,5.0%,
5,368,1.7%,
(Missing),2615,12.1%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),21623

0,1
1,17
9,7
2,4
(Missing),21623

Value,Count,Frequency (%),Unnamed: 3
1,17,0.1%,
9,7,0.0%,
2,4,0.0%,
(Missing),21623,99.9%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),82.8%
Missing (n),17933

0,1
1,2820
2,450
9,196
Other values (2),252
(Missing),17933

Value,Count,Frequency (%),Unnamed: 3
1,2820,13.0%,
2,450,2.1%,
9,196,0.9%,
4,172,0.8%,
3,80,0.4%,
(Missing),17933,82.8%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),82.6%
Missing (n),17886

0,1
3,1149
6,880
1,594
Other values (6),1142
(Missing),17886

Value,Count,Frequency (%),Unnamed: 3
3,1149,5.3%,
6,880,4.1%,
1,594,2.7%,
4,526,2.4%,
8,294,1.4%,
2,193,0.9%,
7,94,0.4%,
5,33,0.2%,
9,2,0.0%,
(Missing),17886,82.6%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.8%
Missing (n),21178

0,1
5,130
2,100
4,94
Other values (4),149
(Missing),21178

Value,Count,Frequency (%),Unnamed: 3
5,130,0.6%,
2,100,0.5%,
4,94,0.4%,
3,90,0.4%,
1,34,0.2%,
9,22,0.1%,
6,3,0.0%,
(Missing),21178,97.8%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.7%
Missing (n),21147

0,1
1,446
2,43
9,12
(Missing),21147

Value,Count,Frequency (%),Unnamed: 3
1,446,2.1%,
2,43,0.2%,
9,12,0.1%,
3,3,0.0%,
(Missing),21147,97.7%,

0,1
Distinct count,1160
Unique (%),5.4%
Missing (%),12.4%
Missing (n),2681
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1197.693
Minimum,0.0
Maximum,2359.0
Zeros (%),0.3%

0,1
Minimum,0.0
5-th percentile,125.0
Q1,630.0
Median,1200.0
Q3,1800.0
95-th percentile,2240.0
Maximum,2359.0
Range,2359.0
Interquartile range,1170.0

0,1
Standard deviation,675.8974
Coef of variation,0.5643328
Kurtosis,-1.1664042
Mean,1197.693
MAD,585.28033
Skewness,0.008757466
Sum,22720236.0
Variance,456837.28
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,275,1.3%,
500.0,228,1.1%,
1600.0,228,1.1%,
900.0,222,1.0%,
800.0,217,1.0%,
700.0,214,1.0%,
1000.0,203,0.9%,
1700.0,202,0.9%,
1200.0,199,0.9%,
2200.0,199,0.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,57,0.3%,
1.0,4,0.0%,
2.0,5,0.0%,
3.0,1,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2355.0,20,0.1%,
2356.0,1,0.0%,
2357.0,3,0.0%,
2358.0,3,0.0%,
2359.0,3,0.0%,

0,1
Distinct count,189
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,456.73752
Minimum,1.0
Maximum,999.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,416.0
Q1,448.0
Median,466.0
Q3,480.0
95-th percentile,492.0
Maximum,999.0
Range,998.0
Interquartile range,32.0

0,1
Standard deviation,50.991234
Coef of variation,0.111642316
Kurtosis,34.94491
Mean,456.73752
MAD,26.00371
Skewness,-3.198602
Sum,9888824.0
Variance,2600.106
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
482.0,482,2.2%,
483.0,466,2.2%,
477.0,458,2.1%,
480.0,452,2.1%,
481.0,448,2.1%,
478.0,445,2.1%,
476.0,445,2.1%,
484.0,429,2.0%,
479.0,421,1.9%,
473.0,416,1.9%,

Value,Count,Frequency (%),Unnamed: 3
1.0,7,0.0%,
3.0,1,0.0%,
5.0,3,0.0%,
6.0,1,0.0%,
10.0,6,0.0%,

Value,Count,Frequency (%),Unnamed: 3
507.0,6,0.0%,
508.0,8,0.0%,
509.0,1,0.0%,
510.0,2,0.0%,
999.0,18,0.1%,

0,1
Distinct count,33
Unique (%),0.2%
Missing (%),97.9%
Missing (n),21189
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,27.469696
Minimum,13.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,13.0
5-th percentile,16.0
Q1,20.0
Median,27.0
Q3,32.0
95-th percentile,39.0
Maximum,99.0
Range,86.0
Interquartile range,12.0

0,1
Standard deviation,10.9244175
Coef of variation,0.3976898
Kurtosis,21.620176
Mean,27.469696
MAD,7.0413227
Skewness,3.6009922
Sum,12691.0
Variance,119.342896
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
17.0,25,0.1%,
29.0,24,0.1%,
20.0,22,0.1%,
25.0,22,0.1%,
19.0,21,0.1%,
32.0,21,0.1%,
30.0,21,0.1%,
28.0,21,0.1%,
21.0,21,0.1%,
34.0,20,0.1%,

Value,Count,Frequency (%),Unnamed: 3
13.0,1,0.0%,
14.0,7,0.0%,
15.0,10,0.0%,
16.0,16,0.1%,
17.0,25,0.1%,

Value,Count,Frequency (%),Unnamed: 3
40.0,5,0.0%,
41.0,3,0.0%,
42.0,5,0.0%,
43.0,3,0.0%,
99.0,6,0.0%,

0,1
Distinct count,1028
Unique (%),4.7%
Missing (%),2.2%
Missing (n),473

0,1
*A419,3304
*R688,1257
*R092,1242
Other values (1024),15375

Value,Count,Frequency (%),Unnamed: 3
*A419,3304,15.3%,
*R688,1257,5.8%,
*R092,1242,5.7%,
*I219,1134,5.2%,
*J969,1055,4.9%,
*J81X,894,4.1%,
*J960,880,4.1%,
*R570,608,2.8%,
*T792,542,2.5%,
*S069,464,2.1%,

0,1
Distinct count,1505
Unique (%),7.0%
Missing (%),16.6%
Missing (n),3595

0,1
*J189,1495
*A419,916
*I10X,745
Other values (1501),14900
(Missing),3595

Value,Count,Frequency (%),Unnamed: 3
*J189,1495,6.9%,
*A419,916,4.2%,
*I10X,745,3.4%,
*I219,736,3.4%,
*S069,498,2.3%,
*I500,371,1.7%,
*J180,287,1.3%,
*J159,277,1.3%,
*N390,253,1.2%,
*X954,244,1.1%,

0,1
Distinct count,1464
Unique (%),6.8%
Missing (%),42.4%
Missing (n),9180

0,1
*I10X,1031
*J189,526
*J449,294
Other values (1460),10620
(Missing),9180

Value,Count,Frequency (%),Unnamed: 3
*I10X,1031,4.8%,
*J189,526,2.4%,
*J449,294,1.4%,
*E149,284,1.3%,
*X954,274,1.3%,
*I251,232,1.1%,
*I500,225,1.0%,
*I64X,215,1.0%,
*I709,210,1.0%,
*I219,209,1.0%,

0,1
Distinct count,987
Unique (%),4.6%
Missing (%),74.2%
Missing (n),16072

0,1
*I10X,841
*E149,259
*F102,223
Other values (983),4256
(Missing),16072

Value,Count,Frequency (%),Unnamed: 3
*I10X,841,3.9%,
*E149,259,1.2%,
*F102,223,1.0%,
*J449,119,0.5%,
*I694,109,0.5%,
*G309,106,0.5%,
*F172,101,0.5%,
*I709,97,0.4%,
*J189,94,0.4%,
*N189,90,0.4%,

0,1
Distinct count,2348
Unique (%),10.8%
Missing (%),67.1%
Missing (n),14535

0,1
*I10X,676
*E149,299
*I10X*E149,211
Other values (2344),5930
(Missing),14535

Value,Count,Frequency (%),Unnamed: 3
*I10X,676,3.1%,
*E149,299,1.4%,
*I10X*E149,211,1.0%,
*F172,167,0.8%,
*F102,161,0.7%,
*R54X,145,0.7%,
*E149*I10,137,0.6%,
*G309,119,0.5%,
*N189,117,0.5%,
*N179,109,0.5%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,14621
3,3636
4,1726
Other values (3),1668

Value,Count,Frequency (%),Unnamed: 3
1,14621,67.5%,
3,3636,16.8%,
4,1726,8.0%,
5,872,4.0%,
2,739,3.4%,
9,57,0.3%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21103

0,1
3,513
9,35
(Missing),21103

Value,Count,Frequency (%),Unnamed: 3
3,513,2.4%,
9,35,0.2%,
(Missing),21103,97.5%,

0,1
Distinct count,27
Unique (%),0.1%
Missing (%),90.5%
Missing (n),19588

0,1
800,1974
190,24
832,22
Other values (23),43
(Missing),19588

Value,Count,Frequency (%),Unnamed: 3
800,1974,9.1%,
190,24,0.1%,
832,22,0.1%,
125,8,0.0%,
999,5,0.0%,
186,3,0.0%,
77,3,0.0%,
8,3,0.0%,
135,2,0.0%,
16,2,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),4.5%
Missing (n),983

0,1
2,13880
1,6217
9,571
(Missing),983

Value,Count,Frequency (%),Unnamed: 3
2,13880,64.1%,
1,6217,28.7%,
9,571,2.6%,
(Missing),983,4.5%,

0,1
Distinct count,341
Unique (%),1.6%
Missing (%),92.0%
Missing (n),19911
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,114.18563
Minimum,12.0
Maximum,750.0
Zeros (%),0.0%

0,1
Minimum,12.0
5-th percentile,34.0
Q1,58.75
Median,88.0
Q3,128.0
95-th percentile,312.05
Maximum,750.0
Range,738.0
Interquartile range,69.25

0,1
Standard deviation,91.59676
Coef of variation,0.80217415
Kurtosis,9.184097
Mean,114.18563
MAD,61.07897
Skewness,2.5723758
Sum,198683.0
Variance,8389.967
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
61.0,25,0.1%,
90.0,24,0.1%,
65.0,24,0.1%,
49.0,23,0.1%,
38.0,20,0.1%,
64.0,19,0.1%,
55.0,19,0.1%,
112.0,18,0.1%,
59.0,18,0.1%,
67.0,17,0.1%,

Value,Count,Frequency (%),Unnamed: 3
12.0,1,0.0%,
14.0,2,0.0%,
15.0,1,0.0%,
16.0,2,0.0%,
17.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
683.0,1,0.0%,
694.0,1,0.0%,
704.0,1,0.0%,
723.0,1,0.0%,
750.0,1,0.0%,

0,1
Distinct count,259
Unique (%),1.2%
Missing (%),98.8%
Missing (n),21393

0,1
62108346,1
62123006,1
62129850,1
Other values (255),255
(Missing),21393

Value,Count,Frequency (%),Unnamed: 3
62108346,1,0.0%,
62123006,1,0.0%,
62129850,1,0.0%,
62132080,1,0.0%,
59856646,1,0.0%,
64331069,1,0.0%,
62107350,1,0.0%,
62097672,1,0.0%,
62121726,1,0.0%,
64314040,1,0.0%,

First 3 values
19179259
18733835
18729927

Last 3 values
18725305
19113795
19129079

Value,Count,Frequency (%),Unnamed: 3
6374031,1,0.0%,
6374032,1,0.0%,
8578075,1,0.0%,
8578076,1,0.0%,
8581617,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
20952192,1,0.0%,
20968012,1,0.0%,
20992970,1,0.0%,
21064301,1,0.0%,
21064428,1,0.0%,

0,1
Distinct count,11
Unique (%),0.1%
Missing (%),0.0%
Missing (n),7

0,1
0,3914
8,1996
9,1992
Other values (7),13742

Value,Count,Frequency (%),Unnamed: 3
0,3914,18.1%,
8,1996,9.2%,
9,1992,9.2%,
6,1988,9.2%,
2,1986,9.2%,
5,1983,9.2%,
7,1974,9.1%,
1,1946,9.0%,
3,1939,9.0%,
4,1926,8.9%,

0,1
Distinct count,18043
Unique (%),83.3%
Missing (%),0.9%
Missing (n),190

0,1
3124,5
4998,5
3073,5
Other values (18039),21446
(Missing),190

Value,Count,Frequency (%),Unnamed: 3
3124,5,0.0%,
4998,5,0.0%,
3073,5,0.0%,
4925,5,0.0%,
4942,5,0.0%,
4973,5,0.0%,
3113,5,0.0%,
5016,5,0.0%,
531,5,0.0%,
3058,5,0.0%,

0,1
Distinct count,1719
Unique (%),7.9%
Missing (%),92.1%
Missing (n),19932

0,1
000000000000000,2
898003900525333,1
206439796750005,1
Other values (1715),1715
(Missing),19932

Value,Count,Frequency (%),Unnamed: 3
000000000000000,2,0.0%,
898003900525333,1,0.0%,
206439796750005,1,0.0%,
898050074623089,1,0.0%,
898002720307787,1,0.0%,
209663495840002,1,0.0%,
309518655810004,1,0.0%,
204022540520001,1,0.0%,
898003210327752,1,0.0%,
201358477580004,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),92.4%
Missing (n),20015

0,1
2,1180
9,438
1,18
(Missing),20015

Value,Count,Frequency (%),Unnamed: 3
2,1180,5.5%,
9,438,2.0%,
1,18,0.1%,
(Missing),20015,92.4%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.7%
Missing (n),21152

0,1
3,479
9,20
(Missing),21152

Value,Count,Frequency (%),Unnamed: 3
3,479,2.2%,
9,20,0.1%,
(Missing),21152,97.7%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),92.4%
Missing (n),20014

0,1
3,1163
9,438
2,18
(Missing),20014

Value,Count,Frequency (%),Unnamed: 3
3,1163,5.4%,
9,438,2.0%,
2,18,0.1%,
1,18,0.1%,
(Missing),20014,92.4%,

0,1
Distinct count,570
Unique (%),2.6%
Missing (%),22.8%
Missing (n),4936

0,1
999993,6278
999992,2598
621005,2180
Other values (566),5659
(Missing),4936

Value,Count,Frequency (%),Unnamed: 3
999993,6278,29.0%,
999992,2598,12.0%,
621005,2180,10.1%,
715210,603,2.8%,
999991,358,1.7%,
611005,268,1.2%,
141410,235,1.1%,
782305,196,0.9%,
512105,191,0.9%,
622020,183,0.8%,

0,1
Distinct count,85
Unique (%),0.4%
Missing (%),98.3%
Missing (n),21274

0,1
999992,175
999991,31
621005,16
Other values (81),155
(Missing),21274

Value,Count,Frequency (%),Unnamed: 3
999992,175,0.8%,
999991,31,0.1%,
621005,16,0.1%,
411010,9,0.0%,
231205,6,0.0%,
516110,6,0.0%,
521110,6,0.0%,
521130,6,0.0%,
512105,5,0.0%,
512120,5,0.0%,

0,1
Constant value,1

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.7%
Missing (n),21148

0,1
2,272
1,215
9,16
(Missing),21148

Value,Count,Frequency (%),Unnamed: 3
2,272,1.3%,
1,215,1.0%,
9,16,0.1%,
(Missing),21148,97.7%,

0,1
Distinct count,341
Unique (%),1.6%
Missing (%),97.8%
Missing (n),21182
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1798.6013
Minimum,270.0
Maximum,5300.0
Zeros (%),0.0%

0,1
Minimum,270.0
5-th percentile,550.0
Q1,875.0
Median,1540.0
Q3,2650.0
95-th percentile,3720.0
Maximum,5300.0
Range,5030.0
Interquartile range,1775.0

0,1
Standard deviation,1068.3523
Coef of variation,0.5939906
Kurtosis,-0.7008948
Mean,1798.6013
MAD,919.6671
Skewness,0.58840954
Sum,843544.0
Variance,1141376.5
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
900.0,7,0.0%,
645.0,5,0.0%,
2800.0,5,0.0%,
970.0,4,0.0%,
1010.0,4,0.0%,
580.0,4,0.0%,
2270.0,4,0.0%,
880.0,4,0.0%,
2300.0,4,0.0%,
2775.0,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
270.0,1,0.0%,
360.0,1,0.0%,
383.0,1,0.0%,
400.0,1,0.0%,
425.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4210.0,1,0.0%,
4230.0,1,0.0%,
4250.0,1,0.0%,
4910.0,1,0.0%,
5300.0,1,0.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),98.1%
Missing (n),21239
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,6.6432037
Minimum,0.0
Maximum,99.0
Zeros (%),1.3%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,0.0
Median,0.0
Q3,1.0
95-th percentile,99.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,24.01138
Coef of variation,3.6144276
Kurtosis,11.032694
Mean,6.6432037
MAD,11.656683
Skewness,3.6002877
Sum,2737.0
Variance,576.5463
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
0.0,274,1.3%,
1.0,79,0.4%,
99.0,26,0.1%,
2.0,21,0.1%,
3.0,8,0.0%,
5.0,2,0.0%,
4.0,2,0.0%,
(Missing),21239,98.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,274,1.3%,
1.0,79,0.4%,
2.0,21,0.1%,
3.0,8,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2.0,21,0.1%,
3.0,8,0.0%,
4.0,2,0.0%,
5.0,2,0.0%,
99.0,26,0.1%,

0,1
Distinct count,12
Unique (%),0.1%
Missing (%),97.9%
Missing (n),21206
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,5.7685394
Minimum,0.0
Maximum,99.0
Zeros (%),0.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,1.0
Median,1.0
Q3,2.0
95-th percentile,7.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,19.770712
Coef of variation,3.427334
Kurtosis,18.431414
Mean,5.7685394
MAD,8.015311
Skewness,4.4955764
Sum,2567.0
Variance,390.881
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
1.0,154,0.7%,
0.0,99,0.5%,
2.0,84,0.4%,
3.0,42,0.2%,
99.0,19,0.1%,
4.0,19,0.1%,
5.0,15,0.1%,
6.0,7,0.0%,
7.0,4,0.0%,
9.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,99,0.5%,
1.0,154,0.7%,
2.0,84,0.4%,
3.0,42,0.2%,
4.0,19,0.1%,

Value,Count,Frequency (%),Unnamed: 3
6.0,7,0.0%,
7.0,4,0.0%,
8.0,1,0.0%,
9.0,1,0.0%,
99.0,19,0.1%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),11.6%
Missing (n),2509

0,1
1,8798
4,8443
2,1851
Other values (2),50
(Missing),2509

Value,Count,Frequency (%),Unnamed: 3
1,8798,40.6%,
4,8443,39.0%,
2,1851,8.5%,
3,28,0.1%,
5,22,0.1%,
(Missing),2509,11.6%,

0,1
Distinct count,32
Unique (%),0.1%
Missing (%),97.8%
Missing (n),21180
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,34.203823
Minimum,0.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,21.0
Q1,27.0
Median,32.0
Q3,38.0
95-th percentile,42.0
Maximum,99.0
Range,99.0
Interquartile range,11.0

0,1
Standard deviation,16.216515
Coef of variation,0.4741141
Kurtosis,9.563933
Mean,34.203823
MAD,8.946353
Skewness,2.7155154
Sum,16110.0
Variance,262.97537
Memory size,84.7 KiB

Value,Count,Frequency (%),Unnamed: 3
39.0,38,0.2%,
38.0,34,0.2%,
28.0,34,0.2%,
26.0,32,0.1%,
40.0,31,0.1%,
25.0,22,0.1%,
99.0,22,0.1%,
32.0,22,0.1%,
30.0,21,0.1%,
36.0,20,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,3,0.0%,
1.0,3,0.0%,
2.0,3,0.0%,
3.0,2,0.0%,
5.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
39.0,38,0.2%,
40.0,31,0.1%,
41.0,11,0.1%,
42.0,3,0.0%,
99.0,22,0.1%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),90.6%
Missing (n),19613

0,1
4,753
3,284
5,235
Other values (5),766
(Missing),19613

Value,Count,Frequency (%),Unnamed: 3
4,753,3.5%,
3,284,1.3%,
5,235,1.1%,
8,209,1.0%,
2,206,1.0%,
1,128,0.6%,
7,115,0.5%,
6,108,0.5%,
(Missing),19613,90.6%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),99.5%
Missing (n),21535

0,1
3,29
8,20
5,16
Other values (5),51
(Missing),21535

Value,Count,Frequency (%),Unnamed: 3
3,29,0.1%,
8,20,0.1%,
5,16,0.1%,
7,15,0.1%,
6,13,0.1%,
1,12,0.1%,
4,7,0.0%,
2,4,0.0%,
(Missing),21535,99.5%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,12782
2,8863
0,6

Value,Count,Frequency (%),Unnamed: 3
1,12782,59.0%,
2,8863,40.9%,
0,6,0.0%,

0,1
Constant value,0.0

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
Mean,0.99870676

0,1
1.0,21623
0.0,28

Value,Count,Frequency (%),Unnamed: 3
1.0,21623,99.9%,
0.0,28,0.1%,

0,1
Constant value,2

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),92.4%
Missing (n),20015

0,1
8,1144
9,438
5,18
Other values (3),36
(Missing),20015

Value,Count,Frequency (%),Unnamed: 3
8,1144,5.3%,
9,438,2.0%,
5,18,0.1%,
4,18,0.1%,
1,13,0.1%,
2,5,0.0%,
(Missing),20015,92.4%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),94.5%
Missing (n),20459

0,1
9,935
8,216
5,16
Other values (5),25
(Missing),20459

Value,Count,Frequency (%),Unnamed: 3
9,935,4.3%,
8,216,1.0%,
5,16,0.1%,
6,11,0.1%,
1,9,0.0%,
4,3,0.0%,
7,1,0.0%,
3,1,0.0%,
(Missing),20459,94.5%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),1.4%
Missing (n),313

0,1
N,17537
S,3801
(Missing),313

Value,Count,Frequency (%),Unnamed: 3
N,17537,81.0%,
S,3801,17.6%,
(Missing),313,1.4%,

0,1
Distinct count,21651
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,10826
Minimum,1
Maximum,21651
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,1083.5
Q1,5413.5
Median,10826.0
Q3,16238.0
95-th percentile,20568.0
Maximum,21651.0
Range,21650.0
Interquartile range,10825.0

0,1
Standard deviation,6250.2
Coef of variation,0.57734
Kurtosis,-1.2
Mean,10826
MAD,5412.7
Skewness,0
Sum,234393726
Variance,39066000
Memory size,169.2 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,1,0.0%,
2708,1,0.0%,
4743,1,0.0%,
19084,1,0.0%,
17037,1,0.0%,
21135,1,0.0%,
10896,1,0.0%,
8849,1,0.0%,
14994,1,0.0%,
12947,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,1,0.0%,
2,1,0.0%,
3,1,0.0%,
4,1,0.0%,
5,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
21647,1,0.0%,
21648,1,0.0%,
21649,1,0.0%,
21650,1,0.0%,
21651,1,0.0%,

Unnamed: 0.1,ACIDTRAB,ASSISTMED,ATESTANTE,CAUSABAS,CAUSABAS_O,CAUSAMAT,CIRCOBITO,CIRURGIA,CODCART,CODESTAB,CODINST,CODMUNCART,CODMUNOCOR,CODMUNRES,COMUNSVOIM,DIFDATA,DTATESTADO,DTCADASTRO,DTCADINF,DTCADINV,DTCONCASO,DTCONINV,DTINVESTIG,DTNASC,DTOBITO,DTRECEBIM,DTRECORIG,DTREGCART,ESC,ESC2010,ESCMAE,ESCMAE2010,ESTCIV,EXAME,FONTE,FONTEINV,GESTACAO,GRAVIDEZ,HORAOBITO,IDADE,IDADEMAE,LINHAA,LINHAB,LINHAC,LINHAD,LINHAII,LOCOCOR,MORTEPARTO,NATURAL,NECROPSIA,NUDIASOBIN,NUMERODN,NUMERODO,NUMERODV,NUMREGCART,NUMSUS,OBITOGRAV,OBITOPARTO,OBITOPUERP,OCUP,OCUPMAE,ORIGEM,PARTO,PESO,QTDFILMORT,QTDFILVIVO,RACACOR,SEMAGESTAC,SERIESCFAL,SERIESCMAE,SEXO,STDOEPIDEM,STDONOVA,TIPOBITO,TPMORTEOCO,TPOBITOCOR,TPPOS,Unnamed: 0
0,,1,1,I110,I110,,,2,2,,MES3205300001,320530,320530,320530,,79.0,2013-01-02,2013-03-06,NaT,NaT,NaT,NaT,NaT,1917-06-06,2013-01-02,2013-03-22,2013-03-22,2013-01-02,1,,,,3,1,,,,,1440.0,495.0,,*I509,*I10X,,,*E119*N179,3,,832,2,,,6374031,,6249,,,,,512120.0,,1,,,,,2,,,,2,0.0,0.0,2,,,N,1
1,,1,2,C349,C349,,,2,2,11835.0,MES3205300001,320530,320530,320530,,71.0,2013-01-10,2013-03-06,NaT,NaT,NaT,NaT,NaT,1932-05-01,2013-01-10,2013-03-22,2013-03-22,2013-01-10,9,,,,2,1,,,,,1410.0,480.0,,*A419,*J159,*C349,,*I10X*L89,2,,832,2,,,6374032,,6253,,,,,141410.0,,1,,,,,1,,,,1,0.0,0.0,2,,,N,2
2,,9,1,C490,C490,,,2,1,,MES3205300001,320530,320530,320530,,101.0,2013-03-20,2013-05-28,NaT,NaT,NaT,NaT,NaT,1915-04-26,2013-03-19,2013-06-28,2013-06-28,2013-03-20,2,,,,3,1,,,,,2320.0,497.0,,*R688,*R092,*C490,,,3,,832,2,,,8578075,,91062,,,,,999993.0,,1,,,,,4,,,,1,0.0,0.0,2,,,N,3
3,,1,1,I219,I219,,,2,4,,MES3205300001,320530,320530,320530,,75.0,2013-04-14,2013-06-13,NaT,NaT,NaT,NaT,NaT,1925-09-08,2013-04-14,2013-06-28,2013-06-28,2013-04-14,9,,,,2,1,,,,,,487.0,,*R092,*I219,*I500,,,3,,832,2,,,8578076,,4005,,,,,999993.0,,1,,,,,1,,,,1,0.0,0.0,2,,,N,4
4,,9,1,I259,I259,,,9,2,,MES3205300001,320530,320530,320530,,59.0,2013-03-19,2013-05-13,NaT,NaT,NaT,NaT,NaT,1950-08-24,2013-03-19,2013-05-17,2013-05-17,2013-03-20,9,,,,1,9,,,,,1745.0,462.0,,*J81X,*I259,*I10X,,,3,,800,9,,,8581617,,6294,,,,,,,1,,,,,4,,,,1,0.0,0.0,2,,,N,5


### SIM DOES2014 `df_sim_does2014_raw`

In [7]:
# Show the 2014 SIM profile object with IPython's rich display.
# NOTE(review): `pf_sim_does2014_raw` is not defined in this visible cell source;
# presumably it is the ProfileReport returned by `load_resource_df_pf` -- confirm
# it is created (and `df_sim_does2014_raw` stored) before this call on a fresh kernel.
display(pf_sim_does2014_raw)

Stored 'df_sim_does2014_raw' (DataFrame)


0,1
Number of variables,93
Number of observations,22030
Total Missing (%),49.0%
Total size in memory,7.4 MiB
Average record size in memory,353.1 B

0,1
Numeric,12
Categorical,63
Boolean,1
Date,10
Text (Unique),0
Rejected,7
Unsupported,0

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),92.3%
Missing (n),20344

0,1
9,1040
2,563
1,83
(Missing),20344

Value,Count,Frequency (%),Unnamed: 3
9,1040,4.7%,
2,563,2.6%,
1,83,0.4%,
(Missing),20344,92.3%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.6%
Missing (n),21497

0,1
2,450
1,83
(Missing),21497

Value,Count,Frequency (%),Unnamed: 3
2,450,2.0%,
1,83,0.4%,
(Missing),21497,97.6%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),7.8%
Missing (n),1718

0,1
1,13881
9,3348
2,3083
(Missing),1718

Value,Count,Frequency (%),Unnamed: 3
1,13881,63.0%,
9,3348,15.2%,
2,3083,14.0%,
(Missing),1718,7.8%,

0,1
Distinct count,16327
Unique (%),74.1%
Missing (%),0.0%
Missing (n),0

0,1
I219/I10,124
A419/J189,117
I219,114
Other values (16324),21675

Value,Count,Frequency (%),Unnamed: 3
I219/I10,124,0.6%,
A419/J189,117,0.5%,
I219,114,0.5%,
R99,105,0.5%,
C349,103,0.5%,
Y349,88,0.4%,
C159,72,0.3%,
R092/I219,71,0.3%,
S069/X954,68,0.3%,
C509,66,0.3%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.4%
Missing (n),99

0,1
1,6670
2,5197
3,3842
Other values (2),6222

Value,Count,Frequency (%),Unnamed: 3
1,6670,30.3%,
2,5197,23.6%,
3,3842,17.4%,
5,3544,16.1%,
4,2678,12.2%,
(Missing),99,0.4%,

0,1
Distinct count,1525
Unique (%),6.9%
Missing (%),0.0%
Missing (n),0

0,1
I219,1731
X954,743
J189,718
Other values (1522),18838

Value,Count,Frequency (%),Unnamed: 3
I219,1731,7.9%,
X954,743,3.4%,
J189,718,3.3%,
I64,689,3.1%,
E149,530,2.4%,
G309,420,1.9%,
C349,416,1.9%,
I110,414,1.9%,
I694,388,1.8%,
I678,361,1.6%,

0,1
Distinct count,1452
Unique (%),6.6%
Missing (%),0.0%
Missing (n),4

0,1
I219,1720
J189,789
X954,708
Other values (1448),18809

Value,Count,Frequency (%),Unnamed: 3
I219,1720,7.8%,
J189,789,3.6%,
X954,708,3.2%,
I64,679,3.1%,
E149,512,2.3%,
C349,408,1.9%,
G309,405,1.8%,
I110,374,1.7%,
I678,357,1.6%,
I694,350,1.6%,

0,1
Constant value,

0,1
Constant value,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),82.2%
Missing (n),18108

0,1
1,1845
3,1556
9,346
Other values (2),175
(Missing),18108

Value,Count,Frequency (%),Unnamed: 3
1,1845,8.4%,
3,1556,7.1%,
9,346,1.6%,
2,165,0.7%,
4,10,0.0%,
(Missing),18108,82.2%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),99.8%
Missing (n),21991

0,1
2,28
1,11
(Missing),21991

Value,Count,Frequency (%),Unnamed: 3
2,28,0.1%,
1,11,0.0%,
(Missing),21991,99.8%,

0,1
Distinct count,310
Unique (%),1.4%
Missing (%),26.9%
Missing (n),5921

0,1
7257406,1319
0011738,916
2550687,859
Other values (306),13015
(Missing),5921

Value,Count,Frequency (%),Unnamed: 3
7257406,1319,6.0%,
0011738,916,4.2%,
2550687,859,3.9%,
2485680,852,3.9%,
2547821,667,3.0%,
2446030,577,2.6%,
2546957,550,2.5%,
2494442,518,2.4%,
0011746,504,2.3%,
0011819,458,2.1%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
S,22026
N,4

Value,Count,Frequency (%),Unnamed: 3
S,22026,100.0%,
N,4,0.0%,

0,1
Distinct count,90
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
RES3205300001,9696
MES3205300001,3902
MES3205200001,2703
Other values (87),5729

Value,Count,Frequency (%),Unnamed: 3
RES3205300001,9696,44.0%,
MES3205300001,3902,17.7%,
MES3205200001,2703,12.3%,
MES3205000001,2688,12.2%,
MES3201300001,1200,5.4%,
MES3201500001,1197,5.4%,
MES3200600001,361,1.6%,
MRJ3300600001,24,0.1%,
RRJ3304550000,24,0.1%,
MRJ3302200001,19,0.1%,

0,1
Distinct count,878
Unique (%),4.0%
Missing (%),15.7%
Missing (n),3453

0,1
320530,1467
320150,1145
320520,800
Other values (874),15165
(Missing),3453

Value,Count,Frequency (%),Unnamed: 3
320530,1467,6.7%,
320150,1145,5.2%,
320520,800,3.6%,
320120,634,2.9%,
320000,563,2.6%,
320010,547,2.5%,
320320,525,2.4%,
320500,419,1.9%,
320060,407,1.8%,
320490,393,1.8%,

0,1
Distinct count,180
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0

0,1
320530,3913
320520,2708
320500,2692
Other values (177),12717

Value,Count,Frequency (%),Unnamed: 3
320530,3913,17.8%,
320520,2708,12.3%,
320500,2692,12.2%,
320120,2027,9.2%,
320150,1317,6.0%,
320130,1201,5.5%,
320490,1028,4.7%,
320320,903,4.1%,
320090,371,1.7%,
320060,363,1.6%,

0,1
Distinct count,79
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
320520,2575
320500,2284
320130,2230
Other values (76),14941

Value,Count,Frequency (%),Unnamed: 3
320520,2575,11.7%,
320500,2284,10.4%,
320130,2230,10.1%,
320530,2029,9.2%,
320120,1316,6.0%,
320320,821,3.7%,
320150,796,3.6%,
320240,669,3.0%,
320490,576,2.6%,
320060,440,2.0%,

0,1
Distinct count,66
Unique (%),0.3%
Missing (%),70.6%
Missing (n),15552

0,1
320530,4913
320320,592
320120,502
Other values (62),471
(Missing),15552

Value,Count,Frequency (%),Unnamed: 3
320530,4913,22.3%,
320320,592,2.7%,
320120,502,2.3%,
320150,328,1.5%,
320500,22,0.1%,
330240,11,0.0%,
293135,9,0.0%,
330100,9,0.0%,
310620,8,0.0%,
312770,5,0.0%,

0,1
Distinct count,3053
Unique (%),13.9%
Missing (%),0.3%
Missing (n),58

0,1
6507,477
6733,328
6441,273
Other values (3049),20894

Value,Count,Frequency (%),Unnamed: 3
6507,477,2.2%,
6733,328,1.5%,
6441,273,1.2%,
5132,246,1.1%,
4875,235,1.1%,
11809,194,0.9%,
8207,193,0.9%,
9434,192,0.9%,
9370,187,0.8%,
8887,173,0.8%,

0,1
Distinct count,602
Unique (%),2.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,104.01085
Minimum,2.0
Maximum,814.0
Zeros (%),0.0%

0,1
Minimum,2.0
5-th percentile,24.0
Q1,41.0
Median,59.0
Q3,105.0
95-th percentile,386.0
Maximum,814.0
Range,812.0
Interquartile range,64.0

0,1
Standard deviation,112.1081
Coef of variation,1.0778501
Kurtosis,4.308228
Mean,104.01085
MAD,77.989105
Skewness,2.17938
Sum,2291359.0
Variance,12568.227
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
44.0,354,1.6%,
45.0,345,1.6%,
48.0,326,1.5%,
52.0,316,1.4%,
42.0,312,1.4%,
50.0,311,1.4%,
56.0,309,1.4%,
53.0,308,1.4%,
51.0,307,1.4%,
46.0,306,1.4%,

Value,Count,Frequency (%),Unnamed: 3
2.0,1,0.0%,
3.0,1,0.0%,
4.0,2,0.0%,
6.0,3,0.0%,
7.0,5,0.0%,

Value,Count,Frequency (%),Unnamed: 3
754.0,2,0.0%,
777.0,1,0.0%,
780.0,1,0.0%,
799.0,1,0.0%,
814.0,1,0.0%,

0,1
Distinct count,382
Unique (%),1.7%
Missing (%),0.1%
Missing (n),28
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-01 00:00:00
Maximum,2015-09-11 00:00:00

0,1
Distinct count,326
Unique (%),1.5%
Missing (%),1.2%
Missing (n),275
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-10 00:00:00
Maximum,2016-04-18 00:00:00

0,1
Distinct count,230
Unique (%),1.0%
Missing (%),97.3%
Missing (n),21439
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-02-18 00:00:00
Maximum,2015-12-04 00:00:00

0,1
Distinct count,264
Unique (%),1.2%
Missing (%),94.9%
Missing (n),20909
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-02-18 00:00:00
Maximum,2015-10-28 00:00:00

0,1
Constant value,

0,1
Distinct count,290
Unique (%),1.3%
Missing (%),95.0%
Missing (n),20924
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-20 00:00:00
Maximum,2015-10-28 00:00:00

0,1
Distinct count,439
Unique (%),2.0%
Missing (%),84.5%
Missing (n),18609
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-07 00:00:00
Maximum,2016-03-07 00:00:00

0,1
Distinct count,14968
Unique (%),67.9%
Missing (%),0.2%
Missing (n),52
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1901-02-02 00:00:00
Maximum,2014-12-29 00:00:00

0,1
Distinct count,365
Unique (%),1.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-01 00:00:00
Maximum,2014-12-31 00:00:00

0,1
Distinct count,211
Unique (%),1.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-21 00:00:00
Maximum,2016-04-20 00:00:00

0,1
Distinct count,185
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2014-01-21 00:00:00
Maximum,2016-04-19 00:00:00

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),11.7%
Missing (n),2581

0,1
9,4699
2,3960
3,2810
Other values (4),7980

Value,Count,Frequency (%),Unnamed: 3
9,4699,21.3%,
2,3960,18.0%,
3,2810,12.8%,
0,2776,12.6%,
1,2771,12.6%,
4,1873,8.5%,
5,560,2.5%,
(Missing),2581,11.7%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),24.5%
Missing (n),5388

0,1
1,4944
9,4685
0,2766
Other values (4),4247
(Missing),5388

Value,Count,Frequency (%),Unnamed: 3
1,4944,22.4%,
9,4685,21.3%,
0,2766,12.6%,
2,2154,9.8%,
3,1533,7.0%,
5,468,2.1%,
4,92,0.4%,
(Missing),5388,24.5%,

0,1
Distinct count,14
Unique (%),0.1%
Missing (%),24.5%
Missing (n),5388

0,1
09,4685
10,3462
00,2766
Other values (10),5729
(Missing),5388

Value,Count,Frequency (%),Unnamed: 3
09,4685,21.3%,
10,3462,15.7%,
00,2766,12.6%,
11,1324,6.0%,
12,1293,5.9%,
02,989,4.5%,
01,493,2.2%,
03,490,2.2%,
08,468,2.1%,
04,340,1.5%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21470

0,1
4,250
3,133
5,78
Other values (4),99
(Missing),21470

Value,Count,Frequency (%),Unnamed: 3
4,250,1.1%,
3,133,0.6%,
5,78,0.4%,
9,56,0.3%,
2,22,0.1%,
1,12,0.1%,
0,9,0.0%,
(Missing),21470,97.5%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21481

0,1
3,205
2,162
5,61
Other values (4),121
(Missing),21481

Value,Count,Frequency (%),Unnamed: 3
3,205,0.9%,
2,162,0.7%,
5,61,0.3%,
9,56,0.3%,
1,37,0.2%,
4,16,0.1%,
0,12,0.1%,
(Missing),21481,97.5%,

0,1
Distinct count,14
Unique (%),0.1%
Missing (%),97.5%
Missing (n),21481

0,1
12,140
11,69
08,61
Other values (10),279
(Missing),21481

Value,Count,Frequency (%),Unnamed: 3
12,140,0.6%,
11,69,0.3%,
08,61,0.3%,
09,56,0.3%,
03,48,0.2%,
04,45,0.2%,
06,39,0.2%,
05,26,0.1%,
10,17,0.1%,
07,16,0.1%,

0,1
Constant value,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),13.4%
Missing (n),2953

0,1
2,6622
1,5221
3,4416
Other values (3),2818
(Missing),2953

Value,Count,Frequency (%),Unnamed: 3
2,6622,30.1%,
1,5221,23.7%,
3,4416,20.0%,
9,1262,5.7%,
4,1195,5.4%,
5,361,1.6%,
(Missing),2953,13.4%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),99.8%
Missing (n),21994

0,1
1,31
2,5
(Missing),21994

Value,Count,Frequency (%),Unnamed: 3
1,31,0.1%,
2,5,0.0%,
(Missing),21994,99.8%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),83.0%
Missing (n),18274

0,1
1,2106
9,601
2,580
Other values (2),469
(Missing),18274

Value,Count,Frequency (%),Unnamed: 3
1,2106,9.6%,
9,601,2.7%,
2,580,2.6%,
4,303,1.4%,
3,166,0.8%,
(Missing),18274,83.0%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),84.1%
Missing (n),18519

0,1
3,958
6,907
1,698
Other values (6),948
(Missing),18519

Value,Count,Frequency (%),Unnamed: 3
3,958,4.3%,
6,907,4.1%,
1,698,3.2%,
8,378,1.7%,
4,286,1.3%,
2,186,0.8%,
7,67,0.3%,
5,29,0.1%,
9,2,0.0%,
(Missing),18519,84.1%,

0,1
Distinct count,39
Unique (%),0.2%
Missing (%),94.9%
Missing (n),20909

0,1
SXXXXX,244
SSXXXX,102
SXSXXX,102
Other values (35),673
(Missing),20909

Value,Count,Frequency (%),Unnamed: 3
SXXXXX,244,1.1%,
SSXXXX,102,0.5%,
SXSXXX,102,0.5%,
XXXXXS,91,0.4%,
SXXXXS,71,0.3%,
XXSXXX,69,0.3%,
XXXXSX,54,0.2%,
XXXSXX,53,0.2%,
SXXXSX,37,0.2%,
XSXXXX,37,0.2%,

0,1
Distinct count,38
Unique (%),0.2%
Missing (%),0.0%
Missing (n),0

0,1
XXXXXXX,21497
SXSSXXX,95
XXXSXXX,88
Other values (35),350

Value,Count,Frequency (%),Unnamed: 3
XXXXXXX,21497,97.6%,
SXSSXXX,95,0.4%,
XXXSXXX,88,0.4%,
XXSXXXX,81,0.4%,
SXXSXXX,80,0.4%,
SXSXXXX,41,0.2%,
SXXXXXX,26,0.1%,
XXSSXXX,26,0.1%,
XXSXSXX,9,0.0%,
SSSSXXX,8,0.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.4%
Missing (n),21468

0,1
5,167
2,122
4,115
Other values (4),158
(Missing),21468

Value,Count,Frequency (%),Unnamed: 3
5,167,0.8%,
2,122,0.6%,
4,115,0.5%,
3,89,0.4%,
1,50,0.2%,
9,13,0.1%,
6,6,0.0%,
(Missing),21468,97.4%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.3%
Missing (n),21439

0,1
1,530
2,52
9,5
(Missing),21439

Value,Count,Frequency (%),Unnamed: 3
1,530,2.4%,
2,52,0.2%,
9,5,0.0%,
3,4,0.0%,
(Missing),21439,97.3%,

0,1
Distinct count,1284
Unique (%),5.8%
Missing (%),10.7%
Missing (n),2348
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1192.262
Minimum,0.0
Maximum,2359.0
Zeros (%),0.2%

0,1
Minimum,0.0
5-th percentile,120.0
Q1,615.25
Median,1200.0
Q3,1758.0
95-th percentile,2240.0
Maximum,2359.0
Range,2359.0
Interquartile range,1142.8

0,1
Standard deviation,677.50476
Coef of variation,0.5682516
Kurtosis,-1.176195
Mean,1192.262
MAD,587.1828
Skewness,0.0019528033
Sum,23466100.0
Variance,459012.7
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,277,1.3%,
500.0,230,1.0%,
900.0,228,1.0%,
700.0,216,1.0%,
800.0,214,1.0%,
1700.0,211,1.0%,
1000.0,207,0.9%,
1500.0,203,0.9%,
2100.0,202,0.9%,
1600.0,201,0.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,50,0.2%,
1.0,7,0.0%,
2.0,7,0.0%,
3.0,5,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2355.0,41,0.2%,
2356.0,4,0.0%,
2357.0,5,0.0%,
2358.0,3,0.0%,
2359.0,4,0.0%,

0,1
Distinct count,193
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,456.50055
Minimum,1.0
Maximum,999.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,416.0
Q1,448.0
Median,467.0
Q3,481.0
95-th percentile,492.0
Maximum,999.0
Range,998.0
Interquartile range,33.0

0,1
Standard deviation,52.9429
Coef of variation,0.11597555
Kurtosis,32.159122
Mean,456.50055
MAD,26.785627
Skewness,-3.402485
Sum,10056707.0
Variance,2802.9507
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
483.0,477,2.2%,
484.0,463,2.1%,
482.0,461,2.1%,
481.0,459,2.1%,
485.0,452,2.1%,
477.0,448,2.0%,
480.0,434,2.0%,
486.0,434,2.0%,
475.0,431,2.0%,
474.0,431,2.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,5,0.0%,
2.0,1,0.0%,
3.0,3,0.0%,
5.0,7,0.0%,
6.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
508.0,6,0.0%,
509.0,4,0.0%,
510.0,2,0.0%,
512.0,3,0.0%,
999.0,17,0.1%,

0,1
Distinct count,32
Unique (%),0.1%
Missing (%),97.5%
Missing (n),21469
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,26.351158
Minimum,14.0
Maximum,44.0
Zeros (%),0.0%

0,1
Minimum,14.0
5-th percentile,16.0
Q1,20.0
Median,26.0
Q3,31.0
95-th percentile,39.0
Maximum,44.0
Range,30.0
Interquartile range,11.0

0,1
Standard deviation,7.0160303
Coef of variation,0.2662513
Kurtosis,-0.71681464
Mean,26.351158
MAD,5.845819
Skewness,0.3000668
Sum,14783.0
Variance,49.22468
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
26.0,35,0.2%,
20.0,32,0.1%,
24.0,31,0.1%,
30.0,31,0.1%,
19.0,28,0.1%,
25.0,28,0.1%,
29.0,25,0.1%,
22.0,25,0.1%,
27.0,23,0.1%,
18.0,23,0.1%,

Value,Count,Frequency (%),Unnamed: 3
14.0,4,0.0%,
15.0,16,0.1%,
16.0,21,0.1%,
17.0,19,0.1%,
18.0,23,0.1%,

Value,Count,Frequency (%),Unnamed: 3
40.0,6,0.0%,
41.0,5,0.0%,
42.0,5,0.0%,
43.0,3,0.0%,
44.0,2,0.0%,

0,1
Distinct count,1042
Unique (%),4.7%
Missing (%),2.3%
Missing (n),503

0,1
*A419,3683
*R688,1352
*R092,1267
Other values (1038),15225

Value,Count,Frequency (%),Unnamed: 3
*A419,3683,16.7%,
*R688,1352,6.1%,
*R092,1267,5.8%,
*I219,1139,5.2%,
*J969,1046,4.7%,
*J81X,936,4.2%,
*J960,866,3.9%,
*T792,579,2.6%,
*R570,578,2.6%,
*S068,411,1.9%,

0,1
Distinct count,1586
Unique (%),7.2%
Missing (%),15.2%
Missing (n),3354

0,1
*J189,1643
*A419,998
*I219,719
Other values (1582),15316
(Missing),3354

Value,Count,Frequency (%),Unnamed: 3
*J189,1643,7.5%,
*A419,998,4.5%,
*I219,719,3.3%,
*I10X,708,3.2%,
*S069,517,2.3%,
*I500,371,1.7%,
*N390,348,1.6%,
*J180,344,1.6%,
*J159,299,1.4%,
*I509,270,1.2%,

0,1
Distinct count,1563
Unique (%),7.1%
Missing (%),40.5%
Missing (n),8919

0,1
*I10X,972
*J189,544
*X954,376
Other values (1559),11219
(Missing),8919

Value,Count,Frequency (%),Unnamed: 3
*I10X,972,4.4%,
*J189,544,2.5%,
*X954,376,1.7%,
*J449,299,1.4%,
*I251,282,1.3%,
*E149,274,1.2%,
*I64X,242,1.1%,
*I709,227,1.0%,
*I219,212,1.0%,
*N189,204,0.9%,

0,1
Distinct count,1055
Unique (%),4.8%
Missing (%),73.3%
Missing (n),16142

0,1
*I10X,847
*E149,294
*F102,208
Other values (1051),4539
(Missing),16142

Value,Count,Frequency (%),Unnamed: 3
*I10X,847,3.8%,
*E149,294,1.3%,
*F102,208,0.9%,
*I694,111,0.5%,
*J449,109,0.5%,
*G309,107,0.5%,
*F172,104,0.5%,
*I709,95,0.4%,
*I64X,90,0.4%,
*X954,87,0.4%,

0,1
Distinct count,2360
Unique (%),10.7%
Missing (%),66.0%
Missing (n),14544

0,1
*I10X,729
*E149,321
*I10X*E149,244
Other values (2356),6192
(Missing),14544

Value,Count,Frequency (%),Unnamed: 3
*I10X,729,3.3%,
*E149,321,1.5%,
*I10X*E149,244,1.1%,
*F172,187,0.8%,
*R54X,149,0.7%,
*E149*I10,147,0.7%,
*F102,133,0.6%,
*N189,128,0.6%,
*G309,122,0.6%,
*N19X,90,0.4%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,15298
3,3620
4,1704
Other values (3),1408

Value,Count,Frequency (%),Unnamed: 3
1,15298,69.4%,
3,3620,16.4%,
4,1704,7.7%,
2,810,3.7%,
5,530,2.4%,
9,68,0.3%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.6%
Missing (n),21497

0,1
3,522
9,6
1,4
(Missing),21497

Value,Count,Frequency (%),Unnamed: 3
3,522,2.4%,
9,6,0.0%,
1,4,0.0%,
2,1,0.0%,
(Missing),21497,97.6%,

0,1
Distinct count,47
Unique (%),0.2%
Missing (%),8.9%
Missing (n),1971

0,1
832,13773
831,2641
800,1415
Other values (43),2230
(Missing),1971

Value,Count,Frequency (%),Unnamed: 3
832,13773,62.5%,
831,2641,12.0%,
800,1415,6.4%,
829,1005,4.6%,
833,630,2.9%,
835,127,0.6%,
826,76,0.3%,
823,61,0.3%,
827,46,0.2%,
825,35,0.2%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),7.2%
Missing (n),1593

0,1
2,13310
1,6199
9,928
(Missing),1593

Value,Count,Frequency (%),Unnamed: 3
2,13310,60.4%,
1,6199,28.1%,
9,928,4.2%,
(Missing),1593,7.2%,

0,1
Distinct count,236
Unique (%),1.1%
Missing (%),97.3%
Missing (n),21439
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,134.08122
Minimum,17.0
Maximum,607.0
Zeros (%),0.0%

0,1
Minimum,17.0
5-th percentile,43.0
Q1,77.0
Median,108.0
Q3,166.0
95-th percentile,315.0
Maximum,607.0
Range,590.0
Interquartile range,89.0

0,1
Standard deviation,91.67381
Coef of variation,0.6837185
Kurtosis,5.2567425
Mean,134.08122
MAD,65.89674
Skewness,2.0141628
Sum,79242.0
Variance,8404.088
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
108.0,12,0.1%,
120.0,11,0.0%,
85.0,10,0.0%,
113.0,10,0.0%,
112.0,9,0.0%,
101.0,9,0.0%,
87.0,9,0.0%,
109.0,8,0.0%,
100.0,8,0.0%,
81.0,8,0.0%,

Value,Count,Frequency (%),Unnamed: 3
17.0,1,0.0%,
19.0,1,0.0%,
20.0,3,0.0%,
25.0,1,0.0%,
29.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
532.0,1,0.0%,
539.0,1,0.0%,
575.0,1,0.0%,
587.0,1,0.0%,
607.0,1,0.0%,

0,1
Distinct count,276
Unique (%),1.3%
Missing (%),95.0%
Missing (n),20924
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,99.32459
Minimum,0.0
Maximum,406.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,24.0
Q1,53.0
Median,78.0
Q3,122.75
95-th percentile,255.5
Maximum,406.0
Range,406.0
Interquartile range,69.75

0,1
Standard deviation,70.561386
Coef of variation,0.710412
Kurtosis,2.4841764
Mean,99.32459
MAD,52.386734
Skewness,1.5745417
Sum,109853.0
Variance,4978.909
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
63.0,17,0.1%,
55.0,17,0.1%,
84.0,16,0.1%,
52.0,15,0.1%,
58.0,15,0.1%,
81.0,14,0.1%,
100.0,14,0.1%,
60.0,14,0.1%,
77.0,14,0.1%,
79.0,13,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,1,0.0%,
4.0,1,0.0%,
6.0,2,0.0%,
9.0,1,0.0%,
10.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
365.0,1,0.0%,
369.0,1,0.0%,
388.0,1,0.0%,
402.0,1,0.0%,
406.0,1,0.0%,

0,1
Distinct count,286
Unique (%),1.3%
Missing (%),94.9%
Missing (n),20909
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,112.51472
Minimum,14.0
Maximum,543.0
Zeros (%),0.0%

0,1
Minimum,14.0
5-th percentile,38.0
Q1,62.0
Median,87.0
Q3,134.0
95-th percentile,275.0
Maximum,543.0
Range,529.0
Interquartile range,72.0

0,1
Standard deviation,75.24126
Coef of variation,0.6687237
Kurtosis,3.3773875
Mean,112.51472
MAD,55.625195
Skewness,1.7310216
Sum,126129.0
Variance,5661.2466
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
81.0,18,0.1%,
55.0,17,0.1%,
77.0,16,0.1%,
58.0,16,0.1%,
63.0,15,0.1%,
60.0,15,0.1%,
78.0,14,0.1%,
65.0,14,0.1%,
59.0,13,0.1%,
67.0,13,0.1%,

Value,Count,Frequency (%),Unnamed: 3
14.0,2,0.0%,
15.0,1,0.0%,
18.0,1,0.0%,
20.0,1,0.0%,
22.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
406.0,1,0.0%,
417.0,1,0.0%,
428.0,1,0.0%,
511.0,1,0.0%,
543.0,1,0.0%,

0,1
Distinct count,372
Unique (%),1.7%
Missing (%),98.3%
Missing (n),21658

0,1
64290701,2
64304940,1
64340277,1
Other values (368),368
(Missing),21658

Value,Count,Frequency (%),Unnamed: 3
64290701,2,0.0%,
64304940,1,0.0%,
64340277,1,0.0%,
64308642,1,0.0%,
64290280,1,0.0%,
64340602,1,0.0%,
68777744,1,0.0%,
64294972,1,0.0%,
68785053,1,0.0%,
64326412,1,0.0%,

0,1
Distinct count,22029
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0

0,1
19458646,2
20902805,1
18728881,1
Other values (22026),22026

Value,Count,Frequency (%),Unnamed: 3
19458646,2,0.0%,
20902805,1,0.0%,
18728881,1,0.0%,
20916989,1,0.0%,
20908049,1,0.0%,
20905273,1,0.0%,
16748353,1,0.0%,
19130027,1,0.0%,
20907967,1,0.0%,
19157193,1,0.0%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
0,4008
3,2023
9,2022
Other values (7),13977

Value,Count,Frequency (%),Unnamed: 3
0,4008,18.2%,
3,2023,9.2%,
9,2022,9.2%,
5,2012,9.1%,
8,2011,9.1%,
2,2010,9.1%,
1,1995,9.1%,
4,1988,9.0%,
6,1987,9.0%,
7,1974,9.0%,

0,1
Distinct count,129
Unique (%),0.6%
Missing (%),0.0%
Missing (n),0

0,1
20140035,920
20140019,848
20140021,808
Other values (126),19454

Value,Count,Frequency (%),Unnamed: 3
20140035,920,4.2%,
20140019,848,3.8%,
20140021,808,3.7%,
20140034,723,3.3%,
20140009,707,3.2%,
20140023,699,3.2%,
20140013,695,3.2%,
20150005,660,3.0%,
20140011,605,2.7%,
20140016,594,2.7%,

0,1
Distinct count,2886
Unique (%),13.1%
Missing (%),86.9%
Missing (n),19143

0,1
000000000000000,2
700209425752721,2
898003948545725,1
Other values (2882),2882
(Missing),19143

Value,Count,Frequency (%),Unnamed: 3
000000000000000,2,0.0%,
700209425752721,2,0.0%,
898003948545725,1,0.0%,
898003297357098,1,0.0%,
898003476845089,1,0.0%,
898050082853888,1,0.0%,
705004413367354,1,0.0%,
201629643010002,1,0.0%,
898000464654574,1,0.0%,
200392480240002,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),92.4%
Missing (n),20351

0,1
2,1329
9,327
1,23
(Missing),20351

Value,Count,Frequency (%),Unnamed: 3
2,1329,6.0%,
9,327,1.5%,
1,23,0.1%,
(Missing),20351,92.4%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.3%
Missing (n),21429

0,1
3,600
9,1
(Missing),21429

Value,Count,Frequency (%),Unnamed: 3
3,600,2.7%,
9,1,0.0%,
(Missing),21429,97.3%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),92.4%
Missing (n),20351

0,1
3,1298
9,327
1,31
(Missing),20351

Value,Count,Frequency (%),Unnamed: 3
3,1298,5.9%,
9,327,1.5%,
1,31,0.1%,
2,23,0.1%,
(Missing),20351,92.4%,

0,1
Distinct count,511
Unique (%),2.3%
Missing (%),25.6%
Missing (n),5630

0,1
999993,6046
999992,2709
621005,2217
Other values (507),5428
(Missing),5630

Value,Count,Frequency (%),Unnamed: 3
999993,6046,27.4%,
999992,2709,12.3%,
621005,2217,10.1%,
715210,570,2.6%,
999991,336,1.5%,
512105,257,1.2%,
622020,222,1.0%,
141410,198,0.9%,
354705,161,0.7%,
999994,147,0.7%,

0,1
Distinct count,88
Unique (%),0.4%
Missing (%),98.0%
Missing (n),21593

0,1
999992,194
999991,36
621005,20
Other values (84),187
(Missing),21593

Value,Count,Frequency (%),Unnamed: 3
999992,194,0.9%,
999991,36,0.2%,
621005,20,0.1%,
421125,9,0.0%,
521110,7,0.0%,
512105,7,0.0%,
411010,7,0.0%,
252105,6,0.0%,
412205,6,0.0%,
411005,5,0.0%,

0,1
Constant value,1

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.3%
Missing (n),21439

0,1
2,336
1,247
9,8
(Missing),21439

Value,Count,Frequency (%),Unnamed: 3
2,336,1.5%,
1,247,1.1%,
9,8,0.0%,
(Missing),21439,97.3%,

0,1
Distinct count,387
Unique (%),1.8%
Missing (%),97.4%
Missing (n),21458
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1895.2028
Minimum,245.0
Maximum,4550.0
Zeros (%),0.0%

0,1
Minimum,245.0
5-th percentile,462.75
Q1,828.75
Median,1800.0
Q3,2900.0
95-th percentile,3697.2
Maximum,4550.0
Range,4305.0
Interquartile range,2071.2

0,1
Standard deviation,1120.2227
Coef of variation,0.5910833
Kurtosis,-1.1722802
Mean,1895.2028
MAD,993.8973
Skewness,0.30767417
Sum,1084056.0
Variance,1254898.9
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
800.0,7,0.0%,
740.0,5,0.0%,
675.0,5,0.0%,
2000.0,5,0.0%,
2500.0,4,0.0%,
3000.0,4,0.0%,
2920.0,4,0.0%,
495.0,4,0.0%,
1700.0,4,0.0%,
1100.0,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
245.0,1,0.0%,
270.0,1,0.0%,
275.0,1,0.0%,
290.0,1,0.0%,
305.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4300.0,1,0.0%,
4450.0,1,0.0%,
4495.0,1,0.0%,
4500.0,2,0.0%,
4550.0,1,0.0%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),97.8%
Missing (n),21537
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.969574
Minimum,0.0
Maximum,99.0
Zeros (%),1.6%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,0.0
Median,0.0
Q3,1.0
95-th percentile,2.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,15.833389
Coef of variation,5.3318725
Kurtosis,33.174698
Mean,2.969574
MAD,5.073216
Skewness,5.913958
Sum,1464.0
Variance,250.69623
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
0.0,344,1.6%,
1.0,102,0.5%,
2.0,29,0.1%,
99.0,13,0.1%,
3.0,3,0.0%,
4.0,2,0.0%,
(Missing),21537,97.8%,

Value,Count,Frequency (%),Unnamed: 3
0.0,344,1.6%,
1.0,102,0.5%,
2.0,29,0.1%,
3.0,3,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,102,0.5%,
2.0,29,0.1%,
3.0,3,0.0%,
4.0,2,0.0%,
99.0,13,0.1%,

0,1
Distinct count,12
Unique (%),0.1%
Missing (%),97.6%
Missing (n),21491
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.398887
Minimum,0.0
Maximum,99.0
Zeros (%),0.4%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,1.0
Median,1.0
Q3,2.0
95-th percentile,5.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,13.229546
Coef of variation,3.892317
Kurtosis,48.239277
Mean,3.398887
MAD,3.81622
Skewness,7.0349827
Sum,1832.0
Variance,175.02087
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
1.0,219,1.0%,
2.0,113,0.5%,
0.0,96,0.4%,
3.0,47,0.2%,
4.0,30,0.1%,
5.0,15,0.1%,
99.0,10,0.0%,
6.0,6,0.0%,
10.0,1,0.0%,
7.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,96,0.4%,
1.0,219,1.0%,
2.0,113,0.5%,
3.0,47,0.2%,
4.0,30,0.1%,

Value,Count,Frequency (%),Unnamed: 3
6.0,6,0.0%,
7.0,1,0.0%,
8.0,1,0.0%,
10.0,1,0.0%,
99.0,10,0.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),11.9%
Missing (n),2632

0,1
1,8932
4,8481
2,1890
Other values (2),95
(Missing),2632

Value,Count,Frequency (%),Unnamed: 3
1,8932,40.5%,
4,8481,38.5%,
2,1890,8.6%,
3,74,0.3%,
5,21,0.1%,
(Missing),2632,11.9%,

0,1
Distinct count,33
Unique (%),0.1%
Missing (%),97.5%
Missing (n),21470
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,32.596428
Minimum,0.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,21.0
Q1,27.0
Median,33.0
Q3,38.0
95-th percentile,40.0
Maximum,99.0
Range,99.0
Interquartile range,11.0

0,1
Standard deviation,12.904548
Coef of variation,0.3958884
Kurtosis,14.547313
Mean,32.596428
MAD,7.542168
Skewness,2.7137003
Sum,18254.0
Variance,166.52736
Memory size,86.1 KiB

Value,Count,Frequency (%),Unnamed: 3
38.0,50,0.2%,
39.0,40,0.2%,
28.0,36,0.2%,
37.0,35,0.2%,
40.0,34,0.2%,
27.0,32,0.1%,
36.0,28,0.1%,
34.0,25,0.1%,
24.0,25,0.1%,
29.0,24,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,2,0.0%,
1.0,7,0.0%,
2.0,3,0.0%,
3.0,2,0.0%,
4.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
40.0,34,0.2%,
41.0,8,0.0%,
42.0,5,0.0%,
43.0,1,0.0%,
99.0,13,0.1%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),88.4%
Missing (n),19478

0,1
4,989
3,393
8,340
Other values (5),830
(Missing),19478

Value,Count,Frequency (%),Unnamed: 3
4,989,4.5%,
3,393,1.8%,
8,340,1.5%,
5,257,1.2%,
2,175,0.8%,
1,165,0.7%,
6,123,0.6%,
7,110,0.5%,
(Missing),19478,88.4%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),99.2%
Missing (n),21852

0,1
8,45
3,40
5,19
Other values (5),74
(Missing),21852

Value,Count,Frequency (%),Unnamed: 3
8,45,0.2%,
3,40,0.2%,
5,19,0.1%,
1,18,0.1%,
7,17,0.1%,
4,15,0.1%,
6,12,0.1%,
2,12,0.1%,
(Missing),21852,99.2%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,12846
2,9180
0,4

Value,Count,Frequency (%),Unnamed: 3
1,12846,58.3%,
2,9180,41.7%,
0,4,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),4

0,1
S,22026
(Missing),4

Value,Count,Frequency (%),Unnamed: 3
S,22026,100.0%,
(Missing),4,0.0%,

0,1
Constant value,0.0

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
Mean,0.005537903

0,1
0.0,21908
1.0,122

Value,Count,Frequency (%),Unnamed: 3
0.0,21908,99.4%,
1.0,122,0.6%,

0,1
Constant value,2

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),92.4%
Missing (n),20353

0,1
8,1274
9,327
4,31
Other values (4),45
(Missing),20353

Value,Count,Frequency (%),Unnamed: 3
8,1274,5.8%,
9,327,1.5%,
4,31,0.1%,
5,22,0.1%,
1,15,0.1%,
3,4,0.0%,
2,4,0.0%,
(Missing),20353,92.4%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),94.9%
Missing (n),20909

0,1
M,1113
R,4
E,4
(Missing),20909

Value,Count,Frequency (%),Unnamed: 3
M,1113,5.1%,
R,4,0.0%,
E,4,0.0%,
(Missing),20909,94.9%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),94.9%
Missing (n),20909

0,1
9,876
8,182
5,26
Other values (5),37
(Missing),20909

Value,Count,Frequency (%),Unnamed: 3
9,876,4.0%,
8,182,0.8%,
5,26,0.1%,
6,19,0.1%,
1,9,0.0%,
4,7,0.0%,
2,1,0.0%,
3,1,0.0%,
(Missing),20909,94.9%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),1.0%
Missing (n),226

0,1
N,18259
S,3545
(Missing),226

Value,Count,Frequency (%),Unnamed: 3
N,18259,82.9%,
S,3545,16.1%,
(Missing),226,1.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.7%
Missing (n),21967

0,1
1,39
2,20
3,4
(Missing),21967

Value,Count,Frequency (%),Unnamed: 3
1,39,0.2%,
2,20,0.1%,
3,4,0.0%,
(Missing),21967,99.7%,

0,1
Distinct count,22030
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,11016
Minimum,1
Maximum,22030
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,1102.5
Q1,5508.2
Median,11016.0
Q3,16523.0
95-th percentile,20929.0
Maximum,22030.0
Range,22029.0
Interquartile range,11014.0

0,1
Standard deviation,6359.7
Coef of variation,0.57734
Kurtosis,-1.2
Mean,11016
MAD,5507.5
Skewness,0
Sum,242671465
Variance,40445000
Memory size,172.2 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,1,0.0%,
10912,1,0.0%,
12947,1,0.0%,
2708,1,0.0%,
661,1,0.0%,
6806,1,0.0%,
4759,1,0.0%,
19100,1,0.0%,
17053,1,0.0%,
21151,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,1,0.0%,
2,1,0.0%,
3,1,0.0%,
4,1,0.0%,
5,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
22026,1,0.0%,
22027,1,0.0%,
22028,1,0.0%,
22029,1,0.0%,
22030,1,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),11

0,1
3.2,22019
(Missing),11

Value,Count,Frequency (%),Unnamed: 3
3.2,22019,100.0%,
(Missing),11,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
3.2.00,22004
3.2.01,14
3.2.02,12

Value,Count,Frequency (%),Unnamed: 3
3.2.00,22004,99.9%,
3.2.01,14,0.1%,
3.2.02,12,0.1%,

Unnamed: 0.1,ACIDTRAB,ALTCAUSA,ASSISTMED,ATESTADO,ATESTANTE,CAUSABAS,CAUSABAS_O,CAUSAMAT,CB_PRE,CIRCOBITO,CIRURGIA,CODESTAB,CODIFICADO,CODINST,CODMUNNATU,CODMUNOCOR,CODMUNRES,COMUNSVOIM,CRM,DIFDATA,DTATESTADO,DTCADASTRO,DTCADINF,DTCADINV,DTCONCASO,DTCONINV,DTINVESTIG,DTNASC,DTOBITO,DTRECEBIM,DTRECORIGA,ESC,ESC2010,ESCFALAGR1,ESCMAE,ESCMAE2010,ESCMAEAGR1,ESTABDESCR,ESTCIV,EXAME,FONTE,FONTEINV,FONTES,FONTESINF,GESTACAO,GRAVIDEZ,HORAOBITO,IDADE,IDADEMAE,LINHAA,LINHAB,LINHAC,LINHAD,LINHAII,LOCOCOR,MORTEPARTO,NATURAL,NECROPSIA,NUDIASINF,NUDIASOBCO,NUDIASOBIN,NUMERODN,NUMERODO,NUMERODV,NUMEROLOTE,NUMSUS,OBITOGRAV,OBITOPARTO,OBITOPUERP,OCUP,OCUPMAE,ORIGEM,PARTO,PESO,QTDFILMORT,QTDFILVIVO,RACACOR,SEMAGESTAC,SERIESCFAL,SERIESCMAE,SEXO,STCODIFICA,STDOEPIDEM,STDONOVA,TIPOBITO,TPMORTEOCO,TPNIVELINV,TPOBITOCOR,TPPOS,TPRESGINFO,Unnamed: 0,VERSAOSCB,VERSAOSIST
0,,,2,T794 T792/S271/S273/X994,3,X994,X994,,,3.0,,,S,MES3205000001,320530,320500,320500,320530.0,4317,69.0,2014-01-01,2014-01-31,NaT,2014-02-27,NaT,2014-02-17,2014-02-17,1983-07-02,2014-01-01,2014-03-11,2014-02-14,3.0,2.0,11.0,,,,,2,,1.0,1.0,SXXXSX,XXXXXXX,,,,430.0,,*T794*T792,*S271,*S273,*X994,,4,,832,1,,47.0,57.0,,19273053,3,20140005,,2.0,,3.0,999992,,1,,,,,2.0,,,,2,S,0.0,0.0,2,8.0,M,8.0,S,,1,3.2,3.2.00
1,,,2,X700,3,X700,X700,,,2.0,,,S,MES3205300001,320470,320530,320530,320530.0,4312,203.0,2014-01-02,2014-01-16,NaT,2014-03-11,NaT,2014-02-14,2014-02-10,1976-10-30,2014-01-01,2014-07-23,2014-02-14,5.0,5.0,8.0,,,,,1,,1.0,1.0,XXXXSS,XXXXXXX,,,,437.0,,*X700,,,,,3,,832,1,,44.0,69.0,,19273010,0,20140020,,2.0,,3.0,214105,,1,,,,,4.0,,,,2,S,0.0,0.0,2,8.0,M,9.0,S,,2,3.2,3.2.00
2,,,2,S141/X950,3,X950,X950,,,3.0,,,S,MES3205300001,290560,320530,320530,320530.0,4312,190.0,2014-01-02,2014-01-16,NaT,2014-04-30,NaT,2014-01-20,2014-01-20,1986-09-21,2014-01-01,2014-07-10,2014-02-14,3.0,2.0,11.0,,,,,1,,1.0,1.0,XSXXSS,XXXXXXX,,,,427.0,,*S141,*X950,,,,3,,829,1,,19.0,119.0,,19273011,8,20140019,,1.0,,3.0,841420,,1,,,,,4.0,,,,2,S,0.0,0.0,2,1.0,M,1.0,S,2.0,3,3.2,3.2.00
3,,,2,J81/I500/I10*E149,4,I110,I110,,,,,,S,MES3205200001,320010,320520,320520,320530.0,8287,44.0,2014-01-02,2014-01-15,NaT,NaT,NaT,NaT,NaT,1947-02-27,2014-01-01,2014-02-14,2014-02-14,3.0,2.0,11.0,,,,,2,,,,,XXXXXXX,,,1800.0,466.0,,*J81X,*I500,*I10X,,*E149,3,,832,1,,,,,19273240,4,20140002,,,,,910105,,1,,,,,1.0,,,,1,S,0.0,0.0,2,,,,N,,4,3.2,3.2.00
4,,,1,C349,2,C349,C349,,,,,2494442.0,S,MES3205200001,320120,320520,320530,,12014,44.0,2014-01-01,2014-01-15,NaT,NaT,NaT,NaT,NaT,1951-04-29,2014-01-01,2014-02-14,2014-02-14,,,,,,,,1,,,,,XXXXXXX,,,930.0,462.0,,*C349,,,,,1,,832,2,,,,,19273220,0,20140002,,,,,724420,,1,,,,,,,,,1,S,0.0,0.0,2,,,,N,,5,3.2,3.2.00


### SIM DOES2015 `df_sim_does2015_raw`

In [8]:
# Render the rich (HTML) view of the profiling report for the SIM DOES2015 raw data.
# NOTE(review): pf_sim_does2015_raw is presumably the ProfileReport returned by
# load_resource_df_pf for 'sim-does2015-raw-csv' -- confirm against the cell that defines it.
display(pf_sim_does2015_raw)

Stored 'df_sim_does2015_raw' (DataFrame)


0,1
Number of variables,93
Number of observations,22332
Total Missing (%),49.3%
Total size in memory,7.5 MiB
Average record size in memory,352.2 B

0,1
Numeric,10
Categorical,63
Boolean,2
Date,10
Text (Unique),1
Rejected,7
Unsupported,0

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),93.2%
Missing (n),20808

0,1
9,918
2,537
1,69
(Missing),20808

Value,Count,Frequency (%),Unnamed: 3
9,918,4.1%,
2,537,2.4%,
1,69,0.3%,
(Missing),20808,93.2%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.4%
Missing (n),21755

0,1
2,472
1,105
(Missing),21755

Value,Count,Frequency (%),Unnamed: 3
2,472,2.1%,
1,105,0.5%,
(Missing),21755,97.4%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),11.5%
Missing (n),2566

0,1
1,13600
9,3477
2,2689
(Missing),2566

Value,Count,Frequency (%),Unnamed: 3
1,13600,60.9%,
9,3477,15.6%,
2,2689,12.0%,
(Missing),2566,11.5%,

0,1
Distinct count,16481
Unique (%),73.8%
Missing (%),0.0%
Missing (n),0

0,1
R99,137
A419/J189,136
I219/I10,120
Other values (16478),21939

Value,Count,Frequency (%),Unnamed: 3
R99,137,0.6%,
A419/J189,136,0.6%,
I219/I10,120,0.5%,
I219,107,0.5%,
Y349,92,0.4%,
C349,83,0.4%,
C159,68,0.3%,
C169,62,0.3%,
C509,60,0.3%,
R092/I219,59,0.3%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),1.5%
Missing (n),326

0,1
1,6400
2,5341
5,3837
Other values (2),6428

Value,Count,Frequency (%),Unnamed: 3
1,6400,28.7%,
2,5341,23.9%,
5,3837,17.2%,
3,3683,16.5%,
4,2745,12.3%,
(Missing),326,1.5%,

0,1
Distinct count,1494
Unique (%),6.7%
Missing (%),0.0%
Missing (n),0

0,1
I219,1777
J189,770
I64,615
Other values (1491),19170

Value,Count,Frequency (%),Unnamed: 3
I219,1777,8.0%,
J189,770,3.4%,
I64,615,2.8%,
X954,569,2.5%,
E149,559,2.5%,
G309,475,2.1%,
C349,441,2.0%,
I694,406,1.8%,
I678,393,1.8%,
J440,364,1.6%,

0,1
Distinct count,1441
Unique (%),6.5%
Missing (%),0.0%
Missing (n),5

0,1
I219,1768
J189,854
I64,609
Other values (1437),19096

Value,Count,Frequency (%),Unnamed: 3
I219,1768,7.9%,
J189,854,3.8%,
I64,609,2.7%,
E149,552,2.5%,
X954,535,2.4%,
G309,443,2.0%,
C349,439,2.0%,
I678,385,1.7%,
I694,365,1.6%,
J440,354,1.6%,

0,1
Constant value,

0,1
Constant value,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),83.7%
Missing (n),18694

0,1
1,1676
3,1378
9,383
Other values (2),201
(Missing),18694

Value,Count,Frequency (%),Unnamed: 3
1,1676,7.5%,
3,1378,6.2%,
9,383,1.7%,
2,188,0.8%,
4,13,0.1%,
(Missing),18694,83.7%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),100.0%
Missing (n),22327

0,1
2,4
9,1
(Missing),22327

Value,Count,Frequency (%),Unnamed: 3
2,4,0.0%,
9,1,0.0%,
(Missing),22327,100.0%,

0,1
Distinct count,294
Unique (%),1.3%
Missing (%),26.4%
Missing (n),5897

0,1
7257406,1223
2550687,921
0011738,855
Other values (290),13436
(Missing),5897

Value,Count,Frequency (%),Unnamed: 3
7257406,1223,5.5%,
2550687,921,4.1%,
0011738,855,3.8%,
2485680,798,3.6%,
2547821,683,3.1%,
2494442,566,2.5%,
2446030,565,2.5%,
2546957,495,2.2%,
0011746,487,2.2%,
7621442,388,1.7%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),1

0,1
S,22327
N,4
(Missing),1

Value,Count,Frequency (%),Unnamed: 3
S,22327,100.0%,
N,4,0.0%,
(Missing),1,0.0%,

0,1
Distinct count,84
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
RES3205300001,9755
MES3205300001,3992
MES3205200001,2730
Other values (81),5855

Value,Count,Frequency (%),Unnamed: 3
RES3205300001,9755,43.7%,
MES3205300001,3992,17.9%,
MES3205200001,2730,12.2%,
MES3205000001,2718,12.2%,
MES3201500001,1393,6.2%,
MES3201300001,1140,5.1%,
MES3200600001,337,1.5%,
MRJ3302200001,22,0.1%,
RRJ3304550000,20,0.1%,
MRJ3300600001,20,0.1%,

0,1
Distinct count,905
Unique (%),4.1%
Missing (%),14.9%
Missing (n),3336

0,1
320530,1306
320150,1280
320520,712
Other values (901),15698
(Missing),3336

Value,Count,Frequency (%),Unnamed: 3
320530,1306,5.8%,
320150,1280,5.7%,
320520,712,3.2%,
320120,627,2.8%,
320010,556,2.5%,
320000,547,2.4%,
320320,513,2.3%,
320490,421,1.9%,
320500,415,1.9%,
320060,382,1.7%,

0,1
Distinct count,172
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0

0,1
320530,4009
320520,2731
320500,2718
Other values (169),12874

Value,Count,Frequency (%),Unnamed: 3
320530,4009,18.0%,
320520,2731,12.2%,
320500,2718,12.2%,
320120,1936,8.7%,
320150,1421,6.4%,
320130,1140,5.1%,
320490,1124,5.0%,
320320,894,4.0%,
320090,346,1.5%,
320060,338,1.5%,

0,1
Distinct count,79
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
320520,2666
320500,2353
320130,2171
Other values (76),15142

Value,Count,Frequency (%),Unnamed: 3
320520,2666,11.9%,
320500,2353,10.5%,
320130,2171,9.7%,
320530,1921,8.6%,
320120,1353,6.1%,
320320,833,3.7%,
320150,806,3.6%,
320490,683,3.1%,
320240,653,2.9%,
320060,453,2.0%,

0,1
Distinct count,59
Unique (%),0.3%
Missing (%),71.4%
Missing (n),15950

0,1
320530,4788
320320,591
320120,516
Other values (55),487
(Missing),15950

Value,Count,Frequency (%),Unnamed: 3
320530,4788,21.4%,
320320,591,2.6%,
320120,516,2.3%,
320150,376,1.7%,
293135,9,0.0%,
320500,9,0.0%,
330100,8,0.0%,
310620,7,0.0%,
320520,5,0.0%,
316860,5,0.0%,

0,1
Distinct count,3110
Unique (%),13.9%
Missing (%),0.5%
Missing (n),121

0,1
6507,536
6733,397
5132,320
Other values (3106),20958

Value,Count,Frequency (%),Unnamed: 3
6507,536,2.4%,
6733,397,1.8%,
5132,320,1.4%,
9434,261,1.2%,
11809,229,1.0%,
9389,216,1.0%,
8556,214,1.0%,
4631,187,0.8%,
6752,185,0.8%,
9370,166,0.7%,

0,1
Distinct count,630
Unique (%),2.8%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,77.88044
Minimum,1.0
Maximum,791.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,18.0
Q1,32.0
Median,47.0
Q3,65.0
95-th percentile,314.0
Maximum,791.0
Range,790.0
Interquartile range,33.0

0,1
Standard deviation,100.766045
Coef of variation,1.2938557
Kurtosis,10.950298
Mean,77.88044
MAD,58.964973
Skewness,3.2151642
Sum,1739226.0
Variance,10153.796
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
37.0,419,1.9%,
39.0,417,1.9%,
46.0,399,1.8%,
36.0,393,1.8%,
40.0,390,1.7%,
47.0,388,1.7%,
38.0,382,1.7%,
30.0,381,1.7%,
42.0,377,1.7%,
41.0,376,1.7%,

Value,Count,Frequency (%),Unnamed: 3
1.0,1,0.0%,
3.0,2,0.0%,
4.0,4,0.0%,
5.0,4,0.0%,
6.0,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
769.0,1,0.0%,
772.0,1,0.0%,
776.0,1,0.0%,
780.0,1,0.0%,
791.0,1,0.0%,

0,1
Distinct count,383
Unique (%),1.7%
Missing (%),0.1%
Missing (n),20
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-01 00:00:00
Maximum,2016-11-16 00:00:00

0,1
Distinct count,333
Unique (%),1.5%
Missing (%),0.0%
Missing (n),3
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-09 00:00:00
Maximum,2017-01-31 00:00:00

0,1
Distinct count,260
Unique (%),1.2%
Missing (%),97.1%
Missing (n),21680
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-03-05 00:00:00
Maximum,2017-02-01 00:00:00

0,1
Distinct count,291
Unique (%),1.3%
Missing (%),94.7%
Missing (n),21138
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-22 00:00:00
Maximum,2016-11-29 00:00:00

0,1
Constant value,

0,1
Distinct count,299
Unique (%),1.3%
Missing (%),94.7%
Missing (n),21148
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-14 00:00:00
Maximum,2016-11-29 00:00:00

0,1
Distinct count,422
Unique (%),1.9%
Missing (%),87.3%
Missing (n),19491
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-04 00:00:00
Maximum,2017-01-20 00:00:00

0,1
Distinct count,14951
Unique (%),66.9%
Missing (%),0.2%
Missing (n),51
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1900-08-10 00:00:00
Maximum,2015-12-29 00:00:00

0,1
Distinct count,365
Unique (%),1.6%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-01 00:00:00
Maximum,2015-12-31 00:00:00

0,1
Distinct count,203
Unique (%),0.9%
Missing (%),0.0%
Missing (n),2
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-15 00:00:00
Maximum,2017-03-21 00:00:00

0,1
Distinct count,180
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2015-01-15 00:00:00
Maximum,2017-01-31 00:00:00

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),24.1%
Missing (n),5379

0,1
9,5066
2,3687
1,2922
Other values (3),5278
(Missing),5379

Value,Count,Frequency (%),Unnamed: 3
9,5066,22.7%,
2,3687,16.5%,
1,2922,13.1%,
3,2850,12.8%,
4,1845,8.3%,
5,583,2.6%,
(Missing),5379,24.1%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),24.1%
Missing (n),5386

0,1
9,5062
1,4828
0,2922
Other values (4),4134
(Missing),5386

Value,Count,Frequency (%),Unnamed: 3
9,5062,22.7%,
1,4828,21.6%,
0,2922,13.1%,
2,2085,9.3%,
3,1467,6.6%,
5,486,2.2%,
4,96,0.4%,
(Missing),5386,24.1%,

0,1
Distinct count,14
Unique (%),0.1%
Missing (%),24.1%
Missing (n),5386

0,1
09,5062
10,3146
00,2922
Other values (10),5816
(Missing),5386

Value,Count,Frequency (%),Unnamed: 3
09,5062,22.7%,
10,3146,14.1%,
00,2922,13.1%,
11,1178,5.3%,
02,1141,5.1%,
12,1126,5.0%,
01,541,2.4%,
03,531,2.4%,
08,486,2.2%,
04,376,1.7%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21776

0,1
4,274
3,133
5,74
Other values (3),75
(Missing),21776

Value,Count,Frequency (%),Unnamed: 3
4,274,1.2%,
3,133,0.6%,
5,74,0.3%,
9,35,0.2%,
2,25,0.1%,
1,15,0.1%,
(Missing),21776,97.5%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21778

0,1
3,238
2,151
5,50
Other values (4),115
(Missing),21778

Value,Count,Frequency (%),Unnamed: 3
3,238,1.1%,
2,151,0.7%,
5,50,0.2%,
1,43,0.2%,
9,35,0.2%,
4,23,0.1%,
0,14,0.1%,
(Missing),21778,97.5%,

0,1
Distinct count,14
Unique (%),0.1%
Missing (%),97.5%
Missing (n),21778

0,1
12,141
06,68
11,62
Other values (10),283
(Missing),21778

Value,Count,Frequency (%),Unnamed: 3
12,141,0.6%,
06,68,0.3%,
11,62,0.3%,
03,53,0.2%,
08,50,0.2%,
04,36,0.2%,
09,35,0.2%,
05,29,0.1%,
07,23,0.1%,
10,18,0.1%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),100.0%
Missing (n),22331

0,1
VITORIA APART,1
(Missing),22331

Value,Count,Frequency (%),Unnamed: 3
VITORIA APART,1,0.0%,
(Missing),22331,100.0%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),13.7%
Missing (n),3062

0,1
2,6939
1,5007
3,4469
Other values (3),2855
(Missing),3062

Value,Count,Frequency (%),Unnamed: 3
2,6939,31.1%,
1,5007,22.4%,
3,4469,20.0%,
4,1242,5.6%,
9,1223,5.5%,
5,390,1.7%,
(Missing),3062,13.7%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),100.0%
Missing (n),22327

0,1
2,2
1,2
9,1
(Missing),22327

Value,Count,Frequency (%),Unnamed: 3
2,2,0.0%,
1,2,0.0%,
9,1,0.0%,
(Missing),22327,100.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),85.2%
Missing (n),19024

0,1
1,1753
9,868
2,376
Other values (2),311
(Missing),19024

Value,Count,Frequency (%),Unnamed: 3
1,1753,7.8%,
9,868,3.9%,
2,376,1.7%,
4,161,0.7%,
3,150,0.7%,
(Missing),19024,85.2%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),87.1%
Missing (n),19443

0,1
3,758
1,606
6,521
Other values (6),1004
(Missing),19443

Value,Count,Frequency (%),Unnamed: 3
3,758,3.4%,
1,606,2.7%,
6,521,2.3%,
4,350,1.6%,
8,341,1.5%,
2,174,0.8%,
7,93,0.4%,
5,44,0.2%,
9,2,0.0%,
(Missing),19443,87.1%,

0,1
Distinct count,38
Unique (%),0.2%
Missing (%),94.6%
Missing (n),21137

0,1
SXXXXX,296
SSXXXX,142
XXSXXX,126
Other values (34),631
(Missing),21137

Value,Count,Frequency (%),Unnamed: 3
SXXXXX,296,1.3%,
SSXXXX,142,0.6%,
XXSXXX,126,0.6%,
XXXXXS,107,0.5%,
SXSXXX,79,0.4%,
XXXXSX,61,0.3%,
XXXSXX,54,0.2%,
SXXXXS,40,0.2%,
XSXXXS,34,0.2%,
SXXXSX,30,0.1%,

0,1
Constant value,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.5%
Missing (n),21763

0,1
5,206
2,125
4,124
Other values (4),114
(Missing),21763

Value,Count,Frequency (%),Unnamed: 3
5,206,0.9%,
2,125,0.6%,
4,124,0.6%,
3,85,0.4%,
1,19,0.1%,
9,6,0.0%,
6,4,0.0%,
(Missing),21763,97.5%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.3%
Missing (n),21727

0,1
1,551
2,44
3,6
(Missing),21727

Value,Count,Frequency (%),Unnamed: 3
1,551,2.5%,
2,44,0.2%,
3,6,0.0%,
9,4,0.0%,
(Missing),21727,97.3%,

0,1
Distinct count,1292
Unique (%),5.8%
Missing (%),10.3%
Missing (n),2296
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1203.322
Minimum,0.0
Maximum,2359.0
Zeros (%),0.2%

0,1
Minimum,0.0
5-th percentile,126.0
Q1,630.0
Median,1200.0
Q3,1800.0
95-th percentile,2240.0
Maximum,2359.0
Range,2359.0
Interquartile range,1170.0

0,1
Standard deviation,673.90533
Coef of variation,0.5600374
Kurtosis,-1.1578877
Mean,1203.322
MAD,582.04095
Skewness,-0.010915146
Sum,24109760.0
Variance,454148.44
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,270,1.2%,
500.0,234,1.0%,
800.0,230,1.0%,
2000.0,219,1.0%,
700.0,206,0.9%,
2200.0,202,0.9%,
1800.0,202,0.9%,
1700.0,202,0.9%,
1600.0,199,0.9%,
1500.0,196,0.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,54,0.2%,
1.0,6,0.0%,
2.0,7,0.0%,
3.0,1,0.0%,
4.0,3,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2355.0,36,0.2%,
2356.0,3,0.0%,
2357.0,4,0.0%,
2358.0,7,0.0%,
2359.0,1,0.0%,

0,1
Distinct count,194
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,457.5978
Minimum,1.0
Maximum,999.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,417.0
Q1,450.0
Median,468.0
Q3,481.0
95-th percentile,492.0
Maximum,999.0
Range,998.0
Interquartile range,31.0

0,1
Standard deviation,51.417
Coef of variation,0.11236286
Kurtosis,31.918533
Mean,457.5978
MAD,25.96308
Skewness,-3.7946002
Sum,10219074.0
Variance,2643.708
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
484.0,514,2.3%,
485.0,508,2.3%,
481.0,483,2.2%,
479.0,471,2.1%,
477.0,464,2.1%,
486.0,461,2.1%,
483.0,460,2.1%,
480.0,459,2.1%,
482.0,456,2.0%,
478.0,438,2.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,9,0.0%,
2.0,1,0.0%,
5.0,2,0.0%,
12.0,1,0.0%,
15.0,3,0.0%,

Value,Count,Frequency (%),Unnamed: 3
509.0,2,0.0%,
510.0,1,0.0%,
511.0,2,0.0%,
514.0,1,0.0%,
999.0,12,0.1%,

0,1
Distinct count,33
Unique (%),0.1%
Missing (%),97.4%
Missing (n),21742
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,27.050848
Minimum,14.0
Maximum,45.0
Zeros (%),0.0%

0,1
Minimum,14.0
5-th percentile,16.0
Q1,21.0
Median,27.0
Q3,33.0
95-th percentile,39.0
Maximum,45.0
Range,31.0
Interquartile range,12.0

0,1
Standard deviation,7.0494823
Coef of variation,0.26060116
Kurtosis,-0.8285664
Mean,27.050848
MAD,5.898018
Skewness,0.15553658
Sum,15960.0
Variance,49.6952
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
33.0,32,0.1%,
26.0,30,0.1%,
30.0,30,0.1%,
25.0,29,0.1%,
27.0,28,0.1%,
28.0,28,0.1%,
29.0,27,0.1%,
18.0,27,0.1%,
23.0,27,0.1%,
17.0,26,0.1%,

Value,Count,Frequency (%),Unnamed: 3
14.0,7,0.0%,
15.0,7,0.0%,
16.0,18,0.1%,
17.0,26,0.1%,
18.0,27,0.1%,

Value,Count,Frequency (%),Unnamed: 3
41.0,8,0.0%,
42.0,4,0.0%,
43.0,2,0.0%,
44.0,1,0.0%,
45.0,1,0.0%,

0,1
Distinct count,1024
Unique (%),4.6%
Missing (%),2.5%
Missing (n),560

0,1
*A419,4027
*R688,1302
*R092,1152
Other values (1020),15291

Value,Count,Frequency (%),Unnamed: 3
*A419,4027,18.0%,
*R688,1302,5.8%,
*R092,1152,5.2%,
*I219,1131,5.1%,
*J969,1074,4.8%,
*J960,939,4.2%,
*J81X,786,3.5%,
*R570,633,2.8%,
*S068,451,2.0%,
*T792,379,1.7%,

0,1
Distinct count,1557
Unique (%),7.0%
Missing (%),15.8%
Missing (n),3539

0,1
*J189,1673
*A419,1102
*I219,714
Other values (1553),15304
(Missing),3539

Value,Count,Frequency (%),Unnamed: 3
*J189,1673,7.5%,
*A419,1102,4.9%,
*I219,714,3.2%,
*I10X,703,3.1%,
*S069,558,2.5%,
*N390,358,1.6%,
*J180,347,1.6%,
*I500,346,1.5%,
*J159,288,1.3%,
*J690,262,1.2%,

0,1
Distinct count,1482
Unique (%),6.6%
Missing (%),40.8%
Missing (n),9101

0,1
*I10X,981
*J189,618
*X954,313
Other values (1478),11319
(Missing),9101

Value,Count,Frequency (%),Unnamed: 3
*I10X,981,4.4%,
*J189,618,2.8%,
*X954,313,1.4%,
*J449,293,1.3%,
*E149,285,1.3%,
*I709,280,1.3%,
*I219,250,1.1%,
*I251,225,1.0%,
*I500,207,0.9%,
*I64X,207,0.9%,

0,1
Distinct count,1015
Unique (%),4.5%
Missing (%),74.1%
Missing (n),16557

0,1
*I10X,779
*E149,317
*F102,190
Other values (1011),4489
(Missing),16557

Value,Count,Frequency (%),Unnamed: 3
*I10X,779,3.5%,
*E149,317,1.4%,
*F102,190,0.9%,
*J449,136,0.6%,
*G309,122,0.5%,
*I709,119,0.5%,
*F172,114,0.5%,
*J189,114,0.5%,
*I694,93,0.4%,
*I64X,87,0.4%,

0,1
Distinct count,2307
Unique (%),10.3%
Missing (%),65.5%
Missing (n),14626

0,1
*I10X,795
*I10X*E149,289
*E149,287
Other values (2303),6335
(Missing),14626

Value,Count,Frequency (%),Unnamed: 3
*I10X,795,3.6%,
*I10X*E149,289,1.3%,
*E149,287,1.3%,
*F172,194,0.9%,
*E149*I10X,158,0.7%,
*G309,155,0.7%,
*F102,147,0.7%,
*N189,142,0.6%,
*R54X,141,0.6%,
*N179,122,0.5%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,15492
3,3717
4,1424
Other values (3),1699

Value,Count,Frequency (%),Unnamed: 3
1,15492,69.4%,
3,3717,16.6%,
4,1424,6.4%,
2,943,4.2%,
5,697,3.1%,
9,59,0.3%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.1%
Missing (n),21680

0,1
3,569
9,80
1,3
(Missing),21680

Value,Count,Frequency (%),Unnamed: 3
3,569,2.5%,
9,80,0.4%,
1,3,0.0%,
(Missing),21680,97.1%,

0,1
Distinct count,49
Unique (%),0.2%
Missing (%),9.9%
Missing (n),2213

0,1
832,13921
831,2725
829,1140
Other values (45),2333
(Missing),2213

Value,Count,Frequency (%),Unnamed: 3
832,13921,62.3%,
831,2725,12.2%,
829,1140,5.1%,
800,1061,4.8%,
833,621,2.8%,
835,144,0.6%,
826,74,0.3%,
823,58,0.3%,
827,53,0.2%,
825,36,0.2%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),10.9%
Missing (n),2434

0,1
2,12744
1,5888
9,1266
(Missing),2434

Value,Count,Frequency (%),Unnamed: 3
2,12744,57.1%,
1,5888,26.4%,
9,1266,5.7%,
(Missing),2434,10.9%,

0,1
Constant value,

0,1
Distinct count,216
Unique (%),1.0%
Missing (%),94.7%
Missing (n),21147
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,85.18819
Minimum,0.0
Maximum,547.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,24.0
Q1,50.0
Median,72.0
Q3,105.0
95-th percentile,176.8
Maximum,547.0
Range,547.0
Interquartile range,55.0

0,1
Standard deviation,59.27301
Coef of variation,0.6957891
Kurtosis,12.991222
Mean,85.18819
MAD,39.323723
Skewness,2.8154287
Sum,100948.0
Variance,3513.2898
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
72.0,20,0.1%,
51.0,19,0.1%,
57.0,18,0.1%,
68.0,18,0.1%,
65.0,18,0.1%,
70.0,18,0.1%,
48.0,18,0.1%,
92.0,17,0.1%,
58.0,15,0.1%,
56.0,15,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,2,0.0%,
2.0,1,0.0%,
3.0,1,0.0%,
5.0,2,0.0%,
7.0,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
410.0,1,0.0%,
466.0,1,0.0%,
487.0,1,0.0%,
523.0,1,0.0%,
547.0,1,0.0%,

0,1
Correlation,0.91958

0,1
Distinct count,321
Unique (%),1.4%
Missing (%),98.6%
Missing (n),22012

0,1
68803758,1
68790655,1
68768338,1
Other values (317),317
(Missing),22012

Value,Count,Frequency (%),Unnamed: 3
68803758,1,0.0%,
68790655,1,0.0%,
68768338,1,0.0%,
64295206,1,0.0%,
68825228,1,0.0%,
68773165,1,0.0%,
68782365,1,0.0%,
68798980,1,0.0%,
68821585,1,0.0%,
68797899,1,0.0%,

First 3 values
20921237
22194252
22176449

Last 3 values
22175040
22182202
22197870

Value,Count,Frequency (%),Unnamed: 3
8857853,1,0.0%,
14658688,1,0.0%,
15286050,1,0.0%,
15286052,1,0.0%,
16009670,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
23030753,1,0.0%,
23030840,1,0.0%,
23037103,1,0.0%,
23737285,1,0.0%,
23843644,1,0.0%,

0,1
Distinct count,11
Unique (%),0.0%
Missing (%),0.0%
Missing (n),2

0,1
0,4077
4,2053
3,2041
Other values (7),14159

Value,Count,Frequency (%),Unnamed: 3
0,4077,18.3%,
4,2053,9.2%,
3,2041,9.1%,
6,2040,9.1%,
1,2036,9.1%,
5,2031,9.1%,
2,2022,9.1%,
8,2018,9.0%,
9,2011,9.0%,
7,2001,9.0%,

0,1
Distinct count,129
Unique (%),0.6%
Missing (%),0.0%
Missing (n),1

0,1
20150010,908
20150023,869
20150008,823
Other values (125),19731

Value,Count,Frequency (%),Unnamed: 3
20150010,908,4.1%,
20150023,869,3.9%,
20150008,823,3.7%,
20150013,809,3.6%,
20150007,745,3.3%,
20150009,629,2.8%,
20150006,561,2.5%,
20150011,551,2.5%,
20160001,488,2.2%,
20150015,487,2.2%,

0,1
Distinct count,3228
Unique (%),14.5%
Missing (%),85.5%
Missing (n),19105

0,1
700208467719322,1
704805550812940,1
708200150951246,1
Other values (3224),3224
(Missing),19105

Value,Count,Frequency (%),Unnamed: 3
700208467719322,1,0.0%,
704805550812940,1,0.0%,
708200150951246,1,0.0%,
020402273456009,1,0.0%,
898000698937912,1,0.0%,
700309959211640,1,0.0%,
700503347547853,1,0.0%,
070540813679097,1,0.0%,
704307546159598,1,0.0%,
708108570626338,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),92.2%
Missing (n),20592

0,1
2,1255
9,470
1,15
(Missing),20592

Value,Count,Frequency (%),Unnamed: 3
2,1255,5.6%,
9,470,2.1%,
1,15,0.1%,
(Missing),20592,92.2%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.3%
Missing (n),21728

0,1
3,598
9,6
(Missing),21728

Value,Count,Frequency (%),Unnamed: 3
3,598,2.7%,
9,6,0.0%,
(Missing),21728,97.3%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),92.2%
Missing (n),20592

0,1
3,1230
9,470
1,26
(Missing),20592

Value,Count,Frequency (%),Unnamed: 3
3,1230,5.5%,
9,470,2.1%,
1,26,0.1%,
2,14,0.1%,
(Missing),20592,92.2%,

0,1
Distinct count,541
Unique (%),2.4%
Missing (%),23.9%
Missing (n),5329

0,1
999993,6528
999992,2706
621005,2139
Other values (537),5630
(Missing),5329

Value,Count,Frequency (%),Unnamed: 3
999993,6528,29.2%,
999992,2706,12.1%,
621005,2139,9.6%,
715210,674,3.0%,
622020,373,1.7%,
999991,296,1.3%,
354705,202,0.9%,
141410,193,0.9%,
512105,190,0.9%,
999994,165,0.7%,

0,1
Distinct count,85
Unique (%),0.4%
Missing (%),97.9%
Missing (n),21867

0,1
999992,231
999991,34
621005,20
Other values (81),180
(Missing),21867

Value,Count,Frequency (%),Unnamed: 3
999992,231,1.0%,
999991,34,0.2%,
621005,20,0.1%,
521110,10,0.0%,
411010,9,0.0%,
999994,8,0.0%,
422105,8,0.0%,
622020,7,0.0%,
512105,7,0.0%,
322205,7,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,22330
3,1
2,1

Value,Count,Frequency (%),Unnamed: 3
1,22330,100.0%,
3,1,0.0%,
2,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.3%
Missing (n),21727

0,1
2,331
1,269
9,5
(Missing),21727

Value,Count,Frequency (%),Unnamed: 3
2,331,1.5%,
1,269,1.2%,
9,5,0.0%,
(Missing),21727,97.3%,

0,1
Distinct count,387
Unique (%),1.7%
Missing (%),97.4%
Missing (n),21753
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2003.1503
Minimum,160.0
Maximum,5345.0
Zeros (%),0.0%

0,1
Minimum,160.0
5-th percentile,499.6
Q1,942.5
Median,1995.0
Q3,2972.5
95-th percentile,3701.0
Maximum,5345.0
Range,5185.0
Interquartile range,2030.0

0,1
Standard deviation,1116.6206
Coef of variation,0.5574323
Kurtosis,-1.0684623
Mean,2003.1503
MAD,990.223
Skewness,0.220103
Sum,1159824.0
Variance,1246841.6
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
950.0,6,0.0%,
2800.0,5,0.0%,
900.0,5,0.0%,
820.0,5,0.0%,
2960.0,4,0.0%,
1000.0,4,0.0%,
3000.0,4,0.0%,
3110.0,4,0.0%,
520.0,4,0.0%,
850.0,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
160.0,1,0.0%,
290.0,1,0.0%,
350.0,1,0.0%,
355.0,1,0.0%,
365.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4510.0,1,0.0%,
4740.0,1,0.0%,
4830.0,1,0.0%,
4890.0,1,0.0%,
5345.0,1,0.0%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),97.8%
Missing (n),21846
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.0720165
Minimum,0.0
Maximum,99.0
Zeros (%),1.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,0.0
Median,0.0
Q3,1.0
95-th percentile,2.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,12.585582
Coef of variation,6.0740743
Kurtosis,55.73467
Mean,2.0720165
MAD,3.3018255
Skewness,7.563576
Sum,1007.0
Variance,158.39687
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
0.0,336,1.5%,
1.0,97,0.4%,
2.0,30,0.1%,
3.0,10,0.0%,
99.0,8,0.0%,
4.0,3,0.0%,
11.0,1,0.0%,
5.0,1,0.0%,
(Missing),21846,97.8%,

Value,Count,Frequency (%),Unnamed: 3
0.0,336,1.5%,
1.0,97,0.4%,
2.0,30,0.1%,
3.0,10,0.0%,
4.0,3,0.0%,

Value,Count,Frequency (%),Unnamed: 3
3.0,10,0.0%,
4.0,3,0.0%,
5.0,1,0.0%,
11.0,1,0.0%,
99.0,8,0.0%,

0,1
Distinct count,13
Unique (%),0.1%
Missing (%),97.5%
Missing (n),21782
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.3527272
Minimum,0.0
Maximum,99.0
Zeros (%),0.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,1.0
Median,1.0
Q3,2.0
95-th percentile,5.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,8.42686
Coef of variation,3.581741
Kurtosis,124.439316
Mean,2.3527272
MAD,2.0847867
Skewness,11.036078
Sum,1294.0
Variance,71.01197
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
1.0,212,0.9%,
2.0,132,0.6%,
0.0,102,0.5%,
3.0,52,0.2%,
4.0,17,0.1%,
5.0,12,0.1%,
7.0,7,0.0%,
6.0,7,0.0%,
99.0,4,0.0%,
11.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,102,0.5%,
1.0,212,0.9%,
2.0,132,0.6%,
3.0,52,0.2%,
4.0,17,0.1%,

Value,Count,Frequency (%),Unnamed: 3
7.0,7,0.0%,
8.0,2,0.0%,
9.0,1,0.0%,
11.0,2,0.0%,
99.0,4,0.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),12.0%
Missing (n),2675

0,1
1,9019
4,8574
2,1959
Other values (2),105
(Missing),2675

Value,Count,Frequency (%),Unnamed: 3
1,9019,40.4%,
4,8574,38.4%,
2,1959,8.8%,
3,80,0.4%,
5,25,0.1%,
(Missing),2675,12.0%,

0,1
Distinct count,30
Unique (%),0.1%
Missing (%),97.5%
Missing (n),21764
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,32.883804
Minimum,0.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,22.0
Q1,27.0
Median,33.5
Q3,38.0
95-th percentile,40.0
Maximum,99.0
Range,99.0
Interquartile range,11.0

0,1
Standard deviation,9.875265
Coef of variation,0.30030787
Kurtosis,20.43143
Mean,32.883804
MAD,6.2743125
Skewness,2.551369
Sum,18678.0
Variance,97.52087
Memory size,87.3 KiB

Value,Count,Frequency (%),Unnamed: 3
38.0,50,0.2%,
39.0,50,0.2%,
40.0,46,0.2%,
37.0,43,0.2%,
32.0,30,0.1%,
26.0,30,0.1%,
34.0,27,0.1%,
28.0,26,0.1%,
33.0,25,0.1%,
36.0,25,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,3,0.0%,
1.0,3,0.0%,
2.0,1,0.0%,
4.0,1,0.0%,
9.0,3,0.0%,

Value,Count,Frequency (%),Unnamed: 3
39.0,50,0.2%,
40.0,46,0.2%,
41.0,17,0.1%,
42.0,4,0.0%,
99.0,6,0.0%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),86.9%
Missing (n),19402

0,1
4,1141
3,490
8,376
Other values (5),923
(Missing),19402

Value,Count,Frequency (%),Unnamed: 3
4,1141,5.1%,
3,490,2.2%,
8,376,1.7%,
5,303,1.4%,
2,225,1.0%,
1,167,0.7%,
7,115,0.5%,
6,113,0.5%,
(Missing),19402,86.9%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),99.1%
Missing (n),22121

0,1
3,73
8,36
7,19
Other values (5),83
(Missing),22121

Value,Count,Frequency (%),Unnamed: 3
3,73,0.3%,
8,36,0.2%,
7,19,0.1%,
5,19,0.1%,
4,18,0.1%,
1,17,0.1%,
6,15,0.1%,
2,14,0.1%,
(Missing),22121,99.1%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,12936
2,9388
0,8

Value,Count,Frequency (%),Unnamed: 3
1,12936,57.9%,
2,9388,42.0%,
0,8,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),5

0,1
S,22325
N,2
(Missing),5

Value,Count,Frequency (%),Unnamed: 3
S,22325,100.0%,
N,2,0.0%,
(Missing),5,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),1

0,1
Mean,0.0

0,1
0.0,22331
(Missing),1

Value,Count,Frequency (%),Unnamed: 3
0.0,22331,100.0%,
(Missing),1,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
Mean,0.9998209

0,1
1.0,22328
0.0,4

Value,Count,Frequency (%),Unnamed: 3
1.0,22328,100.0%,
0.0,4,0.0%,

0,1
Constant value,2

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),92.2%
Missing (n),20594

0,1
8,1213
9,470
4,26
Other values (4),29
(Missing),20594

Value,Count,Frequency (%),Unnamed: 3
8,1213,5.4%,
9,470,2.1%,
4,26,0.1%,
5,14,0.1%,
1,12,0.1%,
3,2,0.0%,
2,1,0.0%,
(Missing),20594,92.2%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),94.6%
Missing (n),21137

0,1
M,1193
R,1
E,1
(Missing),21137

Value,Count,Frequency (%),Unnamed: 3
M,1193,5.3%,
R,1,0.0%,
E,1,0.0%,
(Missing),21137,94.6%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),94.7%
Missing (n),21138

0,1
9,1043
8,100
5,22
Other values (5),29
(Missing),21138

Value,Count,Frequency (%),Unnamed: 3
9,1043,4.7%,
8,100,0.4%,
5,22,0.1%,
6,12,0.1%,
1,10,0.0%,
3,3,0.0%,
7,2,0.0%,
4,2,0.0%,
(Missing),21138,94.7%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.5%
Missing (n),122

0,1
N,19286
S,2924
(Missing),122

Value,Count,Frequency (%),Unnamed: 3
N,19286,86.4%,
S,2924,13.1%,
(Missing),122,0.5%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.8%
Missing (n),22281

0,1
1,30
2,16
3,5
(Missing),22281

Value,Count,Frequency (%),Unnamed: 3
1,30,0.1%,
2,16,0.1%,
3,5,0.0%,
(Missing),22281,99.8%,

0,1
Distinct count,22332
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,11166
Minimum,1
Maximum,22332
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,1117.5
Q1,5583.8
Median,11166.0
Q3,16749.0
95-th percentile,21215.0
Maximum,22332.0
Range,22331.0
Interquartile range,11166.0

0,1
Standard deviation,6446.8
Coef of variation,0.57734
Kurtosis,-1.2
Mean,11166
MAD,5583
Skewness,0
Sum,249370278
Variance,41562000
Memory size,174.5 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,1,0.0%,
6822,1,0.0%,
17053,1,0.0%,
21151,1,0.0%,
10912,1,0.0%,
8865,1,0.0%,
15010,1,0.0%,
12963,1,0.0%,
2724,1,0.0%,
677,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,1,0.0%,
2,1,0.0%,
3,1,0.0%,
4,1,0.0%,
5,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
22328,1,0.0%,
22329,1,0.0%,
22330,1,0.0%,
22331,1,0.0%,
22332,1,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),8

0,1
3.2,22323
2.2,1
(Missing),8

Value,Count,Frequency (%),Unnamed: 3
3.2,22323,100.0%,
2.2,1,0.0%,
(Missing),8,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),0.0%
Missing (n),1

0,1
3.2.00,22285
3.2.02,33
3.2.01,13
(Missing),1

Value,Count,Frequency (%),Unnamed: 3
3.2.00,22285,99.8%,
3.2.02,33,0.1%,
3.2.01,13,0.1%,
(Missing),1,0.0%,

Unnamed: 0.1,ACIDTRAB,ALTCAUSA,ASSISTMED,ATESTADO,ATESTANTE,CAUSABAS,CAUSABAS_O,CAUSAMAT,CB_PRE,CIRCOBITO,CIRURGIA,CODESTAB,CODIFICADO,CODINST,CODMUNNATU,CODMUNOCOR,CODMUNRES,COMUNSVOIM,CRM,DIFDATA,DTATESTADO,DTCADASTRO,DTCADINF,DTCADINV,DTCONCASO,DTCONINV,DTINVESTIG,DTNASC,DTOBITO,DTRECEBIM,DTRECORIGA,ESC,ESC2010,ESCFALAGR1,ESCMAE,ESCMAE2010,ESCMAEAGR1,ESTABDESCR,ESTCIV,EXAME,FONTE,FONTEINV,FONTES,FONTESINF,GESTACAO,GRAVIDEZ,HORAOBITO,IDADE,IDADEMAE,LINHAA,LINHAB,LINHAC,LINHAD,LINHAII,LOCOCOR,MORTEPARTO,NATURAL,NECROPSIA,NUDIASINF,NUDIASOBCO,NUDIASOBIN,NUMERODN,NUMERODO,NUMERODV,NUMEROLOTE,NUMSUS,OBITOGRAV,OBITOPARTO,OBITOPUERP,OCUP,OCUPMAE,ORIGEM,PARTO,PESO,QTDFILMORT,QTDFILVIVO,RACACOR,SEMAGESTAC,SERIESCFAL,SERIESCMAE,SEXO,STCODIFICA,STDOEPIDEM,STDONOVA,TIPOBITO,TPMORTEOCO,TPNIVELINV,TPOBITOCOR,TPPOS,TPRESGINFO,Unnamed: 0,VERSAOSCB,VERSAOSIST
0,,2.0,1,P60/D689/Q894/P291*P369,1,P60,P60,,,,2.0,2339196.0,S,EGO5208700001,,520870,320500,,11574,21.0,2015-09-28,2015-10-14,2016-01-24,NaT,NaT,NaT,NaT,2015-09-02,2015-09-28,2015-10-19,2015-10-19,,,,5.0,,,,,2.0,,,,,4.0,2.0,300.0,226.0,33.0,*P60X,*D689,*Q894,*P291,*P369,1,3.0,,2,,,,67544975.0,8857853,,20150057,,,,,,,1,2.0,2375.0,0.0,4.0,2,,,,2,S,0.0,0.0,2,,,,,,1,3.2,3.2.00
1,,,1,Y848 A419/G419,2,G419,G419,,,,2.0,2200422.0,S,MMG3106200001,,310620,320320,,21338,23.0,2015-02-03,2015-02-05,NaT,2015-05-06,NaT,2015-05-06,NaT,1990-12-17,2015-02-03,2015-02-26,2015-02-12,4.0,,,,,,,1.0,1.0,,,SSXXXX,,,,1350.0,424.0,,*Y848*A419,*G419,,,,1,,,2,,92.0,92.0,,14658688,3.0,20150005,,2.0,,3.0,999991.0,,1,,,,,4,,,,2,S,0.0,0.0,2,,M,9.0,N,,2,3.2,3.2.00
2,,,1,J969/J439/J449,1,J448,J448,,,,2.0,,S,MES3201500001,,320150,320150,,12443,109.0,2015-02-21,2015-05-25,NaT,NaT,NaT,NaT,NaT,1930-09-11,2015-02-21,2015-06-10,2015-06-10,9.0,,,,,,,2.0,2.0,,,,,,,,484.0,,*J969,*J439,*J449,,,3,,,9,,,,,15286050,9.0,20150005,,,,,621005.0,,1,,,,,4,,,,1,S,0.0,0.0,2,,,,N,,3,3.2,3.2.00
3,,,1,C541/I694*E46,1,C541,C541,,,,2.0,,S,MES3201500001,,320150,320150,,11213,57.0,2015-07-28,2015-09-18,NaT,NaT,NaT,NaT,NaT,1961-02-02,2015-07-27,2015-09-22,2015-09-22,9.0,,,,,,,3.0,1.0,,,,,,,2240.0,454.0,,*C541,*I694,,,*E46X,3,,,1,,,,,15286052,5.0,20150010,,2.0,,3.0,999992.0,,1,,,,,3,,,,2,S,0.0,0.0,2,,,,N,,4,3.2,3.2.00
4,,2.0,1,P220/P072,1,P220,P220,,,,,5731186.0,S,MES3201300001,,320130,320510,,6541,133.0,2015-01-16,2015-02-13,2015-04-01,NaT,NaT,NaT,2015-04-01,2015-01-15,2015-01-16,2015-05-29,2015-02-13,,,,3.0,2.0,11.0,,,,,8.0,,,2.0,1.0,840.0,201.0,16.0,*P220,*P072,,,,1,3.0,800.0,2,,,,68769615.0,16009670,7.0,20150005,,,3.0,,,999991.0,1,1.0,505.0,,,4,22.0,,,1,S,0.0,1.0,2,,,,S,,5,3.2,3.2.00


### SIM DOES2016 `df_sim_does2016_raw`

In [9]:
# Render the profiling report for the SIM DOES2016 raw dataset inline.
# NOTE(review): pf_sim_does2016_raw is presumably the pandas_profiling.ProfileReport
# returned by load_resource_df_pf for the 'sim-does2016-raw-csv' resource; its
# assignment is not visible in this cell -- confirm it survives Restart & Run All.
display(pf_sim_does2016_raw)

Stored 'df_sim_does2016_raw' (DataFrame)


0,1
Number of variables,93
Number of observations,22868
Total Missing (%),50.2%
Total size in memory,7.7 MiB
Average record size in memory,354.6 B

0,1
Numeric,10
Categorical,61
Boolean,1
Date,10
Text (Unique),1
Rejected,10
Unsupported,0

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),93.0%
Missing (n),21272

0,1
9,920
2,633
1,43
(Missing),21272

Value,Count,Frequency (%),Unnamed: 3
9,920,4.0%,
2,633,2.8%,
1,43,0.2%,
(Missing),21272,93.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.5%
Missing (n),22294

0,1
2,458
1,116
(Missing),22294

Value,Count,Frequency (%),Unnamed: 3
2,458,2.0%,
1,116,0.5%,
(Missing),22294,97.5%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),6.6%
Missing (n),1510

0,1
1,13988
9,4729
2,2641
(Missing),1510

Value,Count,Frequency (%),Unnamed: 3
1,13988,61.2%,
9,4729,20.7%,
2,2641,11.5%,
(Missing),1510,6.6%,

0,1
Distinct count,17056
Unique (%),74.6%
Missing (%),0.0%
Missing (n),0

0,1
A419/J189,171
R99,132
I219,121
Other values (17053),22444

Value,Count,Frequency (%),Unnamed: 3
A419/J189,171,0.7%,
R99,132,0.6%,
I219,121,0.5%,
I219/I10,121,0.5%,
C349,101,0.4%,
Y349,97,0.4%,
C169,86,0.4%,
C509,79,0.3%,
C159,57,0.2%,
R092/I219,51,0.2%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.6%
Missing (n),142

0,1
1,6436
2,5459
5,4311
Other values (2),6520

Value,Count,Frequency (%),Unnamed: 3
1,6436,28.1%,
2,5459,23.9%,
5,4311,18.9%,
3,3478,15.2%,
4,3042,13.3%,
(Missing),142,0.6%,

0,1
Distinct count,1459
Unique (%),6.4%
Missing (%),0.0%
Missing (n),0

0,1
I219,1962
J189,962
I64,615
Other values (1456),19329

Value,Count,Frequency (%),Unnamed: 3
I219,1962,8.6%,
J189,962,4.2%,
I64,615,2.7%,
E149,509,2.2%,
G309,501,2.2%,
X954,464,2.0%,
I678,432,1.9%,
C349,432,1.9%,
I110,421,1.8%,
J440,336,1.5%,

0,1
Distinct count,1396
Unique (%),6.1%
Missing (%),0.0%
Missing (n),6

0,1
I219,1961
J189,1006
I64,618
Other values (1392),19277

Value,Count,Frequency (%),Unnamed: 3
I219,1961,8.6%,
J189,1006,4.4%,
I64,618,2.7%,
E149,495,2.2%,
G309,482,2.1%,
C349,430,1.9%,
I678,427,1.9%,
X954,422,1.8%,
Y349,401,1.8%,
I110,376,1.6%,

0,1
Constant value,

0,1
Constant value,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),85.0%
Missing (n),19435

0,1
1,1691
3,1197
9,362
Other values (2),183
(Missing),19435

Value,Count,Frequency (%),Unnamed: 3
1,1691,7.4%,
3,1197,5.2%,
9,362,1.6%,
2,171,0.7%,
4,12,0.1%,
(Missing),19435,85.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),100.0%
Missing (n),22862

0,1
2,6
(Missing),22862

Value,Count,Frequency (%),Unnamed: 3
2,6,0.0%,
(Missing),22862,100.0%,

0,1
Distinct count,292
Unique (%),1.3%
Missing (%),24.8%
Missing (n),5677

0,1
7257406,1388
2550687,1008
0011738,891
Other values (288),13904
(Missing),5677

Value,Count,Frequency (%),Unnamed: 3
7257406,1388,6.1%,
2550687,1008,4.4%,
0011738,891,3.9%,
2485680,767,3.4%,
2547821,732,3.2%,
2494442,634,2.8%,
2446030,566,2.5%,
0011746,464,2.0%,
7621442,435,1.9%,
2546957,425,1.9%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
S,22862
N,6

Value,Count,Frequency (%),Unnamed: 3
S,22862,100.0%,
N,6,0.0%,

0,1
Distinct count,83
Unique (%),0.4%
Missing (%),0.0%
Missing (n),0

0,1
RES3205300001,10004
MES3205300001,4108
MES3205000001,2805
Other values (80),5951

Value,Count,Frequency (%),Unnamed: 3
RES3205300001,10004,43.7%,
MES3205300001,4108,18.0%,
MES3205000001,2805,12.3%,
MES3205200001,2746,12.0%,
MES3201500001,1341,5.9%,
MES3201300001,1212,5.3%,
MES3200600001,355,1.6%,
MRJ3300600001,31,0.1%,
RRJ3304550000,26,0.1%,
MRJ3302200001,23,0.1%,

0,1
Distinct count,909
Unique (%),4.0%
Missing (%),18.0%
Missing (n),4125

0,1
320530,1389
320150,1330
320120,665
Other values (905),15359
(Missing),4125

Value,Count,Frequency (%),Unnamed: 3
320530,1389,6.1%,
320150,1330,5.8%,
320120,665,2.9%,
320520,648,2.8%,
320010,518,2.3%,
320320,509,2.2%,
320490,426,1.9%,
320020,400,1.7%,
320500,391,1.7%,
320130,349,1.5%,

0,1
Distinct count,174
Unique (%),0.8%
Missing (%),0.0%
Missing (n),0

0,1
320530,4145
320500,2806
320520,2749
Other values (171),13168

Value,Count,Frequency (%),Unnamed: 3
320530,4145,18.1%,
320500,2806,12.3%,
320520,2749,12.0%,
320120,1936,8.5%,
320150,1354,5.9%,
320490,1233,5.4%,
320130,1212,5.3%,
320320,917,4.0%,
320230,411,1.8%,
320090,404,1.8%,

0,1
Distinct count,79
Unique (%),0.3%
Missing (%),0.0%
Missing (n),0

0,1
320520,2595
320500,2447
320130,2341
Other values (76),15485

Value,Count,Frequency (%),Unnamed: 3
320520,2595,11.3%,
320500,2447,10.7%,
320130,2341,10.2%,
320530,1990,8.7%,
320120,1351,5.9%,
320320,838,3.7%,
320150,764,3.3%,
320490,717,3.1%,
320240,687,3.0%,
320060,451,2.0%,

0,1
Distinct count,54
Unique (%),0.2%
Missing (%),71.6%
Missing (n),16374

0,1
320530,4957
320320,603
320120,541
Other values (50),393
(Missing),16374

Value,Count,Frequency (%),Unnamed: 3
320530,4957,21.7%,
320320,603,2.6%,
320120,541,2.4%,
320150,279,1.2%,
293135,19,0.1%,
320520,12,0.1%,
330100,7,0.0%,
310620,6,0.0%,
355030,4,0.0%,
330240,4,0.0%,

0,1
Distinct count,3210
Unique (%),14.0%
Missing (%),1.0%
Missing (n),234

0,1
6507,585
6734,469
6733,409
Other values (3206),21171

Value,Count,Frequency (%),Unnamed: 3
6507,585,2.6%,
6734,469,2.1%,
6733,409,1.8%,
5132,355,1.6%,
11809,323,1.4%,
9434,264,1.2%,
9389,239,1.0%,
6752,210,0.9%,
8556,189,0.8%,
12162,183,0.8%,

0,1
Distinct count,670
Unique (%),2.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,84.806015
Minimum,2.0
Maximum,770.0
Zeros (%),0.0%

0,1
Minimum,2.0
5-th percentile,19.0
Q1,37.0
Median,55.0
Q3,78.0
95-th percentile,338.0
Maximum,770.0
Range,768.0
Interquartile range,41.0

0,1
Standard deviation,102.92296
Coef of variation,1.213628
Kurtosis,11.264954
Mean,84.806015
MAD,58.823498
Skewness,3.2552674
Sum,1939344.0
Variance,10593.135
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
51.0,376,1.6%,
54.0,372,1.6%,
45.0,370,1.6%,
53.0,352,1.5%,
50.0,349,1.5%,
52.0,344,1.5%,
49.0,342,1.5%,
55.0,341,1.5%,
48.0,339,1.5%,
46.0,332,1.5%,

Value,Count,Frequency (%),Unnamed: 3
2.0,3,0.0%,
3.0,1,0.0%,
4.0,5,0.0%,
5.0,2,0.0%,
6.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
752.0,1,0.0%,
757.0,1,0.0%,
763.0,2,0.0%,
765.0,1,0.0%,
770.0,1,0.0%,

0,1
Distinct count,378
Unique (%),1.7%
Missing (%),0.1%
Missing (n),13
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-01-01 00:00:00
Maximum,2017-07-24 00:00:00

0,1
Distinct count,347
Unique (%),1.5%
Missing (%),0.0%
Missing (n),2
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-01-06 00:00:00
Maximum,2018-02-28 00:00:00

0,1
Distinct count,242
Unique (%),1.1%
Missing (%),97.2%
Missing (n),22226
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-02-11 00:00:00
Maximum,2018-02-06 00:00:00

0,1
Distinct count,289
Unique (%),1.3%
Missing (%),94.9%
Missing (n),21692
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-02-06 00:00:00
Maximum,2018-02-20 00:00:00

0,1
Constant value,

0,1
Distinct count,300
Unique (%),1.3%
Missing (%),94.9%
Missing (n),21708
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-02-02 00:00:00
Maximum,2018-01-22 00:00:00

0,1
Distinct count,428
Unique (%),1.9%
Missing (%),88.2%
Missing (n),20169
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-01-11 00:00:00
Maximum,2018-02-05 00:00:00

0,1
Distinct count,15130
Unique (%),66.2%
Missing (%),0.2%
Missing (n),44
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1900-09-15 00:00:00
Maximum,2016-12-30 00:00:00

0,1
Distinct count,366
Unique (%),1.6%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-01-01 00:00:00
Maximum,2016-12-31 00:00:00

0,1
Distinct count,217
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-01-18 00:00:00
Maximum,2018-02-28 00:00:00

0,1
Distinct count,202
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2016-01-18 00:00:00
Maximum,2018-02-28 00:00:00

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),16.3%
Missing (n),3720

0,1
9,6828
2,3768
1,3000
Other values (3),5552
(Missing),3720

Value,Count,Frequency (%),Unnamed: 3
9,6828,29.9%,
2,3768,16.5%,
1,3000,13.1%,
3,2882,12.6%,
4,1938,8.5%,
5,732,3.2%,
(Missing),3720,16.3%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),16.3%
Missing (n),3728

0,1
9,6827
1,5001
0,3000
Other values (4),4312
(Missing),3728

Value,Count,Frequency (%),Unnamed: 3
9,6827,29.9%,
1,5001,21.9%,
0,3000,13.1%,
2,2016,8.8%,
3,1568,6.9%,
5,595,2.6%,
4,133,0.6%,
(Missing),3728,16.3%,

0,1
Distinct count,14
Unique (%),0.1%
Missing (%),16.3%
Missing (n),3728

0,1
09,6827
10,3256
00,3000
Other values (10),6057
(Missing),3728

Value,Count,Frequency (%),Unnamed: 3
09,6827,29.9%,
10,3256,14.2%,
00,3000,13.1%,
02,1233,5.4%,
12,1226,5.4%,
11,1170,5.1%,
08,595,2.6%,
01,512,2.2%,
03,478,2.1%,
04,368,1.6%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),97.6%
Missing (n),22315

0,1
4,254
3,137
5,72
Other values (3),90
(Missing),22315

Value,Count,Frequency (%),Unnamed: 3
4,254,1.1%,
3,137,0.6%,
5,72,0.3%,
9,52,0.2%,
2,23,0.1%,
1,15,0.1%,
(Missing),22315,97.6%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.6%
Missing (n),22315

0,1
3,212
2,159
9,52
Other values (4),130
(Missing),22315

Value,Count,Frequency (%),Unnamed: 3
3,212,0.9%,
2,159,0.7%,
9,52,0.2%,
5,52,0.2%,
1,43,0.2%,
4,20,0.1%,
0,15,0.1%,
(Missing),22315,97.6%,

0,1
Distinct count,14
Unique (%),0.1%
Missing (%),97.6%
Missing (n),22315

0,1
12,117
06,74
11,68
Other values (10),294
(Missing),22315

Value,Count,Frequency (%),Unnamed: 3
12,117,0.5%,
06,74,0.3%,
11,68,0.3%,
09,52,0.2%,
08,52,0.2%,
03,49,0.2%,
04,42,0.2%,
05,21,0.1%,
07,20,0.1%,
02,20,0.1%,

0,1
Constant value,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),7.9%
Missing (n),1806

0,1
2,7093
1,5061
3,4549
Other values (3),4359

Value,Count,Frequency (%),Unnamed: 3
2,7093,31.0%,
1,5061,22.1%,
3,4549,19.9%,
9,2565,11.2%,
4,1418,6.2%,
5,376,1.6%,
(Missing),1806,7.9%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),100.0%
Missing (n),22862

0,1
2,6
(Missing),22862

Value,Count,Frequency (%),Unnamed: 3
2,6,0.0%,
(Missing),22862,100.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),85.9%
Missing (n),19641

0,1
1,1629
9,983
2,427
Other values (2),188
(Missing),19641

Value,Count,Frequency (%),Unnamed: 3
1,1629,7.1%,
9,983,4.3%,
2,427,1.9%,
4,95,0.4%,
3,93,0.4%,
(Missing),19641,85.9%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),87.5%
Missing (n),20018

0,1
6,739
1,564
3,558
Other values (6),989
(Missing),20018

Value,Count,Frequency (%),Unnamed: 3
6,739,3.2%,
1,564,2.5%,
3,558,2.4%,
8,354,1.5%,
4,323,1.4%,
2,195,0.9%,
7,69,0.3%,
5,47,0.2%,
9,1,0.0%,
(Missing),20018,87.5%,

0,1
Distinct count,38
Unique (%),0.2%
Missing (%),97.2%
Missing (n),22226

0,1
XXXSXX,89
SXXSXX,80
SXSSXX,72
Other values (34),401
(Missing),22226

Value,Count,Frequency (%),Unnamed: 3
XXXSXX,89,0.4%,
SXXSXX,80,0.3%,
SXSSXX,72,0.3%,
XXSXXX,70,0.3%,
XXXXXX,68,0.3%,
SXSXXX,57,0.2%,
SXXXXX,57,0.2%,
XXSSXX,41,0.2%,
SSSSXX,18,0.1%,
XXXXSX,12,0.1%,

0,1
Constant value,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.5%
Missing (n),22306

0,1
5,185
2,146
4,116
Other values (4),115
(Missing),22306

Value,Count,Frequency (%),Unnamed: 3
5,185,0.8%,
2,146,0.6%,
4,116,0.5%,
3,91,0.4%,
1,19,0.1%,
6,3,0.0%,
9,2,0.0%,
(Missing),22306,97.5%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.4%
Missing (n),22279

0,1
1,541
2,47
9,1
(Missing),22279

Value,Count,Frequency (%),Unnamed: 3
1,541,2.4%,
2,47,0.2%,
9,1,0.0%,
(Missing),22279,97.4%,

0,1
Distinct count,1356
Unique (%),5.9%
Missing (%),9.4%
Missing (n),2155
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1191.059
Minimum,0.0
Maximum,2359.0
Zeros (%),0.2%

0,1
Minimum,0.0
5-th percentile,125.0
Q1,620.0
Median,1157.0
Q3,1757.0
95-th percentile,2240.0
Maximum,2359.0
Range,2359.0
Interquartile range,1137.0

0,1
Standard deviation,673.87024
Coef of variation,0.565774
Kurtosis,-1.1610739
Mean,1191.059
MAD,582.34033
Skewness,0.012833047
Sum,24670404.0
Variance,454101.12
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,278,1.2%,
900.0,231,1.0%,
500.0,218,1.0%,
800.0,214,0.9%,
700.0,208,0.9%,
400.0,192,0.8%,
1100.0,189,0.8%,
2200.0,189,0.8%,
2100.0,187,0.8%,
1800.0,180,0.8%,

Value,Count,Frequency (%),Unnamed: 3
0.0,47,0.2%,
1.0,12,0.1%,
2.0,2,0.0%,
3.0,2,0.0%,
4.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2355.0,36,0.2%,
2356.0,5,0.0%,
2357.0,2,0.0%,
2358.0,8,0.0%,
2359.0,3,0.0%,

0,1
Distinct count,199
Unique (%),0.9%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,458.5
Minimum,1.0
Maximum,999.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,418.0
Q1,451.0
Median,468.0
Q3,481.0
95-th percentile,492.0
Maximum,999.0
Range,998.0
Interquartile range,30.0

0,1
Standard deviation,51.074013
Coef of variation,0.111393705
Kurtosis,35.98241
Mean,458.5
MAD,25.206621
Skewness,-3.5814183
Sum,10484978.0
Variance,2608.555
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
478.0,495,2.2%,
486.0,493,2.2%,
480.0,492,2.2%,
481.0,492,2.2%,
477.0,488,2.1%,
483.0,484,2.1%,
482.0,475,2.1%,
476.0,472,2.1%,
479.0,471,2.1%,
484.0,467,2.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,7,0.0%,
3.0,3,0.0%,
4.0,1,0.0%,
5.0,5,0.0%,
7.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
510.0,5,0.0%,
511.0,1,0.0%,
513.0,1,0.0%,
515.0,1,0.0%,
999.0,17,0.1%,

0,1
Distinct count,34
Unique (%),0.1%
Missing (%),97.5%
Missing (n),22305
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,26.45293
Minimum,13.0
Maximum,46.0
Zeros (%),0.0%

0,1
Minimum,13.0
5-th percentile,16.0
Q1,20.0
Median,26.0
Q3,32.0
95-th percentile,39.0
Maximum,46.0
Range,33.0
Interquartile range,12.0

0,1
Standard deviation,7.447026
Coef of variation,0.2815199
Kurtosis,-0.81997216
Mean,26.45293
MAD,6.2640576
Skewness,0.323566
Sum,14893.0
Variance,55.45819
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
18.0,35,0.2%,
26.0,33,0.1%,
17.0,27,0.1%,
19.0,26,0.1%,
20.0,25,0.1%,
16.0,24,0.1%,
23.0,24,0.1%,
22.0,24,0.1%,
29.0,24,0.1%,
24.0,23,0.1%,

Value,Count,Frequency (%),Unnamed: 3
13.0,1,0.0%,
14.0,6,0.0%,
15.0,10,0.0%,
16.0,24,0.1%,
17.0,27,0.1%,

Value,Count,Frequency (%),Unnamed: 3
41.0,9,0.0%,
42.0,5,0.0%,
43.0,6,0.0%,
44.0,1,0.0%,
46.0,1,0.0%,

0,1
Distinct count,994
Unique (%),4.3%
Missing (%),3.0%
Missing (n),681

0,1
*A419,4135
*I219,1314
*R688,1163
Other values (990),15575

Value,Count,Frequency (%),Unnamed: 3
*A419,4135,18.1%,
*I219,1314,5.7%,
*R688,1163,5.1%,
*R092,1142,5.0%,
*J960,1085,4.7%,
*J969,1077,4.7%,
*J81X,794,3.5%,
*R570,686,3.0%,
*R571,420,1.8%,
*S068,374,1.6%,

0,1
Distinct count,1502
Unique (%),6.6%
Missing (%),17.1%
Missing (n),3920

0,1
*J189,1714
*A419,1128
*I219,707
Other values (1498),15399
(Missing),3920

Value,Count,Frequency (%),Unnamed: 3
*J189,1714,7.5%,
*A419,1128,4.9%,
*I219,707,3.1%,
*I10X,686,3.0%,
*S069,532,2.3%,
*N390,385,1.7%,
*I500,384,1.7%,
*J159,338,1.5%,
*J180,299,1.3%,
*J969,273,1.2%,

0,1
Distinct count,1487
Unique (%),6.5%
Missing (%),40.5%
Missing (n),9255

0,1
*I10X,1132
*J189,654
*I709,352
Other values (1483),11475
(Missing),9255

Value,Count,Frequency (%),Unnamed: 3
*I10X,1132,5.0%,
*J189,654,2.9%,
*I709,352,1.5%,
*J449,306,1.3%,
*E149,263,1.2%,
*I219,242,1.1%,
*A419,230,1.0%,
*N189,216,0.9%,
*X954,215,0.9%,
*I500,209,0.9%,

0,1
Distinct count,971
Unique (%),4.2%
Missing (%),74.0%
Missing (n),16932

0,1
*I10X,885
*E149,270
*F102,206
Other values (967),4575
(Missing),16932

Value,Count,Frequency (%),Unnamed: 3
*I10X,885,3.9%,
*E149,270,1.2%,
*F102,206,0.9%,
*I709,141,0.6%,
*J189,133,0.6%,
*G309,129,0.6%,
*F172,121,0.5%,
*J449,116,0.5%,
*I219,86,0.4%,
*I64X,78,0.3%,

0,1
Distinct count,2512
Unique (%),11.0%
Missing (%),63.6%
Missing (n),14554

0,1
*I10X,838
*E149,349
*I10X*E149,300
Other values (2508),6827
(Missing),14554

Value,Count,Frequency (%),Unnamed: 3
*I10X,838,3.7%,
*E149,349,1.5%,
*I10X*E149,300,1.3%,
*F172,211,0.9%,
*E149*I10X,185,0.8%,
*G309,160,0.7%,
*N179,150,0.7%,
*N189,150,0.7%,
*R54X,147,0.6%,
*F102,130,0.6%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,16138
3,3808
4,1207
Other values (3),1715

Value,Count,Frequency (%),Unnamed: 3
1,16138,70.6%,
3,3808,16.7%,
4,1207,5.3%,
2,1053,4.6%,
5,598,2.6%,
9,64,0.3%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.2%
Missing (n),22226

0,1
3,568
9,72
1,2
(Missing),22226

Value,Count,Frequency (%),Unnamed: 3
3,568,2.5%,
9,72,0.3%,
1,2,0.0%,
(Missing),22226,97.2%,

0,1
Distinct count,46
Unique (%),0.2%
Missing (%),16.2%
Missing (n),3705

0,1
832,13821
831,2780
829,1047
Other values (42),1515
(Missing),3705

Value,Count,Frequency (%),Unnamed: 3
832,13821,60.4%,
831,2780,12.2%,
829,1047,4.6%,
833,557,2.4%,
800,358,1.6%,
835,120,0.5%,
826,78,0.3%,
823,52,0.2%,
827,50,0.2%,
843,41,0.2%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),6.0%
Missing (n),1381

0,1
2,14548
1,5912
9,1027
(Missing),1381

Value,Count,Frequency (%),Unnamed: 3
2,14548,63.6%,
1,5912,25.9%,
9,1027,4.5%,
(Missing),1381,6.0%,

0,1
Constant value,

0,1
Distinct count,224
Unique (%),1.0%
Missing (%),94.9%
Missing (n),21705
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,88.69991
Minimum,1.0
Maximum,472.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,23.0
Q1,52.0
Median,80.0
Q3,111.0
95-th percentile,191.0
Maximum,472.0
Range,471.0
Interquartile range,59.0

0,1
Standard deviation,57.449642
Coef of variation,0.64768547
Kurtosis,8.6938715
Mean,88.69991
MAD,39.375484
Skewness,2.2675226
Sum,103158.0
Variance,3300.4614
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
77.0,17,0.1%,
99.0,17,0.1%,
73.0,16,0.1%,
60.0,16,0.1%,
80.0,16,0.1%,
111.0,15,0.1%,
51.0,15,0.1%,
72.0,14,0.1%,
56.0,14,0.1%,
54.0,14,0.1%,

Value,Count,Frequency (%),Unnamed: 3
1.0,1,0.0%,
7.0,1,0.0%,
8.0,3,0.0%,
9.0,3,0.0%,
10.0,3,0.0%,

Value,Count,Frequency (%),Unnamed: 3
408.0,1,0.0%,
422.0,1,0.0%,
426.0,1,0.0%,
458.0,1,0.0%,
472.0,1,0.0%,

0,1
Constant value,

0,1
Distinct count,333
Unique (%),1.5%
Missing (%),98.5%
Missing (n),22536

0,1
71079077,1
71090826,1
71070281,1
Other values (329),329
(Missing),22536

Value,Count,Frequency (%),Unnamed: 3
71079077,1,0.0%,
71090826,1,0.0%,
71070281,1,0.0%,
71069121,1,0.0%,
68817242,1,0.0%,
71078016,1,0.0%,
71133091,1,0.0%,
68824991,1,0.0%,
68797260,1,0.0%,
71069856,1,0.0%,

First 3 values
23166395
22196475
22195731

Last 3 values
23740134
23733088
23163609

Value,Count,Frequency (%),Unnamed: 3
15286054,1,0.0%,
16009671,1,0.0%,
16010299,1,0.0%,
16012506,1,0.0%,
16013553,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
24648350,1,0.0%,
24755650,1,0.0%,
24771481,1,0.0%,
24877146,1,0.0%,
24937484,1,0.0%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
0,4132
8,2117
3,2101
Other values (7),14518

Value,Count,Frequency (%),Unnamed: 3
0,4132,18.1%,
8,2117,9.3%,
3,2101,9.2%,
9,2096,9.2%,
2,2093,9.2%,
6,2082,9.1%,
5,2073,9.1%,
7,2068,9.0%,
1,2055,9.0%,
4,2051,9.0%,

0,1
Distinct count,127
Unique (%),0.6%
Missing (%),0.0%
Missing (n),0

0,1
20160011,856
20160029,730
20160037,659
Other values (124),20623

Value,Count,Frequency (%),Unnamed: 3
20160011,856,3.7%,
20160029,730,3.2%,
20160037,659,2.9%,
20160014,658,2.9%,
20160032,637,2.8%,
20160015,624,2.7%,
20170005,622,2.7%,
20170007,604,2.6%,
20160010,567,2.5%,
20160012,563,2.5%,

0,1
Distinct count,1089
Unique (%),4.8%
Missing (%),95.2%
Missing (n),21780

0,1
700003711594004,1
704605696655620,1
898002743746809,1
Other values (1085),1085
(Missing),21780

Value,Count,Frequency (%),Unnamed: 3
700003711594004,1,0.0%,
704605696655620,1,0.0%,
898002743746809,1,0.0%,
200430815460006,1,0.0%,
709706012698390,1,0.0%,
703004834186376,1,0.0%,
702107759056591,1,0.0%,
701002873808996,1,0.0%,
706004391951847,1,0.0%,
705002295091956,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),90.8%
Missing (n),20758

0,1
2,1309
9,788
1,13
(Missing),20758

Value,Count,Frequency (%),Unnamed: 3
2,1309,5.7%,
9,788,3.4%,
1,13,0.1%,
(Missing),20758,90.8%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.4%
Missing (n),22276

0,1
3,590
9,2
(Missing),22276

Value,Count,Frequency (%),Unnamed: 3
3,590,2.6%,
9,2,0.0%,
(Missing),22276,97.4%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),90.8%
Missing (n),20758

0,1
3,1295
9,788
2,14
(Missing),20758

Value,Count,Frequency (%),Unnamed: 3
3,1295,5.7%,
9,788,3.4%,
2,14,0.1%,
1,13,0.1%,
(Missing),20758,90.8%,

0,1
Distinct count,509
Unique (%),2.2%
Missing (%),21.6%
Missing (n),4948

0,1
999993,6933
999992,2783
621005,2107
Other values (505),6097
(Missing),4948

Value,Count,Frequency (%),Unnamed: 3
999993,6933,30.3%,
999992,2783,12.2%,
621005,2107,9.2%,
715210,610,2.7%,
622020,361,1.6%,
999991,298,1.3%,
999994,295,1.3%,
354705,237,1.0%,
512105,236,1.0%,
992225,227,1.0%,

0,1
Distinct count,84
Unique (%),0.4%
Missing (%),97.9%
Missing (n),22377

0,1
999992,232
999991,43
621005,17
Other values (80),199
(Missing),22377

Value,Count,Frequency (%),Unnamed: 3
999992,232,1.0%,
999991,43,0.2%,
621005,17,0.1%,
999994,13,0.1%,
354705,10,0.0%,
322205,9,0.0%,
239415,8,0.0%,
512105,8,0.0%,
411010,8,0.0%,
421125,8,0.0%,

0,1
Constant value,1

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.4%
Missing (n),22281

0,1
2,352
1,229
9,6
(Missing),22281

Value,Count,Frequency (%),Unnamed: 3
2,352,1.5%,
1,229,1.0%,
9,6,0.0%,
(Missing),22281,97.4%,

0,1
Distinct count,382
Unique (%),1.7%
Missing (%),97.5%
Missing (n),22307
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1883.8806
Minimum,190.0
Maximum,5515.0
Zeros (%),0.0%

0,1
Minimum,190.0
5-th percentile,490.0
Q1,840.0
Median,1675.0
Q3,2835.0
95-th percentile,3635.0
Maximum,5515.0
Range,5325.0
Interquartile range,1995.0

0,1
Standard deviation,1103.7865
Coef of variation,0.5859111
Kurtosis,-1.0095508
Mean,1883.8806
MAD,973.7118
Skewness,0.3717888
Sum,1056857.0
Variance,1218344.6
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,6,0.0%,
700.0,6,0.0%,
2700.0,6,0.0%,
550.0,5,0.0%,
750.0,5,0.0%,
725.0,4,0.0%,
3270.0,4,0.0%,
770.0,4,0.0%,
680.0,4,0.0%,
1145.0,4,0.0%,

Value,Count,Frequency (%),Unnamed: 3
190.0,1,0.0%,
320.0,2,0.0%,
330.0,1,0.0%,
355.0,1,0.0%,
370.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4300.0,1,0.0%,
4375.0,1,0.0%,
4580.0,1,0.0%,
4670.0,1,0.0%,
5515.0,1,0.0%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.9%
Missing (n),22382
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,0.33744857
Minimum,0.0
Maximum,3.0
Zeros (%),1.6%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,0.0
Median,0.0
Q3,1.0
95-th percentile,2.0
Maximum,3.0
Range,3.0
Interquartile range,1.0

0,1
Standard deviation,0.6495969
Coef of variation,1.925025
Kurtosis,4.107296
Mean,0.33744857
MAD,0.50270116
Skewness,2.0705688
Sum,164.0
Variance,0.42197615
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
0.0,362,1.6%,
1.0,92,0.4%,
2.0,24,0.1%,
3.0,8,0.0%,
(Missing),22382,97.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,362,1.6%,
1.0,92,0.4%,
2.0,24,0.1%,
3.0,8,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,362,1.6%,
1.0,92,0.4%,
2.0,24,0.1%,
3.0,8,0.0%,

0,1
Distinct count,12
Unique (%),0.1%
Missing (%),97.6%
Missing (n),22318
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1.550909
Minimum,0.0
Maximum,10.0
Zeros (%),0.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,1.0
Median,1.0
Q3,2.0
95-th percentile,4.0
Maximum,10.0
Range,10.0
Interquartile range,1.0

0,1
Standard deviation,1.4821799
Coef of variation,0.9556846
Kurtosis,5.490102
Mean,1.550909
MAD,1.0910743
Skewness,1.8660893
Sum,853.0
Variance,2.1968572
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
1.0,204,0.9%,
2.0,128,0.6%,
0.0,121,0.5%,
3.0,49,0.2%,
4.0,23,0.1%,
5.0,12,0.1%,
6.0,6,0.0%,
7.0,2,0.0%,
9.0,2,0.0%,
8.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,121,0.5%,
1.0,204,0.9%,
2.0,128,0.6%,
3.0,49,0.2%,
4.0,23,0.1%,

Value,Count,Frequency (%),Unnamed: 3
6.0,6,0.0%,
7.0,2,0.0%,
8.0,2,0.0%,
9.0,2,0.0%,
10.0,1,0.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),12.4%
Missing (n),2842

0,1
1,9202
4,8663
2,2083
Other values (2),78
(Missing),2842

Value,Count,Frequency (%),Unnamed: 3
1,9202,40.2%,
4,8663,37.9%,
2,2083,9.1%,
3,57,0.2%,
5,21,0.1%,
(Missing),2842,12.4%,

0,1
Distinct count,30
Unique (%),0.1%
Missing (%),97.5%
Missing (n),22306
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,31.868328
Minimum,0.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,22.0
Q1,27.0
Median,33.0
Q3,38.0
95-th percentile,40.0
Maximum,99.0
Range,99.0
Interquartile range,11.0

0,1
Standard deviation,8.535995
Coef of variation,0.26785198
Kurtosis,14.902729
Mean,31.868328
MAD,6.1682982
Skewness,0.69847417
Sum,17910.0
Variance,72.8632
Memory size,89.4 KiB

Value,Count,Frequency (%),Unnamed: 3
39.0,52,0.2%,
38.0,50,0.2%,
40.0,47,0.2%,
26.0,33,0.1%,
36.0,33,0.1%,
29.0,27,0.1%,
33.0,26,0.1%,
28.0,25,0.1%,
24.0,25,0.1%,
27.0,25,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,2,0.0%,
1.0,5,0.0%,
2.0,4,0.0%,
3.0,1,0.0%,
9.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
39.0,52,0.2%,
40.0,47,0.2%,
41.0,13,0.1%,
42.0,3,0.0%,
99.0,2,0.0%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),87.2%
Missing (n),19935

0,1
4,1233
3,479
8,368
Other values (5),853
(Missing),19935

Value,Count,Frequency (%),Unnamed: 3
4,1233,5.4%,
3,479,2.1%,
8,368,1.6%,
5,261,1.1%,
2,229,1.0%,
1,146,0.6%,
6,110,0.5%,
7,107,0.5%,
(Missing),19935,87.2%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),99.1%
Missing (n),22651

0,1
3,80
8,42
5,21
Other values (5),74
(Missing),22651

Value,Count,Frequency (%),Unnamed: 3
3,80,0.3%,
8,42,0.2%,
5,21,0.1%,
4,20,0.1%,
7,16,0.1%,
2,13,0.1%,
1,13,0.1%,
6,12,0.1%,
(Missing),22651,99.1%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,13215
2,9649
0,4

Value,Count,Frequency (%),Unnamed: 3
1,13215,57.8%,
2,9649,42.2%,
0,4,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),6

0,1
S,22859
N,3
(Missing),6

Value,Count,Frequency (%),Unnamed: 3
S,22859,100.0%,
N,3,0.0%,
(Missing),6,0.0%,

0,1
Constant value,0.0

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
Mean,0.99995625

0,1
1.0,22867
0.0,1

Value,Count,Frequency (%),Unnamed: 3
1.0,22867,100.0%,
0.0,1,0.0%,

0,1
Constant value,2

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),90.8%
Missing (n),20758

0,1
8,1282
9,788
5,14
Other values (3),26
(Missing),20758

Value,Count,Frequency (%),Unnamed: 3
8,1282,5.6%,
9,788,3.4%,
5,14,0.1%,
4,13,0.1%,
1,9,0.0%,
2,4,0.0%,
(Missing),20758,90.8%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),94.8%
Missing (n),21689

0,1
M,1177
E,1
R,1
(Missing),21689

Value,Count,Frequency (%),Unnamed: 3
M,1177,5.1%,
E,1,0.0%,
R,1,0.0%,
(Missing),21689,94.8%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),94.9%
Missing (n),21692

0,1
9,1024
8,117
5,15
Other values (3),20
(Missing),21692

Value,Count,Frequency (%),Unnamed: 3
9,1024,4.5%,
8,117,0.5%,
5,15,0.1%,
6,12,0.1%,
1,4,0.0%,
4,4,0.0%,
(Missing),21692,94.9%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.4%
Missing (n),99

0,1
N,19887
S,2882
(Missing),99

Value,Count,Frequency (%),Unnamed: 3
N,19887,87.0%,
S,2882,12.6%,
(Missing),99,0.4%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.8%
Missing (n),22833

0,1
1,23
2,8
3,4
(Missing),22833

Value,Count,Frequency (%),Unnamed: 3
1,23,0.1%,
2,8,0.0%,
3,4,0.0%,
(Missing),22833,99.8%,

0,1
Distinct count,22868
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,11434
Minimum,1
Maximum,22868
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,1144.4
Q1,5717.8
Median,11434.0
Q3,17151.0
95-th percentile,21725.0
Maximum,22868.0
Range,22867.0
Interquartile range,11434.0

0,1
Standard deviation,6601.6
Coef of variation,0.57734
Kurtosis,-1.2
Mean,11434
MAD,5717
Skewness,0
Sum,261484146
Variance,43581000
Memory size,178.7 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,1,0.0%,
19116,1,0.0%,
21135,1,0.0%,
10896,1,0.0%,
8849,1,0.0%,
14994,1,0.0%,
12947,1,0.0%,
2708,1,0.0%,
661,1,0.0%,
6806,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,1,0.0%,
2,1,0.0%,
3,1,0.0%,
4,1,0.0%,
5,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
22864,1,0.0%,
22865,1,0.0%,
22866,1,0.0%,
22867,1,0.0%,
22868,1,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),6

0,1
3.2,22862
(Missing),6

Value,Count,Frequency (%),Unnamed: 3
3.2,22862,100.0%,
(Missing),6,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
3.2.00,22793
3.2.02,59
3.2.01,16

Value,Count,Frequency (%),Unnamed: 3
3.2.00,22793,99.7%,
3.2.02,59,0.3%,
3.2.01,16,0.1%,

Unnamed: 0.1,ACIDTRAB,ALTCAUSA,ASSISTMED,ATESTADO,ATESTANTE,CAUSABAS,CAUSABAS_O,CAUSAMAT,CB_PRE,CIRCOBITO,CIRURGIA,CODESTAB,CODIFICADO,CODINST,CODMUNNATU,CODMUNOCOR,CODMUNRES,COMUNSVOIM,CRM,DIFDATA,DTATESTADO,DTCADASTRO,DTCADINF,DTCADINV,DTCONCASO,DTCONINV,DTINVESTIG,DTNASC,DTOBITO,DTRECEBIM,DTRECORIGA,ESC,ESC2010,ESCFALAGR1,ESCMAE,ESCMAE2010,ESCMAEAGR1,ESTABDESCR,ESTCIV,EXAME,FONTE,FONTEINV,FONTES,FONTESINF,GESTACAO,GRAVIDEZ,HORAOBITO,IDADE,IDADEMAE,LINHAA,LINHAB,LINHAC,LINHAD,LINHAII,LOCOCOR,MORTEPARTO,NATURAL,NECROPSIA,NUDIASINF,NUDIASOBCO,NUDIASOBIN,NUMERODN,NUMERODO,NUMERODV,NUMEROLOTE,NUMSUS,OBITOGRAV,OBITOPARTO,OBITOPUERP,OCUP,OCUPMAE,ORIGEM,PARTO,PESO,QTDFILMORT,QTDFILVIVO,RACACOR,SEMAGESTAC,SERIESCFAL,SERIESCMAE,SEXO,STCODIFICA,STDOEPIDEM,STDONOVA,TIPOBITO,TPMORTEOCO,TPNIVELINV,TPOBITOCOR,TPPOS,TPRESGINFO,Unnamed: 0,VERSAOSCB,VERSAOSIST
0,,1.0,,P369/P072*P960,1,P369,P369,,,,,7257406.0,S,MES3205000001,320500,320500,320130,,13597,17.0,2016-01-01,2016-01-12,2016-03-14,NaT,NaT,NaT,NaT,2015-12-28,2016-01-01,2016-01-18,2016-01-18,,,,3.0,2.0,3.0,,,,,,SXSSXX,,2.0,1.0,1450.0,204.0,16.0,*P369,*P072,,,*P960,1,3.0,832,,,,,67391759.0,22196183,6,20160002,706801787564424.0,,3.0,,,999991.0,1,1.0,745.0,0.0,0.0,1,26.0,,6.0,2,S,0.0,1.0,2,,,,N,,1,3.2,3.2.00
1,,,1.0,A419/J189/N189/E149,2,E142,E142,,,,,7257406.0,S,MES3205000001,310060,320500,320500,,1245,24.0,2016-01-01,2016-01-19,NaT,NaT,NaT,NaT,NaT,1923-02-01,2016-01-01,2016-01-25,2016-01-25,2.0,1.0,10.0,,,,,1.0,,,,,,,,845.0,492.0,,*A419,*J189,*N189,*E149,,1,,831,2.0,,,,,22196181,0,20160003,,,,,999992.0,,1,,,,,4,,,,2,S,0.0,1.0,2,,,,N,,2,3.2,3.2.00
2,,,1.0,J969/J690/M809,1,M809,M809,,,,,7257406.0,S,MES3205000001,311340,320500,320500,,13468,209.0,2016-01-01,2016-01-19,NaT,NaT,NaT,NaT,NaT,1929-11-24,2016-01-01,2016-07-28,2016-01-25,2.0,1.0,10.0,,,,,9.0,,,,,,,,1006.0,486.0,,*J969,*J690,*M809,,,1,,831,2.0,,,,,22196182,8,20160026,,,,,999992.0,,1,,,,,4,,,,2,S,0.0,1.0,2,,,,N,,3,3.2,3.2.00
3,,,2.0,T07/X950,3,X950,X950,,,3.0,,,S,MES3205000001,320520,320500,320500,320530.0,10915,24.0,2016-01-01,2016-01-19,NaT,NaT,NaT,NaT,NaT,1998-01-09,2016-01-01,2016-01-25,2016-01-25,3.0,2.0,11.0,,,,,1.0,,1.0,,,,,,,417.0,,*T07X,*X950,,,,3,,832,1.0,,,,,22201559,4,20160003,,,,,999991.0,,1,,,,,4,,,,1,S,0.0,1.0,2,,,,N,,4,3.2,3.2.00
4,,,1.0,A419/I808/N179/C169,5,C169,C169,,,,,7257406.0,S,MES3205000001,320060,320500,320060,,8832,24.0,2016-01-01,2016-01-19,NaT,NaT,NaT,NaT,NaT,1957-12-04,2016-01-01,2016-01-25,2016-01-25,9.0,9.0,9.0,,,,,3.0,,,,,,,,1200.0,458.0,,*A419,*I808,*N179,*C169,,1,,832,2.0,,,,,22196184,4,20160003,702805654925060.0,2.0,,3.0,999992.0,,1,,,,,2,,,,2,S,0.0,1.0,2,8.0,,,N,,5,3.2,3.2.00


### SIM DOES 2012..2016 `df_sim_does20122016_raw`

In [18]:
# Profile the 2012..2016 frame once, then keep the report, its description
# object and the per-variable summary under separate names.
pf_sim_does20122016_raw = pandas_profiling.ProfileReport(df_sim_does20122016_raw)
pf_sim_does20122016_raw_desc = pf_sim_does20122016_raw.get_description()
pf_sim_does20122016_raw_vars = pf_sim_does20122016_raw_desc['variables']

# Apply the display options from CONTEXT_MAX_ROWS_COLS only while rendering:
# first the per-variable summary table, then the full profile report.
with pd.option_context(*CONTEXT_MAX_ROWS_COLS):
    display(pf_sim_does20122016_raw_vars, pf_sim_does20122016_raw)

Unnamed: 0,count,distinct_count,p_missing,n_missing,p_infinite,n_infinite,is_unique,mode,p_unique,memorysize,type,top,freq,mean,min,max,range,histogram,mini_histogram,std,variance,5%,25%,50%,75%,95%,iqr,kurtosis,skewness,sum,mad,cv,n_zeros,p_zeros
ACIDTRAB,7618,4,0.931057,102879,0,0,False,9,3.62001e-05,110681,CAT,9,4558.0,,,,,,,,,,,,,,,,,,,,,
ALTCAUSA,1684,3,0.98476,108813,0,0,False,2,2.71501e-05,884056,CAT,2,1380.0,,,,,,,,,,,,,,,,,,,,,
ASSISTMED,102165,4,0.0754048,8332,0,0,False,1,3.62001e-05,110681,CAT,1,69195.0,,,,,,,,,,,,,,,,,,,,,
ATESTADO,67230,45139,0.391567,43267,0,0,False,A419/J189,0.408509,884056,CAT,A419/J189,424.0,,,,,,,,,,,,,,,,,,,,,
ATESTANTE,109101,6,0.0126338,1396,0,0,False,1,5.43001e-05,110777,CAT,1,32700.0,,,,,,,,,,,,,,,,,,,,,
CAUSABAS,110497,2728,0.0,0,0,0,False,I219,0.0246885,884056,CAT,I219,8925.0,,,,,,,,,,,,,,,,,,,,,
CAUSABAS_O,110475,2641,0.0001991,22,0,0,False,I219,0.0239011,884056,CAT,I219,8882.0,,,,,,,,,,,,,,,,,,,,,
CAUSAMAT,0,1,1.0,110497,0,0,False,,9.05002e-06,110657,CONST,,,,,,,,,,,,,,,,,,,,,,,
CB_PRE,0,1,1.0,110497,0,0,False,,9.05002e-06,884056,CONST,,,,,,,,,,,,,,,,,,,,,,,
CIRCOBITO,18877,6,0.829163,91620,0,0,False,1,5.43001e-05,110777,CAT,1,8910.0,,,,,,,,,,,,,,,,,,,,,


0,1
Number of variables,98
Number of observations,110497
Total Missing (%),55.7%
Total size in memory,60.2 MiB
Average record size in memory,571.1 B

0,1
Numeric,12
Categorical,68
Boolean,2
Date,13
Text (Unique),0
Rejected,3
Unsupported,0

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),93.1%
Missing (n),102879

0,1
9,4558
2,2710
1,350
(Missing),102879

Value,Count,Frequency (%),Unnamed: 3
9,4558,4.1%,
2,2710,2.5%,
1,350,0.3%,
(Missing),102879,93.1%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),98.5%
Missing (n),108813

0,1
2,1380
1,304
(Missing),108813

Value,Count,Frequency (%),Unnamed: 3
2,1380,1.2%,
1,304,0.3%,
(Missing),108813,98.5%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),7.5%
Missing (n),8332

0,1
1,69195
9,17847
2,15123
(Missing),8332

Value,Count,Frequency (%),Unnamed: 3
1,69195,62.6%,
9,17847,16.2%,
2,15123,13.7%,
(Missing),8332,7.5%,

0,1
Distinct count,45139
Unique (%),40.9%
Missing (%),39.2%
Missing (n),43267

0,1
A419/J189,424
R99,374
I219/I10,365
Other values (45135),66067
(Missing),43267

Value,Count,Frequency (%),Unnamed: 3
A419/J189,424,0.4%,
R99,374,0.3%,
I219/I10,365,0.3%,
I219,342,0.3%,
C349,287,0.3%,
Y349,277,0.3%,
C169,209,0.2%,
C509,205,0.2%,
C159,197,0.2%,
R092/I219,181,0.2%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),1.3%
Missing (n),1396

0,1
1,32700
2,26033
3,18697
Other values (2),31671

Value,Count,Frequency (%),Unnamed: 3
1,32700,29.6%,
2,26033,23.6%,
3,18697,16.9%,
5,18178,16.5%,
4,13493,12.2%,
(Missing),1396,1.3%,

0,1
Distinct count,2728
Unique (%),2.5%
Missing (%),0.0%
Missing (n),0

0,1
I219,8925
J189,3839
I64,3391
Other values (2725),94342

Value,Count,Frequency (%),Unnamed: 3
I219,8925,8.1%,
J189,3839,3.5%,
I64,3391,3.1%,
X954,3170,2.9%,
E149,2641,2.4%,
G309,2153,1.9%,
C349,2138,1.9%,
I678,1955,1.8%,
I110,1916,1.7%,
I694,1904,1.7%,

0,1
Distinct count,2641
Unique (%),2.4%
Missing (%),0.0%
Missing (n),22

0,1
I219,8882
J189,4201
I64,3367
Other values (2637),94025

Value,Count,Frequency (%),Unnamed: 3
I219,8882,8.0%,
J189,4201,3.8%,
I64,3367,3.0%,
X954,2970,2.7%,
E149,2577,2.3%,
C349,2118,1.9%,
G309,2036,1.8%,
I678,1919,1.7%,
I110,1701,1.5%,
I694,1688,1.5%,

0,1
Constant value,

0,1
Constant value,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),82.9%
Missing (n),91620

0,1
1,8910
3,7305
9,1750
Other values (2),912
(Missing),91620

Value,Count,Frequency (%),Unnamed: 3
1,8910,8.1%,
3,7305,6.6%,
9,1750,1.6%,
2,848,0.8%,
4,64,0.1%,
(Missing),91620,82.9%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),110394

0,1
2,74
1,19
9,10
(Missing),110394

Value,Count,Frequency (%),Unnamed: 3
2,74,0.1%,
1,19,0.0%,
9,10,0.0%,
(Missing),110394,99.9%,

0,1
Distinct count,258
Unique (%),0.2%
Missing (%),80.6%
Missing (n),89022

0,1
1,3459
5220,2272
4909,1180
Other values (254),14564
(Missing),89022

Value,Count,Frequency (%),Unnamed: 3
1,3459,3.1%,
5220,2272,2.1%,
4909,1180,1.1%,
6104,1151,1.0%,
1617,1044,0.9%,
4085,1022,0.9%,
3441,828,0.7%,
2275,821,0.7%,
4911,764,0.7%,
1616,642,0.6%,

0,1
Distinct count,632
Unique (%),0.6%
Missing (%),27.1%
Missing (n),29914

0,1
7257406,4585
0011738,4538
2550687,4531
Other values (628),66929
(Missing),29914

Value,Count,Frequency (%),Unnamed: 3
7257406,4585,4.1%,
0011738,4538,4.1%,
2550687,4531,4.1%,
2485680,4051,3.7%,
2547821,3410,3.1%,
2494442,2961,2.7%,
2446030,2733,2.5%,
2546957,2635,2.4%,
0011746,2512,2.3%,
0011819,2209,2.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),39.2%
Missing (n),43268

0,1
S,67215
N,14
(Missing),43268

Value,Count,Frequency (%),Unnamed: 3
S,67215,60.8%,
N,14,0.0%,
(Missing),43268,39.2%,

0,1
Distinct count,212
Unique (%),0.2%
Missing (%),0.0%
Missing (n),0

0,1
RES3205300001,48508
MES3205300001,19547
MES3205200001,13826
Other values (209),28616

Value,Count,Frequency (%),Unnamed: 3
RES3205300001,48508,43.9%,
MES3205300001,19547,17.7%,
MES3205200001,13826,12.5%,
MES3205000001,13105,11.9%,
MES3201500001,6295,5.7%,
MES3201300001,5958,5.4%,
MES3200600001,1713,1.6%,
MRJ3300600001,151,0.1%,
MRJ3302200001,112,0.1%,
MES3205100001,90,0.1%,

0,1
Distinct count,112
Unique (%),0.1%
Missing (%),80.6%
Missing (n),89016

0,1
320530,3796
320520,2698
320500,2646
Other values (108),12341
(Missing),89016

Value,Count,Frequency (%),Unnamed: 3
320530,3796,3.4%,
320520,2698,2.4%,
320500,2646,2.4%,
320120,1985,1.8%,
320150,1188,1.1%,
320130,1153,1.0%,
320490,1063,1.0%,
320320,857,0.8%,
320240,339,0.3%,
320060,334,0.3%,

0,1
Distinct count,1513
Unique (%),1.4%
Missing (%),49.0%
Missing (n),54181

0,1
320530,4162
320150,3755
320520,2160
Other values (1509),46239
(Missing),54181

Value,Count,Frequency (%),Unnamed: 3
320530,4162,3.8%,
320150,3755,3.4%,
320520,2160,2.0%,
320120,1926,1.7%,
320010,1621,1.5%,
320320,1547,1.4%,
320000,1251,1.1%,
320490,1240,1.1%,
320500,1225,1.1%,
320020,1144,1.0%,

0,1
Distinct count,331
Unique (%),0.3%
Missing (%),0.0%
Missing (n),0

0,1
320530,19662
320520,13852
320500,13123
Other values (328),63860

Value,Count,Frequency (%),Unnamed: 3
320530,19662,17.8%,
320520,13852,12.5%,
320500,13123,11.9%,
320120,9798,8.9%,
320150,6613,6.0%,
320130,5967,5.4%,
320490,5507,5.0%,
320320,4487,4.1%,
320090,1746,1.6%,
320060,1720,1.6%,

0,1
Distinct count,79
Unique (%),0.1%
Missing (%),0.0%
Missing (n),0

0,1
320520,12756
320500,11700
320130,11112
Other values (76),74929

Value,Count,Frequency (%),Unnamed: 3
320520,12756,11.5%,
320500,11700,10.6%,
320130,11112,10.1%,
320530,9866,8.9%,
320120,6627,6.0%,
320320,4041,3.7%,
320150,3849,3.5%,
320240,3323,3.0%,
320490,3245,2.9%,
320060,2201,2.0%,

0,1
Distinct count,146
Unique (%),0.1%
Missing (%),71.1%
Missing (n),78549

0,1
320530,24145
320320,2815
320120,2606
Other values (142),2382
(Missing),78549

Value,Count,Frequency (%),Unnamed: 3
320530,24145,21.9%,
320320,2815,2.5%,
320120,2606,2.4%,
320150,1716,1.6%,
320500,82,0.1%,
293135,73,0.1%,
330100,35,0.0%,
310620,30,0.0%,
312770,28,0.0%,
330240,26,0.0%,

0,1
Distinct count,5358
Unique (%),4.8%
Missing (%),39.5%
Missing (n),43680

0,1
6507,1598
6733,1134
5132,921
Other values (5354),63164
(Missing),43680

Value,Count,Frequency (%),Unnamed: 3
6507,1598,1.4%,
6733,1134,1.0%,
5132,921,0.8%,
11809,746,0.7%,
9434,717,0.6%,
9389,616,0.6%,
6734,552,0.5%,
6752,542,0.5%,
8207,527,0.5%,
1109,462,0.4%,

0,1
Distinct count,726
Unique (%),0.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,75.00871
Minimum,0.0
Maximum,814.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,21.0
Q1,37.0
Median,51.0
Q3,70.0
95-th percentile,274.0
Maximum,814.0
Range,814.0
Interquartile range,33.0

0,1
Standard deviation,86.790596
Coef of variation,1.1570735
Kurtosis,14.752261
Mean,75.00871
MAD,47.125946
Skewness,3.6469264
Sum,8288238.0
Variance,7532.6074
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
46.0,2110,1.9%,
45.0,2074,1.9%,
47.0,1976,1.8%,
49.0,1967,1.8%,
40.0,1955,1.8%,
48.0,1953,1.8%,
44.0,1949,1.8%,
50.0,1943,1.8%,
41.0,1941,1.8%,
51.0,1926,1.7%,

Value,Count,Frequency (%),Unnamed: 3
0.0,17,0.0%,
1.0,2,0.0%,
2.0,13,0.0%,
3.0,8,0.0%,
4.0,24,0.0%,

Value,Count,Frequency (%),Unnamed: 3
777.0,1,0.0%,
780.0,2,0.0%,
791.0,1,0.0%,
799.0,1,0.0%,
814.0,1,0.0%,

0,1
Distinct count,1839
Unique (%),1.7%
Missing (%),0.1%
Missing (n),145
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-01 00:00:00
Maximum,2017-07-24 00:00:00

0,1
Distinct count,1375
Unique (%),1.2%
Missing (%),1.4%
Missing (n),1589
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-09 00:00:00
Maximum,2018-02-28 00:00:00

0,1
Distinct count,1045
Unique (%),0.9%
Missing (%),97.3%
Missing (n),107467
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-02-15 00:00:00
Maximum,2018-02-06 00:00:00

0,1
Distinct count,1212
Unique (%),1.1%
Missing (%),94.7%
Missing (n),104618
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-02-17 00:00:00
Maximum,2018-02-20 00:00:00

0,1
Distinct count,434
Unique (%),0.4%
Missing (%),99.1%
Missing (n),109450
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-13 00:00:00
Maximum,2015-01-14 00:00:00

0,1
Distinct count,1042
Unique (%),0.9%
Missing (%),95.8%
Missing (n),105876
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-25 00:00:00
Maximum,2018-01-22 00:00:00

0,1
Distinct count,1636
Unique (%),1.5%
Missing (%),86.2%
Missing (n),95263
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-13 00:00:00
Maximum,2018-02-05 00:00:00

0,1
Distinct count,31294
Unique (%),28.3%
Missing (%),0.2%
Missing (n),244
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,1900-08-10 00:00:00
Maximum,2016-12-30 00:00:00

0,1
Distinct count,1827
Unique (%),1.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-01 00:00:00
Maximum,2016-12-31 00:00:00

0,1
Distinct count,793
Unique (%),0.7%
Missing (%),0.0%
Missing (n),14
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-10 00:00:00
Maximum,2018-02-28 00:00:00

0,1
Distinct count,176
Unique (%),0.2%
Missing (%),80.4%
Missing (n),88846
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-08 00:00:00
Maximum,2015-02-24 00:00:00

0,1
Distinct count,679
Unique (%),0.6%
Missing (%),19.6%
Missing (n),21663
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2012-01-10 00:00:00
Maximum,2018-02-28 00:00:00

0,1
Distinct count,436
Unique (%),0.4%
Missing (%),81.2%
Missing (n),89694
Infinite (%),0.0%
Infinite (n),0

0,1
Minimum,2013-01-01 00:00:00
Maximum,2015-02-05 00:00:00

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),17.4%
Missing (n),19244

0,1
9,26463
2,19812
1,14393
Other values (4),30585
(Missing),19244

Value,Count,Frequency (%),Unnamed: 3
9,26463,23.9%,
2,19812,17.9%,
1,14393,13.0%,
3,13646,12.3%,
4,8969,8.1%,
0,5075,4.6%,
5,2895,2.6%,
(Missing),19244,17.4%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),22.1%
Missing (n),24426

0,1
9,26421
1,24538
0,14380
Other values (4),20732
(Missing),24426

Value,Count,Frequency (%),Unnamed: 3
9,26421,23.9%,
1,24538,22.2%,
0,14380,13.0%,
2,10371,9.4%,
3,7474,6.8%,
5,2379,2.2%,
4,508,0.5%,
(Missing),24426,22.1%,

0,1
Distinct count,14
Unique (%),0.0%
Missing (%),52.3%
Missing (n),57769

0,1
09,16574
10,9864
00,8688
Other values (10),17602
(Missing),57769

Value,Count,Frequency (%),Unnamed: 3
09,16574,15.0%,
10,9864,8.9%,
00,8688,7.9%,
11,3672,3.3%,
12,3645,3.3%,
02,3363,3.0%,
08,1549,1.4%,
01,1546,1.4%,
03,1499,1.4%,
04,1084,1.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.6%
Missing (n),107814

0,1
4,1173
3,639
5,329
Other values (4),542
(Missing),107814

Value,Count,Frequency (%),Unnamed: 3
4,1173,1.1%,
3,639,0.6%,
5,329,0.3%,
9,278,0.3%,
2,126,0.1%,
1,80,0.1%,
0,58,0.1%,
(Missing),107814,97.6%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.6%
Missing (n),107882

0,1
3,1004
2,737
9,277
Other values (4),597
(Missing),107882

Value,Count,Frequency (%),Unnamed: 3
3,1004,0.9%,
2,737,0.7%,
9,277,0.3%,
5,234,0.2%,
1,193,0.2%,
4,91,0.1%,
0,79,0.1%,
(Missing),107882,97.6%,

0,1
Distinct count,14
Unique (%),0.0%
Missing (%),98.5%
Missing (n),108841

0,1
12,398
11,199
06,181
Other values (10),878
(Missing),108841

Value,Count,Frequency (%),Unnamed: 3
12,398,0.4%,
11,199,0.2%,
06,181,0.2%,
08,163,0.1%,
03,150,0.1%,
09,143,0.1%,
04,123,0.1%,
05,76,0.1%,
07,59,0.1%,
02,53,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),100.0%
Missing (n),110496

0,1
VITORIA APART,1
(Missing),110496

Value,Count,Frequency (%),Unnamed: 3
VITORIA APART,1,0.0%,
(Missing),110496,100.0%,

0,1
Distinct count,7
Unique (%),0.0%
Missing (%),11.6%
Missing (n),12839

0,1
2,34125
1,25516
3,21686
Other values (3),16331
(Missing),12839

Value,Count,Frequency (%),Unnamed: 3
2,34125,30.9%,
1,25516,23.1%,
3,21686,19.6%,
9,8436,7.6%,
4,6039,5.5%,
5,1856,1.7%,
(Missing),12839,11.6%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),110397

0,1
1,59
2,28
9,13
(Missing),110397

Value,Count,Frequency (%),Unnamed: 3
1,59,0.1%,
2,28,0.0%,
9,13,0.0%,
(Missing),110397,99.9%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),84.0%
Missing (n),92776

0,1
1,10836
9,3024
2,2225
Other values (2),1636
(Missing),92776

Value,Count,Frequency (%),Unnamed: 3
1,10836,9.8%,
9,3024,2.7%,
2,2225,2.0%,
4,988,0.9%,
3,648,0.6%,
(Missing),92776,84.0%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),85.2%
Missing (n),94134

0,1
3,4631
6,3555
1,3041
Other values (6),5136
(Missing),94134

Value,Count,Frequency (%),Unnamed: 3
3,4631,4.2%,
6,3555,3.2%,
1,3041,2.8%,
4,1847,1.7%,
8,1682,1.5%,
2,1064,1.0%,
7,351,0.3%,
5,185,0.2%,
9,7,0.0%,
(Missing),94134,85.2%,

0,1
Distinct count,52
Unique (%),0.0%
Missing (%),97.3%
Missing (n),107539

0,1
SXXXXX,597
XXSXXX,265
SSXXXX,244
Other values (48),1852
(Missing),107539

Value,Count,Frequency (%),Unnamed: 3
SXXXXX,597,0.5%,
XXSXXX,265,0.2%,
SSXXXX,244,0.2%,
SXSXXX,238,0.2%,
XXXXXS,203,0.2%,
XXXSXX,196,0.2%,
XXXXSX,127,0.1%,
SXXXXS,113,0.1%,
SXXSXX,106,0.1%,
SXSSXX,79,0.1%,

0,1
Distinct count,39
Unique (%),0.0%
Missing (%),80.1%
Missing (n),88467

0,1
XXXXXXX,21497
SXSSXXX,95
XXXSXXX,88
Other values (35),350
(Missing),88467

Value,Count,Frequency (%),Unnamed: 3
XXXXXXX,21497,19.5%,
SXSSXXX,95,0.1%,
XXXSXXX,88,0.1%,
XXSXXXX,81,0.1%,
SXXSXXX,80,0.1%,
SXSXXXX,41,0.0%,
SXXXXXX,26,0.0%,
XXSSXXX,26,0.0%,
XXSXSXX,9,0.0%,
SXSSSXX,8,0.0%,

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),97.6%
Missing (n),107863

0,1
5,829
2,586
4,548
Other values (4),671
(Missing),107863

Value,Count,Frequency (%),Unnamed: 3
5,829,0.8%,
2,586,0.5%,
4,548,0.5%,
3,451,0.4%,
1,154,0.1%,
9,47,0.0%,
6,19,0.0%,
(Missing),107863,97.6%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.4%
Missing (n),107674

0,1
1,2516
2,239
9,55
(Missing),107674

Value,Count,Frequency (%),Unnamed: 3
1,2516,2.3%,
2,239,0.2%,
9,55,0.0%,
3,13,0.0%,
(Missing),107674,97.4%,

0,1
Distinct count,1440
Unique (%),1.3%
Missing (%),10.8%
Missing (n),11973
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1195.1311
Minimum,0.0
Maximum,2359.0
Zeros (%),0.2%

0,1
Minimum,0.0
5-th percentile,125.0
Q1,622.0
Median,1200.0
Q3,1800.0
95-th percentile,2240.0
Maximum,2359.0
Range,2359.0
Interquartile range,1178.0

0,1
Standard deviation,675.3164
Coef of variation,0.5650563
Kurtosis,-1.1667507
Mean,1195.1311
MAD,584.2378
Skewness,0.0035498044
Sum,117749096.0
Variance,456052.28
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,1379,1.2%,
500.0,1193,1.1%,
800.0,1095,1.0%,
900.0,1084,1.0%,
700.0,1075,1.0%,
1700.0,1030,0.9%,
1000.0,1000,0.9%,
1600.0,996,0.9%,
2200.0,982,0.9%,
1800.0,966,0.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,259,0.2%,
1.0,35,0.0%,
2.0,27,0.0%,
3.0,12,0.0%,
4.0,10,0.0%,

Value,Count,Frequency (%),Unnamed: 3
2355.0,168,0.2%,
2356.0,13,0.0%,
2357.0,16,0.0%,
2358.0,24,0.0%,
2359.0,14,0.0%,

0,1
Distinct count,225
Unique (%),0.2%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,457.10965
Minimum,1.0
Maximum,999.0
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,417.0
Q1,449.0
Median,467.0
Q3,481.0
95-th percentile,492.0
Maximum,999.0
Range,998.0
Interquartile range,32.0

0,1
Standard deviation,51.633976
Coef of variation,0.11295753
Kurtosis,33.89347
Mean,457.10965
MAD,26.055868
Skewness,-3.4106576
Sum,50509244.0
Variance,2666.0676
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
483.0,2365,2.1%,
481.0,2345,2.1%,
484.0,2320,2.1%,
482.0,2317,2.1%,
477.0,2308,2.1%,
485.0,2249,2.0%,
480.0,2237,2.0%,
479.0,2221,2.0%,
476.0,2218,2.0%,
478.0,2213,2.0%,

Value,Count,Frequency (%),Unnamed: 3
1.0,31,0.0%,
2.0,4,0.0%,
3.0,9,0.0%,
4.0,1,0.0%,
5.0,21,0.0%,

Value,Count,Frequency (%),Unnamed: 3
512.0,3,0.0%,
513.0,1,0.0%,
514.0,1,0.0%,
515.0,1,0.0%,
999.0,84,0.1%,

0,1
Distinct count,37
Unique (%),0.0%
Missing (%),97.6%
Missing (n),107852
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,26.657845
Minimum,9.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,9.0
5-th percentile,16.0
Q1,20.0
Median,26.0
Q3,32.0
95-th percentile,39.0
Maximum,99.0
Range,90.0
Interquartile range,12.0

0,1
Standard deviation,8.036212
Coef of variation,0.30145767
Kurtosis,15.773857
Mean,26.657845
MAD,6.171453
Skewness,2.0608222
Sum,70510.0
Variance,64.580696
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
26.0,143,0.1%,
18.0,132,0.1%,
25.0,132,0.1%,
19.0,128,0.1%,
30.0,125,0.1%,
20.0,120,0.1%,
22.0,118,0.1%,
29.0,116,0.1%,
24.0,116,0.1%,
28.0,115,0.1%,

Value,Count,Frequency (%),Unnamed: 3
9.0,1,0.0%,
13.0,4,0.0%,
14.0,27,0.0%,
15.0,51,0.0%,
16.0,93,0.1%,

Value,Count,Frequency (%),Unnamed: 3
43.0,14,0.0%,
44.0,5,0.0%,
45.0,2,0.0%,
46.0,1,0.0%,
99.0,7,0.0%,

0,1
Distinct count,2535
Unique (%),2.3%
Missing (%),2.3%
Missing (n),2526

0,1
*A419,18315
*R688,6223
*R092,6185
Other values (2531),77248

Value,Count,Frequency (%),Unnamed: 3
*A419,18315,16.6%,
*R688,6223,5.6%,
*R092,6185,5.6%,
*I219,5808,5.3%,
*J969,5466,4.9%,
*J960,4717,4.3%,
*J81X,4236,3.8%,
*R570,3108,2.8%,
*T792,2134,1.9%,
*J189,1920,1.7%,

0,1
Distinct count,3660
Unique (%),3.3%
Missing (%),17.0%
Missing (n),18827

0,1
*J189,8085
*A419,5058
*I10X,3608
Other values (3656),74919
(Missing),18827

Value,Count,Frequency (%),Unnamed: 3
*J189,8085,7.3%,
*A419,5058,4.6%,
*I10X,3608,3.3%,
*I219,3514,3.2%,
*S069,2522,2.3%,
*I500,1876,1.7%,
*N390,1605,1.5%,
*J180,1575,1.4%,
*J159,1464,1.3%,
*I509,1268,1.1%,

0,1
Distinct count,3695
Unique (%),3.3%
Missing (%),41.8%
Missing (n),46133

0,1
*I10X,5072
*J189,2914
*J449,1480
Other values (3691),54898
(Missing),46133

Value,Count,Frequency (%),Unnamed: 3
*I10X,5072,4.6%,
*J189,2914,2.6%,
*J449,1480,1.3%,
*X954,1416,1.3%,
*E149,1411,1.3%,
*I709,1229,1.1%,
*I219,1141,1.0%,
*I251,1126,1.0%,
*I64X,1086,1.0%,
*I500,1044,0.9%,

0,1
Distinct count,2629
Unique (%),2.4%
Missing (%),74.2%
Missing (n),81935

0,1
*I10X,4130
*E149,1385
*F102,1011
Other values (2625),22036
(Missing),81935

Value,Count,Frequency (%),Unnamed: 3
*I10X,4130,3.7%,
*E149,1385,1.3%,
*F102,1011,0.9%,
*J449,586,0.5%,
*G309,557,0.5%,
*I709,529,0.5%,
*F172,523,0.5%,
*J189,515,0.5%,
*I694,493,0.4%,
*N189,424,0.4%,

0,1
Distinct count,8104
Unique (%),7.3%
Missing (%),66.4%
Missing (n),73327

0,1
*I10X,3689
*E149,1574
*I10X*E149,1247
Other values (8100),30660
(Missing),73327

Value,Count,Frequency (%),Unnamed: 3
*I10X,3689,3.3%,
*E149,1574,1.4%,
*I10X*E149,1247,1.1%,
*F172,899,0.8%,
*F102,722,0.7%,
*R54X,713,0.6%,
*N189,680,0.6%,
*G309,668,0.6%,
*N179,567,0.5%,
*E149*I10,431,0.4%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,76410
3,18486
4,7752
Other values (3),7849

Value,Count,Frequency (%),Unnamed: 3
1,76410,69.2%,
3,18486,16.7%,
4,7752,7.0%,
2,4172,3.8%,
5,3368,3.0%,
9,309,0.3%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),97.3%
Missing (n),107525

0,1
3,2752
9,206
1,12
(Missing),107525

Value,Count,Frequency (%),Unnamed: 3
3,2752,2.5%,
9,206,0.2%,
1,12,0.0%,
2,2,0.0%,
(Missing),107525,97.3%,

0,1
Distinct count,82
Unique (%),0.1%
Missing (%),43.3%
Missing (n),47837

0,1
832,41552
831,8153
800,5955
Other values (78),7000
(Missing),47837

Value,Count,Frequency (%),Unnamed: 3
832,41552,37.6%,
831,8153,7.4%,
800,5955,5.4%,
829,3194,2.9%,
833,1811,1.6%,
835,392,0.4%,
826,229,0.2%,
823,171,0.2%,
827,149,0.1%,
190,111,0.1%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),7.1%
Missing (n),7836

0,1
2,67747
1,30281
9,4633
(Missing),7836

Value,Count,Frequency (%),Unnamed: 3
2,67747,61.3%,
1,30281,27.4%,
9,4633,4.2%,
(Missing),7836,7.1%,

0,1
Distinct count,236
Unique (%),0.2%
Missing (%),99.5%
Missing (n),109906
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,134.08122
Minimum,17.0
Maximum,607.0
Zeros (%),0.0%

0,1
Minimum,17.0
5-th percentile,43.0
Q1,77.0
Median,108.0
Q3,166.0
95-th percentile,315.0
Maximum,607.0
Range,590.0
Interquartile range,89.0

0,1
Standard deviation,91.67381
Coef of variation,0.6837185
Kurtosis,5.2567425
Mean,134.08122
MAD,65.89674
Skewness,2.0141628
Sum,79242.0
Variance,8404.088
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
108.0,12,0.0%,
120.0,11,0.0%,
113.0,10,0.0%,
85.0,10,0.0%,
87.0,9,0.0%,
112.0,9,0.0%,
101.0,9,0.0%,
100.0,8,0.0%,
81.0,8,0.0%,
109.0,8,0.0%,

Value,Count,Frequency (%),Unnamed: 3
17.0,1,0.0%,
19.0,1,0.0%,
20.0,3,0.0%,
25.0,1,0.0%,
29.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
532.0,1,0.0%,
539.0,1,0.0%,
575.0,1,0.0%,
587.0,1,0.0%,
607.0,1,0.0%,

0,1
Distinct count,326
Unique (%),0.3%
Missing (%),96.9%
Missing (n),107043
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,90.897224
Minimum,0.0
Maximum,547.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,23.0
Q1,52.0
Median,77.0
Q3,110.75
95-th percentile,219.0
Maximum,547.0
Range,547.0
Interquartile range,58.75

0,1
Standard deviation,62.802937
Coef of variation,0.6909225
Kurtosis,6.941618
Mean,90.897224
MAD,43.52176
Skewness,2.1581578
Sum,313959.0
Variance,3944.2087
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
72.0,45,0.0%,
60.0,44,0.0%,
54.0,42,0.0%,
68.0,41,0.0%,
77.0,41,0.0%,
58.0,41,0.0%,
55.0,40,0.0%,
73.0,39,0.0%,
51.0,38,0.0%,
56.0,38,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,3,0.0%,
1.0,1,0.0%,
2.0,1,0.0%,
3.0,1,0.0%,
4.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
466.0,1,0.0%,
472.0,1,0.0%,
487.0,1,0.0%,
523.0,1,0.0%,
547.0,1,0.0%,

0,1
Distinct count,414
Unique (%),0.4%
Missing (%),94.7%
Missing (n),104648
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,108.88665
Minimum,11.0
Maximum,750.0
Zeros (%),0.0%

0,1
Minimum,11.0
5-th percentile,34.0
Q1,60.0
Median,87.0
Q3,128.0
95-th percentile,271.6
Maximum,750.0
Range,739.0
Interquartile range,68.0

0,1
Standard deviation,78.16301
Coef of variation,0.7178383
Kurtosis,8.3117
Mean,108.88665
MAD,53.740532
Skewness,2.3764334
Sum,636878.0
Variance,6109.4565
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
65.0,81,0.1%,
63.0,73,0.1%,
64.0,73,0.1%,
57.0,70,0.1%,
59.0,70,0.1%,
55.0,65,0.1%,
67.0,63,0.1%,
77.0,62,0.1%,
74.0,62,0.1%,
61.0,61,0.1%,

Value,Count,Frequency (%),Unnamed: 3
11.0,2,0.0%,
12.0,2,0.0%,
14.0,5,0.0%,
15.0,2,0.0%,
16.0,5,0.0%,

Value,Count,Frequency (%),Unnamed: 3
683.0,1,0.0%,
694.0,1,0.0%,
704.0,1,0.0%,
723.0,1,0.0%,
750.0,1,0.0%,

0,1
Distinct count,1501
Unique (%),1.4%
Missing (%),98.6%
Missing (n),108992

0,1
59425948,2
62103604,2
59410472,2
Other values (1497),1499
(Missing),108992

Value,Count,Frequency (%),Unnamed: 3
59425948,2,0.0%,
62103604,2,0.0%,
59410472,2,0.0%,
59410319,2,0.0%,
64290701,2,0.0%,
67400610,1,0.0%,
62105957,1,0.0%,
68811727,1,0.0%,
64333928,1,0.0%,
64341094,1,0.0%,

0,1
Distinct count,110494
Unique (%),100.0%
Missing (%),0.0%
Missing (n),0

0,1
19458646,2
20908246,2
18178000,2
Other values (110491),110491

Value,Count,Frequency (%),Unnamed: 3
19458646,2,0.0%,
20908246,2,0.0%,
18178000,2,0.0%,
20902805,1,0.0%,
18174562,1,0.0%,
16750804,1,0.0%,
18738358,1,0.0%,
23735172,1,0.0%,
23746108,1,0.0%,
22206107,1,0.0%,

0,1
Distinct count,11
Unique (%),0.0%
Missing (%),0.0%
Missing (n),22

0,1
0,20036
9,10099
8,10085
Other values (7),70255

Value,Count,Frequency (%),Unnamed: 3
0,20036,18.1%,
9,10099,9.1%,
8,10085,9.1%,
6,10074,9.1%,
3,10063,9.1%,
2,10061,9.1%,
5,10046,9.1%,
1,10014,9.1%,
7,10005,9.1%,
4,9992,9.0%,

0,1
Distinct count,262
Unique (%),0.2%
Missing (%),39.2%
Missing (n),43268

0,1
20150005,1085
20150008,1039
20150007,1030
Other values (258),64075
(Missing),43268

Value,Count,Frequency (%),Unnamed: 3
20150005,1085,1.0%,
20150008,1039,0.9%,
20150007,1030,0.9%,
20150010,1023,0.9%,
20150013,1004,0.9%,
20160011,983,0.9%,
20140035,920,0.8%,
20150023,884,0.8%,
20140019,848,0.8%,
20150004,828,0.7%,

0,1
Distinct count,18043
Unique (%),16.3%
Missing (%),80.6%
Missing (n),89036

0,1
4998,5
4942,5
3058,5
Other values (18039),21446
(Missing),89036

Value,Count,Frequency (%),Unnamed: 3
4998,5,0.0%,
4942,5,0.0%,
3058,5,0.0%,
3073,5,0.0%,
3124,5,0.0%,
5016,5,0.0%,
4925,5,0.0%,
530,5,0.0%,
2318,5,0.0%,
3113,5,0.0%,

0,1
Distinct count,10010
Unique (%),9.1%
Missing (%),90.9%
Missing (n),100482

0,1
000000000000000,6
700209425752721,2
703608000214230,1
Other values (10006),10006
(Missing),100482

Value,Count,Frequency (%),Unnamed: 3
000000000000000,6,0.0%,
700209425752721,2,0.0%,
703608000214230,1,0.0%,
898003042362363,1,0.0%,
706203580966164,1,0.0%,
858004243407853,1,0.0%,
200997891450018,1,0.0%,
898001223910336,1,0.0%,
700508182314755,1,0.0%,
000000003093332,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),91.9%
Missing (n),101581

0,1
2,6341
9,2480
1,95
(Missing),101581

Value,Count,Frequency (%),Unnamed: 3
2,6341,5.7%,
9,2480,2.2%,
1,95,0.1%,
(Missing),101581,91.9%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),97.4%
Missing (n),107669

0,1
3,2795
9,33
(Missing),107669

Value,Count,Frequency (%),Unnamed: 3
3,2795,2.5%,
9,33,0.0%,
(Missing),107669,97.4%,

0,1
Distinct count,5
Unique (%),0.0%
Missing (%),91.9%
Missing (n),101581

0,1
3,6236
9,2480
1,110
(Missing),101581

Value,Count,Frequency (%),Unnamed: 3
3,6236,5.6%,
9,2480,2.2%,
1,110,0.1%,
2,90,0.1%,
(Missing),101581,91.9%,

0,1
Distinct count,1054
Unique (%),1.0%
Missing (%),23.2%
Missing (n),25619

0,1
999993,31649
999992,13691
621005,11141
Other values (1050),28397
(Missing),25619

Value,Count,Frequency (%),Unnamed: 3
999993,31649,28.6%,
999992,13691,12.4%,
621005,11141,10.1%,
715210,3142,2.8%,
999991,1620,1.5%,
622020,1279,1.2%,
512105,1075,1.0%,
141410,1065,1.0%,
354705,963,0.9%,
782305,810,0.7%,

0,1
Distinct count,200
Unique (%),0.2%
Missing (%),98.1%
Missing (n),108353

0,1
999992,1036
999991,179
621005,90
Other values (196),839
(Missing),108353

Value,Count,Frequency (%),Unnamed: 3
999992,1036,0.9%,
999991,179,0.2%,
621005,90,0.1%,
411010,36,0.0%,
521110,36,0.0%,
421125,34,0.0%,
512105,33,0.0%,
322205,26,0.0%,
999994,25,0.0%,
622020,24,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,110483
2,13
3,1

Value,Count,Frequency (%),Unnamed: 3
1,110483,100.0%,
2,13,0.0%,
3,1,0.0%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),97.4%
Missing (n),107678

0,1
2,1589
1,1162
9,68
(Missing),107678

Value,Count,Frequency (%),Unnamed: 3
2,1589,1.4%,
1,1162,1.1%,
9,68,0.1%,
(Missing),107678,97.4%,

0,1
Distinct count,848
Unique (%),0.8%
Missing (%),97.6%
Missing (n),107836
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,1885.8118
Minimum,99.0
Maximum,5515.0
Zeros (%),0.0%

0,1
Minimum,99.0
5-th percentile,496.0
Q1,880.0
Median,1700.0
Q3,2825.0
95-th percentile,3690.0
Maximum,5515.0
Range,5416.0
Interquartile range,1945.0

0,1
Standard deviation,1100.8094
Coef of variation,0.5837324
Kurtosis,-1.0024577
Mean,1885.8118
MAD,969.7868
Skewness,0.38724148
Sum,5018145.0
Variance,1211781.4
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
600.0,22,0.0%,
2800.0,21,0.0%,
700.0,15,0.0%,
3000.0,15,0.0%,
2700.0,15,0.0%,
900.0,15,0.0%,
550.0,14,0.0%,
1000.0,14,0.0%,
800.0,12,0.0%,
770.0,12,0.0%,

Value,Count,Frequency (%),Unnamed: 3
99.0,1,0.0%,
160.0,1,0.0%,
190.0,1,0.0%,
245.0,1,0.0%,
268.0,1,0.0%,

Value,Count,Frequency (%),Unnamed: 3
4910.0,1,0.0%,
4965.0,1,0.0%,
5300.0,1,0.0%,
5345.0,1,0.0%,
5515.0,1,0.0%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),97.9%
Missing (n),108214
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,2.7516425
Minimum,0.0
Maximum,99.0
Zeros (%),1.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,0.0
Median,0.0
Q3,1.0
95-th percentile,2.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,15.143315
Coef of variation,5.503373
Kurtosis,36.431595
Mean,2.7516425
MAD,4.668275
Skewness,6.189133
Sum,6282.0
Variance,229.31999
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
0.0,1617,1.5%,
1.0,454,0.4%,
2.0,112,0.1%,
99.0,55,0.0%,
3.0,32,0.0%,
4.0,8,0.0%,
5.0,4,0.0%,
11.0,1,0.0%,
(Missing),108214,97.9%,

Value,Count,Frequency (%),Unnamed: 3
0.0,1617,1.5%,
1.0,454,0.4%,
2.0,112,0.1%,
3.0,32,0.0%,
4.0,8,0.0%,

Value,Count,Frequency (%),Unnamed: 3
3.0,32,0.0%,
4.0,8,0.0%,
5.0,4,0.0%,
11.0,1,0.0%,
99.0,55,0.0%,

0,1
Distinct count,14
Unique (%),0.0%
Missing (%),97.7%
Missing (n),107955
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,3.0952005
Minimum,0.0
Maximum,99.0
Zeros (%),0.5%

0,1
Minimum,0.0
5-th percentile,0.0
Q1,1.0
Median,1.0
Q3,2.0
95-th percentile,5.0
Maximum,99.0
Range,99.0
Interquartile range,1.0

0,1
Standard deviation,12.066113
Coef of variation,3.8983302
Kurtosis,58.399555
Mean,3.0952005
MAD,3.318842
Skewness,7.708784
Sum,7868.0
Variance,145.5911
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
1.0,952,0.9%,
2.0,551,0.5%,
0.0,516,0.5%,
3.0,242,0.2%,
4.0,114,0.1%,
5.0,65,0.1%,
99.0,39,0.0%,
6.0,29,0.0%,
7.0,18,0.0%,
8.0,6,0.0%,

Value,Count,Frequency (%),Unnamed: 3
0.0,516,0.5%,
1.0,952,0.9%,
2.0,551,0.5%,
3.0,242,0.2%,
4.0,114,0.1%,

Value,Count,Frequency (%),Unnamed: 3
8.0,6,0.0%,
9.0,5,0.0%,
10.0,2,0.0%,
11.0,3,0.0%,
99.0,39,0.0%,

0,1
Distinct count,6
Unique (%),0.0%
Missing (%),12.1%
Missing (n),13358

0,1
1,44673
4,42425
2,9637
Other values (2),404
(Missing),13358

Value,Count,Frequency (%),Unnamed: 3
1,44673,40.4%,
4,42425,38.4%,
2,9637,8.7%,
3,285,0.3%,
5,119,0.1%,
(Missing),13358,12.1%,

0,1
Distinct count,36
Unique (%),0.0%
Missing (%),97.6%
Missing (n),107870
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,32.647125
Minimum,0.0
Maximum,99.0
Zeros (%),0.0%

0,1
Minimum,0.0
5-th percentile,22.0
Q1,27.0
Median,33.0
Q3,38.0
95-th percentile,40.0
Maximum,99.0
Range,99.0
Interquartile range,11.0

0,1
Standard deviation,11.72508
Coef of variation,0.35914585
Kurtosis,16.75856
Mean,32.647125
MAD,6.9837885
Skewness,2.720046
Sum,85764.0
Variance,137.4775
Memory size,431.7 KiB

Value,Count,Frequency (%),Unnamed: 3
39.0,223,0.2%,
38.0,215,0.2%,
40.0,186,0.2%,
28.0,152,0.1%,
26.0,143,0.1%,
37.0,142,0.1%,
36.0,122,0.1%,
27.0,118,0.1%,
32.0,115,0.1%,
29.0,108,0.1%,

Value,Count,Frequency (%),Unnamed: 3
0.0,12,0.0%,
1.0,22,0.0%,
2.0,14,0.0%,
3.0,9,0.0%,
4.0,2,0.0%,

Value,Count,Frequency (%),Unnamed: 3
40.0,186,0.2%,
41.0,61,0.1%,
42.0,18,0.0%,
43.0,1,0.0%,
99.0,47,0.0%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),89.1%
Missing (n),98446

0,1
4,4738
3,1901
8,1483
Other values (5),3929
(Missing),98446

Value,Count,Frequency (%),Unnamed: 3
4,4738,4.3%,
3,1901,1.7%,
8,1483,1.3%,
5,1212,1.1%,
2,969,0.9%,
1,697,0.6%,
7,529,0.5%,
6,522,0.5%,
(Missing),98446,89.1%,

0,1
Distinct count,9
Unique (%),0.0%
Missing (%),99.2%
Missing (n),109652

0,1
3,248
8,168
5,85
Other values (5),344
(Missing),109652

Value,Count,Frequency (%),Unnamed: 3
3,248,0.2%,
8,168,0.2%,
5,85,0.1%,
7,82,0.1%,
1,74,0.1%,
4,69,0.1%,
6,61,0.1%,
2,58,0.1%,
(Missing),109652,99.2%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
1,64597
2,45876
0,24

Value,Count,Frequency (%),Unnamed: 3
1,64597,58.5%,
2,45876,41.5%,
0,24,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),39.2%
Missing (n),43282

0,1
S,67210
N,5
(Missing),43282

Value,Count,Frequency (%),Unnamed: 3
S,67210,60.8%,
N,5,0.0%,
(Missing),43282,39.2%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),1

0,1
Mean,0.0

0,1
0.0,110496
(Missing),1

Value,Count,Frequency (%),Unnamed: 3
0.0,110496,100.0%,
(Missing),1,0.0%,

0,1
Distinct count,2
Unique (%),0.0%
Missing (%),0.0%
Missing (n),0

0,1
Mean,0.80106246

0,1
1.0,88515
0.0,21982

Value,Count,Frequency (%),Unnamed: 3
1.0,88515,80.1%,
0.0,21982,19.9%,

0,1
Constant value,2

0,1
Distinct count,8
Unique (%),0.0%
Missing (%),91.9%
Missing (n),101587

0,1
8,6136
9,2480
4,110
Other values (4),184
(Missing),101587

Value,Count,Frequency (%),Unnamed: 3
8,6136,5.6%,
9,2480,2.2%,
4,110,0.1%,
5,89,0.1%,
1,71,0.1%,
2,18,0.0%,
3,6,0.0%,
(Missing),101587,91.9%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),96.8%
Missing (n),107002

0,1
M,3483
R,6
E,6
(Missing),107002

Value,Count,Frequency (%),Unnamed: 3
M,3483,3.2%,
R,6,0.0%,
E,6,0.0%,
(Missing),107002,96.8%,

0,1
Distinct count,10
Unique (%),0.0%
Missing (%),94.7%
Missing (n),104618

0,1
9,4763
8,869
5,102
Other values (6),145
(Missing),104618

Value,Count,Frequency (%),Unnamed: 3
9,4763,4.3%,
8,869,0.8%,
5,102,0.1%,
6,66,0.1%,
1,48,0.0%,
4,20,0.0%,
3,6,0.0%,
7,4,0.0%,
2,1,0.0%,
(Missing),104618,94.7%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),0.8%
Missing (n),914

0,1
N,93024
S,16559
(Missing),914

Value,Count,Frequency (%),Unnamed: 3
N,93024,84.2%,
S,16559,15.0%,
(Missing),914,0.8%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),99.9%
Missing (n),110348

0,1
1,92
2,44
3,13
(Missing),110348

Value,Count,Frequency (%),Unnamed: 3
1,92,0.1%,
2,44,0.0%,
3,13,0.0%,
(Missing),110348,99.9%,

0,1
Distinct count,22868
Unique (%),20.7%
Missing (%),0.0%
Missing (n),0
Infinite (%),0.0%
Infinite (n),0

0,1
Mean,11055
Minimum,1
Maximum,22868
Zeros (%),0.0%

0,1
Minimum,1.0
5-th percentile,1105.8
Q1,5525.0
Median,11050.0
Q3,16575.0
95-th percentile,20995.0
Maximum,22868.0
Range,22867.0
Interquartile range,11050.0

0,1
Standard deviation,6388.1
Coef of variation,0.57784
Kurtosis,-1.1934
Mean,11055
MAD,5529.8
Skewness,0.0046952
Sum,1221556151
Variance,40808000
Memory size,863.3 KiB

Value,Count,Frequency (%),Unnamed: 3
2047,5,0.0%,
8022,5,0.0%,
20252,5,0.0%,
18205,5,0.0%,
12112,5,0.0%,
10065,5,0.0%,
16210,5,0.0%,
14163,5,0.0%,
3924,5,0.0%,
1877,5,0.0%,

Value,Count,Frequency (%),Unnamed: 3
1,5,0.0%,
2,5,0.0%,
3,5,0.0%,
4,5,0.0%,
5,5,0.0%,

Value,Count,Frequency (%),Unnamed: 3
22864,1,0.0%,
22865,1,0.0%,
22866,1,0.0%,
22867,1,0.0%,
22868,1,0.0%,

0,1
Distinct count,3
Unique (%),0.0%
Missing (%),39.2%
Missing (n),43292

0,1
3.2,67204
2.2,1
(Missing),43292

Value,Count,Frequency (%),Unnamed: 3
3.2,67204,60.8%,
2.2,1,0.0%,
(Missing),43292,39.2%,

0,1
Distinct count,4
Unique (%),0.0%
Missing (%),39.2%
Missing (n),43268

0,1
3.2.00,67082
3.2.02,104
3.2.01,43
(Missing),43268

Value,Count,Frequency (%),Unnamed: 3
3.2.00,67082,60.7%,
3.2.02,104,0.1%,
3.2.01,43,0.0%,
(Missing),43268,39.2%,

Unnamed: 0.1,ACIDTRAB,ASSISTMED,ATESTANTE,CAUSABAS,CAUSABAS_O,CAUSAMAT,CIRCOBITO,CIRURGIA,CODESTAB,CODINST,CODMUNOCOR,CODMUNRES,COMUNSVOIM,DIFDATA,DTATESTADO,DTCADASTRO,DTCADINF,DTCADINV,DTCONCASO,DTINVESTIG,DTNASC,DTOBITO,DTRECEBIM,DTRECORIGA,ESC,ESC2010,ESCMAE,ESCMAE2010,ESTCIV,EXAME,FONTE,FONTEINV,GESTACAO,GRAVIDEZ,HORAOBITO,IDADE,IDADEMAE,LINHAA,LINHAB,LINHAC,LINHAD,LINHAII,LOCOCOR,MORTEPARTO,NATURAL,NECROPSIA,NUDIASOBIN,NUMERODN,NUMERODO,NUMERODV,NUMSUS,OBITOGRAV,OBITOPARTO,OBITOPUERP,OCUP,OCUPMAE,ORIGEM,PARTO,PESO,QTDFILMORT,QTDFILVIVO,RACACOR,SEMAGESTAC,SERIESCFAL,SERIESCMAE,SEXO,STDOEPIDEM,STDONOVA,TIPOBITO,TPMORTEOCO,TPOBITOCOR,TPPOS,Unnamed: 0,CODCART,CODMUNCART,DTCONINV,DTRECORIG,DTREGCART,NUMREGCART,ALTCAUSA,ATESTADO,CB_PRE,CODIFICADO,CODMUNNATU,CRM,ESCFALAGR1,ESCMAEAGR1,ESTABDESCR,FONTES,FONTESINF,NUDIASINF,NUDIASOBCO,NUMEROLOTE,STCODIFICA,TPNIVELINV,TPRESGINFO,VERSAOSCB,VERSAOSIST
0,,1,5,I10,I10,,,,,MES3205200001,320520,320520,,69.0,2012-03-08,2012-04-26,NaT,NaT,NaT,NaT,1935-01-10,2012-03-08,2012-05-16,2012-05-16,4,,,,1,,,,,,1930.0,477.0,,*R092,*I10X,,,,3,,832,,,,4282305,,,,,,999993,,1,,,,,1,,,,1,0.0,0.0,2,,,N,1,,,NaT,NaT,NaT,,,,,,,,,,,,,,,,,,,,
1,,9,2,N390,N390,,,9.0,,MES3205300001,320530,320530,,57.0,2012-02-23,2012-03-13,NaT,NaT,NaT,NaT,1939-08-03,2012-02-23,2012-04-20,2012-04-20,4,,,,9,2.0,,,,,850.0,472.0,,*R688,*A419,*N390,,*C719,3,,832,9.0,,,6366366,,,,,,999993,,1,,,,,1,,,,2,0.0,0.0,2,,,N,2,,,NaT,NaT,NaT,,,,,,,,,,,,,,,,,,,,
2,,1,1,I132,I132,,,2.0,,MES3205200001,320520,320520,,59.0,2012-01-25,2012-03-14,NaT,NaT,NaT,NaT,1931-10-25,2012-01-24,2012-03-23,2012-03-23,1,,,,2,9.0,,,,,2040.0,480.0,,*I500,*I351,*I10X,*N189,,3,,832,2.0,,,7154314,,,,,,715210,,1,,,,,1,,,,1,0.0,0.0,2,,,N,3,,,NaT,NaT,NaT,,,,,,,,,,,,,,,,,,,,
3,,1,1,I219,I219,,,2.0,,MES3205200001,320520,320520,,60.0,2012-01-23,2012-03-14,NaT,NaT,NaT,NaT,1921-03-03,2012-01-23,2012-03-23,2012-03-23,3,,,,1,2.0,,,,,1300.0,490.0,,*I219,*J969,,,,3,,832,2.0,,,7473127,,,,,,351505,,1,,,,,1,,,,2,0.0,0.0,2,,,N,4,,,NaT,NaT,NaT,,,,,,,,,,,,,,,,,,,,
4,,9,1,J440,J440,,,9.0,11835.0,MES3205300001,320530,320510,,59.0,2012-08-13,2012-09-18,NaT,NaT,NaT,NaT,1935-04-19,2012-08-13,2012-10-11,2012-10-11,1,,,,2,9.0,,,,,900.0,477.0,,*J969,*J189,*I219,*J449,*I10X*I252,2,,832,9.0,,,9947827,,,,,,999993,,1,,,,,1,,,,1,0.0,0.0,2,,,N,5,,,NaT,NaT,NaT,,,,,,,,,,,,,,,,,,,,
