In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Render matplotlib figures inline in the notebook output.
%matplotlib inline
# Raise the column display limit to 500 so wide frames are shown without truncation.
pd.set_option('display.max_columns',500)
# Apply seaborn's default plot styling to subsequent matplotlib figures.
sns.set()

In [9]:
def top_value_counts(df, n=5, only_categories = True, cols_to_include = None):
    """Summarise the most frequent values of each column, side by side.

    Every selected column contributes two adjacent columns to the result:

    * one named after the source column, holding the label ``'n_unique'``
      followed by the ``n`` most frequent values;
    * one named with the column's 0-based position among the selected
      columns (``0``, ``1``, ...), holding the distinct-value count
      followed by the frequency of each of those values.

    Columns with fewer than ``n`` distinct values are padded with ``'-'`` so
    that every output column has exactly ``n + 1`` rows.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame to summarise.
    n : int, default 5
        Number of top values to report per column.
    only_categories : bool, default True
        If true, keep only object and categorical columns.
    cols_to_include : sequence of column labels, optional
        Restrict the summary to these columns (applied before the dtype
        filter). ``None`` or an empty sequence means "all columns".

    Returns
    -------
    pandas.DataFrame
        Summary table with ``n + 1`` rows and two columns per source column.

    Notes
    -----
    Missing values are counted among the top values (``dropna=False``) but
    are not included in the ``n_unique`` figure, because ``nunique`` skips
    them by default.
    """
    # Explicit None/length test: truth-testing a pandas Index or numpy array
    # raises ValueError, while an empty selection must still mean "no filter".
    if cols_to_include is not None and len(cols_to_include) > 0:
        if isinstance(cols_to_include, str):
            # A bare string would otherwise be split into characters below.
            cols_to_include = [cols_to_include]
        df = df[list(cols_to_include)]
    if only_categories:
        df = df.select_dtypes(include=['O','category'])

    summary = {}
    for position, col in enumerate(df.columns):
        # .iloc keeps the slice positional even when the value_counts index
        # is numeric (plain [] slicing can be label-based on a float index).
        counts = df[col].value_counts(dropna=False).iloc[:n]
        names = list(counts.index)
        freqs = list(counts)
        # Pad short columns so every output column has the same length.
        padding = ['-'] * (n - len(freqs))
        summary[col] = ['n_unique'] + names + padding
        summary[position] = [df[col].nunique()] + freqs + padding
    # Build the frame once instead of inserting columns one at a time.
    return pd.DataFrame(summary)

In [4]:
# Load the SVI 2016 table from a CSV file in the working directory.
# NOTE(review): the loaded rows contain many -999.0 values, presumably a
# missing-data sentinel — confirm against the data dictionary and consider
# passing na_values to read_csv so they load as NaN.
svi = pd.read_csv('SVI2016_US.csv')

In [5]:
# Row/column counts, dtype breakdown and memory usage of the loaded frame.
svi.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 72836 entries, 0 to 72835
Columns: 125 entries, FID to E_DAYPOP
dtypes: float64(117), int64(4), object(4)
memory usage: 69.5+ MB


In [6]:
# Preview the first five rows.
svi.head()

Unnamed: 0,FID,ST,STATE,ST_ABBR,STCNTY,COUNTY,FIPS,LOCATION,AREA_SQMI,E_TOTPOP,M_TOTPOP,E_HU,M_HU,E_HH,M_HH,E_POV,M_POV,E_UNEMP,M_UNEMP,E_PCI,M_PCI,E_NOHSDP,M_NOHSDP,E_AGE65,M_AGE65,E_AGE17,M_AGE17,E_DISABL,M_DISABL,E_SNGPNT,M_SNGPNT,E_MINRTY,M_MINRTY,E_LIMENG,M_LIMENG,E_MUNIT,M_MUNIT,E_MOBILE,M_MOBILE,E_CROWD,M_CROWD,E_NOVEH,M_NOVEH,E_GROUPQ,M_GROUPQ,EP_POV,MP_POV,EP_UNEMP,MP_UNEMP,EP_PCI,MP_PCI,EP_NOHSDP,MP_NOHSDP,EP_AGE65,MP_AGE65,EP_AGE17,MP_AGE17,EP_DISABL,MP_DISABL,EP_SNGPNT,MP_SNGPNT,EP_MINRTY,MP_MINRTY,EP_LIMENG,MP_LIMENG,EP_MUNIT,MP_MUNIT,EP_MOBILE,MP_MOBILE,EP_CROWD,MP_CROWD,EP_NOVEH,MP_NOVEH,EP_GROUPQ,MP_GROUPQ,EPL_POV,EPL_UNEMP,EPL_PCI,EPL_NOHSDP,SPL_THEME1,RPL_THEME1,EPL_AGE65,EPL_AGE17,EPL_DISABL,EPL_SNGPNT,SPL_THEME2,RPL_THEME2,EPL_MINRTY,EPL_LIMENG,SPL_THEME3,RPL_THEME3,EPL_MUNIT,EPL_MOBILE,EPL_CROWD,EPL_NOVEH,EPL_GROUPQ,SPL_THEME4,RPL_THEME4,SPL_THEMES,RPL_THEMES,F_POV,F_UNEMP,F_PCI,F_NOHSDP,F_THEME1,F_AGE65,F_AGE17,F_DISABL,F_SNGPNT,F_THEME2,F_MINRTY,F_LIMENG,F_THEME3,F_MUNIT,F_MOBILE,F_CROWD,F_NOVEH,F_GROUPQ,F_THEME4,F_TOTAL,E_UNINSUR,M_UNINSUR,EP_UNINSUR,MP_UNINSUR,E_DAYPOP
0,0,1,ALABAMA,AL,1015,Calhoun,1015981902,"Census Tract 9819.02, Calhoun County, Alabama",34.644448,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,-999.0,-999.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,15.6,0.0,15.6,0.0,44.0,0.0,15.6,0.0,11.0,0.0,15.6,0.0,11.0,0.0,11.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,11.0,-999.0,-999.0,335.0
1,1,1,ALABAMA,AL,1015,Calhoun,1015981903,"Census Tract 9819.03, Calhoun County, Alabama",13.929908,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,-999.0,-999.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,15.6,0.0,15.6,0.0,44.0,0.0,15.6,0.0,11.0,0.0,15.6,0.0,11.0,0.0,11.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,11.0,-999.0,-999.0,0.0
2,2,1,ALABAMA,AL,1097,Mobile,1097990000,"Census Tract 9900, Mobile County, Alabama",0.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,-999.0,-999.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,15.6,0.0,15.6,0.0,44.0,0.0,15.6,0.0,11.0,0.0,15.6,0.0,11.0,0.0,11.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,11.0,-999.0,-999.0,0.0
3,3,1,ALABAMA,AL,1117,Shelby,1117980000,"Census Tract 9800, Shelby County, Alabama",13.634818,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,-999.0,-999.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,11.0,0.0,15.6,0.0,15.6,0.0,44.0,0.0,15.6,0.0,11.0,0.0,15.6,0.0,11.0,0.0,11.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,11.0,-999.0,-999.0,140.0
4,4,2,ALASKA,AK,2198,Prince of Wales-Hyder,2198000300,"Census Tract 3, Prince of Wales-Hyder Census A...",196.854533,0.0,9.0,62.0,24.0,0.0,9.0,0.0,9.0,0.0,9.0,-999.0,-999.0,0.0,9.0,0.0,9.0,0.0,9.0,0.0,9.0,0.0,12.7,0.0,12.7,0.0,36.0,0.0,12.7,0.0,9.0,0.0,12.7,0.0,9.0,0.0,9.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,20.5,0.0,24.2,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,9.0,-999.0,-999.0,12.0


In [11]:
# Most frequent states and counties; the keyword must be `cols_to_include`
# (the function has no `cols` parameter, so `cols=` raises TypeError).
top_value_counts(svi, cols_to_include=['STATE','COUNTY'])

Unnamed: 0,STATE,0,COUNTY,1
0,n_unique,51,n_unique,1851
1,CALIFORNIA,8041,Los Angeles,2344
2,TEXAS,5254,Cook,1325
3,NEW YORK,4906,Orange,938
4,FLORIDA,4212,Jefferson,923
5,PENNSYLVANIA,3217,Maricopa,916


In [12]:
# Summary statistics for the numeric columns, rounded to one decimal.
# NOTE(review): many columns have a minimum of -999.0, which looks like a
# missing-data sentinel; if so it skews the mean/std/min reported here —
# confirm and mask those values before interpreting the statistics.
svi.describe().round(1)

Unnamed: 0,FID,ST,STCNTY,FIPS,AREA_SQMI,E_TOTPOP,M_TOTPOP,E_HU,M_HU,E_HH,M_HH,E_POV,M_POV,E_UNEMP,M_UNEMP,E_PCI,M_PCI,E_NOHSDP,M_NOHSDP,E_AGE65,M_AGE65,E_AGE17,M_AGE17,E_DISABL,M_DISABL,E_SNGPNT,M_SNGPNT,E_MINRTY,M_MINRTY,E_LIMENG,M_LIMENG,E_MUNIT,M_MUNIT,E_MOBILE,M_MOBILE,E_CROWD,M_CROWD,E_NOVEH,M_NOVEH,E_GROUPQ,M_GROUPQ,EP_POV,MP_POV,EP_UNEMP,MP_UNEMP,EP_PCI,MP_PCI,EP_NOHSDP,MP_NOHSDP,EP_AGE65,MP_AGE65,EP_AGE17,MP_AGE17,EP_DISABL,MP_DISABL,EP_SNGPNT,MP_SNGPNT,EP_MINRTY,MP_MINRTY,EP_LIMENG,MP_LIMENG,EP_MUNIT,MP_MUNIT,EP_MOBILE,MP_MOBILE,EP_CROWD,MP_CROWD,EP_NOVEH,MP_NOVEH,EP_GROUPQ,MP_GROUPQ,EPL_POV,EPL_UNEMP,EPL_PCI,EPL_NOHSDP,SPL_THEME1,RPL_THEME1,EPL_AGE65,EPL_AGE17,EPL_DISABL,EPL_SNGPNT,SPL_THEME2,RPL_THEME2,EPL_MINRTY,EPL_LIMENG,SPL_THEME3,RPL_THEME3,EPL_MUNIT,EPL_MOBILE,EPL_CROWD,EPL_NOVEH,EPL_GROUPQ,SPL_THEME4,RPL_THEME4,SPL_THEMES,RPL_THEMES,F_POV,F_UNEMP,F_PCI,F_NOHSDP,F_THEME1,F_AGE65,F_AGE17,F_DISABL,F_SNGPNT,F_THEME2,F_MINRTY,F_LIMENG,F_THEME3,F_MUNIT,F_MOBILE,F_CROWD,F_NOVEH,F_GROUPQ,F_THEME4,F_TOTAL,E_UNINSUR,M_UNINSUR,EP_UNINSUR,MP_UNINSUR,E_DAYPOP
count,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0,72836.0
mean,36417.5,27.7,27830.1,27830400000.0,48.5,4373.6,360.6,1840.5,77.8,1616.2,107.4,644.4,251.8,162.1,84.2,29378.0,4026.9,381.9,126.6,634.0,109.5,1010.7,191.9,539.2,147.3,150.1,74.1,1664.0,471.2,184.0,102.3,243.6,68.0,116.1,43.2,54.0,41.4,145.0,60.2,110.9,42.5,8.4,-1.8,0.7,-3.1,29378.0,4026.9,7.8,-1.4,9.4,-2.9,22.3,-1.5,6.0,-3.5,9.5,-2.9,37.3,4.5,4.2,-2.6,12.1,-3.7,-1.8,-4.8,3.6,-4.9,1.4,-4.1,2.7,-4.6,-7.2,-6.7,-5.9,-5.3,-6.4,-7.9,-5.2,-5.2,-6.7,-5.2,-5.2,-6.7,-5.2,-5.2,-4.7,-5.2,-5.2,-7.6,-5.2,-7.7,-5.3,-5.9,-7.7,-1.6,-8.3,-7.6,-7.1,-6.3,-5.7,-8.0,-5.6,-5.6,-7.1,-5.6,-6.8,-5.6,-5.6,-5.5,-5.6,-7.9,-5.6,-8.1,-5.6,-7.7,-7.3,503.9,188.8,4.5,-2.8,4435.8
std,21026.1,15.8,15813.3,15813330000.0,542.7,2166.3,189.1,872.5,46.2,772.1,51.6,556.1,168.6,116.7,50.6,15568.9,3005.4,355.2,82.5,411.3,59.0,665.5,110.0,302.6,74.8,116.6,42.4,1708.1,224.3,341.4,83.3,465.3,62.0,223.9,46.5,79.0,31.3,230.8,41.9,445.0,76.0,89.7,88.0,85.5,85.1,15568.9,3005.4,77.9,76.5,76.9,75.6,6.9,75.8,85.7,84.7,6.6,91.4,30.2,76.5,6.9,78.0,18.4,89.5,89.2,88.4,5.3,91.3,91.6,90.4,9.6,75.6,87.5,84.7,79.4,76.1,91.4,91.3,75.4,75.4,84.4,75.4,84.5,84.4,75.4,75.4,75.4,75.4,75.4,89.1,75.4,90.0,75.4,90.1,90.0,93.9,93.3,87.4,84.7,79.4,76.1,91.3,75.4,75.4,84.4,75.4,84.4,75.4,75.4,75.4,75.4,89.1,75.4,89.9,75.4,90.0,93.4,454.4,129.4,85.7,84.8,5416.5
min,0.0,1.0,1001.0,1001020000.0,0.0,0.0,0.0,0.0,3.0,0.0,3.0,0.0,3.0,0.0,1.0,-999.0,-999.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,2.8,0.0,2.0,0.0,29.7,0.0,2.8,0.0,2.0,0.0,2.8,0.0,2.0,0.0,2.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,0.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,-999.0,0.0,2.0,-999.0,-999.0,-999.0
25%,18208.8,12.0,12127.0,12127080000.0,0.7,2912.0,234.0,1263.0,45.0,1095.0,71.0,257.0,129.0,81.0,49.0,19809.0,2372.0,147.0,68.0,367.0,69.0,581.0,116.0,326.0,95.0,67.0,43.0,423.0,319.9,9.0,48.0,7.0,19.8,0.0,12.0,8.0,18.4,37.0,29.0,0.0,11.0,6.9,3.5,4.4,2.6,19809.0,2372.0,5.7,2.6,10.2,1.9,18.8,2.8,9.0,2.6,4.9,3.2,11.5,7.5,0.3,1.4,0.5,1.4,0.0,1.4,0.5,1.3,2.5,2.1,0.0,0.3,0.2,0.2,0.2,0.2,1.1,0.2,0.2,0.2,0.2,0.2,1.6,0.2,0.2,0.2,0.5,0.2,0.2,0.0,0.2,0.2,0.0,1.7,0.2,5.5,0.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,203.0,98.0,5.8,2.8,1872.0
50%,36417.5,27.0,27130.0,27130430000.0,1.9,4092.0,331.0,1729.0,67.0,1526.0,99.0,492.0,216.0,136.0,74.0,26179.0,3220.0,279.0,108.0,569.0,99.0,892.0,171.0,487.0,134.0,123.0,66.9,1107.0,438.9,50.0,69.1,72.0,47.5,11.0,18.0,27.0,30.1,84.0,52.0,10.0,15.0,12.8,5.5,6.7,3.6,26179.0,3220.0,10.6,4.0,14.4,2.5,22.5,3.8,12.4,3.3,8.1,4.5,28.3,9.9,1.3,2.0,4.4,3.0,0.7,2.2,1.8,2.2,5.4,3.4,0.2,0.4,0.5,0.5,0.5,0.5,1.9,0.5,0.5,0.5,0.5,0.5,2.0,0.5,0.5,0.5,1.0,0.5,0.5,0.5,0.5,0.5,0.5,2.3,0.5,7.2,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,375.0,159.0,10.1,4.0,3142.0
75%,54626.2,41.0,41039.0,41039000000.0,13.3,5478.0,457.0,2294.0,99.0,2031.0,134.0,864.0,336.0,213.0,108.0,34987.5,4683.0,499.0,166.0,820.0,138.0,1293.0,245.0,694.0,185.0,203.0,97.1,2373.0,582.0,190.0,123.1,278.0,96.8,134.0,61.0,66.0,54.7,171.0,81.0,63.0,43.0,22.1,7.8,10.0,4.9,34987.5,4683.0,18.5,5.6,18.6,3.3,26.3,5.0,16.5,4.2,12.6,6.0,59.4,12.3,4.7,3.3,15.7,5.4,7.6,3.8,4.2,3.6,11.2,5.3,1.5,1.1,0.7,0.7,0.7,0.7,2.8,0.7,0.7,0.7,0.7,0.7,2.4,0.7,0.7,0.7,1.4,0.7,0.7,0.7,0.7,0.7,0.7,2.9,0.7,9.0,0.7,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,661.0,248.0,15.7,5.4,5287.2
max,72835.0,56.0,56045.0,56045950000.0,85569.3,61133.0,2793.0,26043.0,710.0,20474.0,736.0,9075.0,2575.0,1949.0,940.0,227095.0,88591.0,5056.0,1142.0,28764.0,1039.0,21527.0,1502.0,7639.0,1183.0,1671.0,511.7,33302.0,4123.8,5242.0,993.2,12230.0,945.6,3178.0,463.0,1193.0,377.9,6119.0,730.0,17194.0,3022.0,100.0,100.0,100.0,100.0,227095.0,88591.0,100.0,100.0,100.0,100.0,91.4,400.0,100.0,100.0,100.0,1100.0,100.0,400.0,68.9,1600.0,100.0,1555.6,100.0,100.0,100.0,1555.6,100.0,100.0,100.0,366.7,1.0,1.0,1.0,1.0,4.0,1.0,1.0,1.0,1.0,1.0,3.8,1.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,1.0,4.6,1.0,13.8,1.0,1.0,1.0,1.0,1.0,4.0,1.0,1.0,1.0,1.0,4.0,1.0,1.0,2.0,1.0,1.0,1.0,1.0,1.0,4.0,13.0,7907.0,1943.0,100.0,100.0,376673.0
