In [37]:
# Import packages
import pandas as pd
import numpy as np
import os

# Load the three SVI releases (2014, 2016, 2018) from CSV files in the working directory
svi2014, svi2016, svi2018 = [
    pd.read_csv(csv_name)
    for csv_name in ('original_dataset.csv', 'SVI2016_US.csv', 'SVI2018_US.csv')
]

In [38]:
def count_out_of_range(value_list):
    """Print the percentage of values that lie outside the closed interval [-1, 1].

    Parameters
    ----------
    value_list : iterable of numbers
        Values to inspect (a list, a pandas Series, a generator, ...).
        It is consumed in a single pass.

    Returns
    -------
    None
        The result is printed, not returned.

    Notes
    -----
    A value counts as out of range only when ``value < -1 or value > 1`` is
    true, so NaN (for which both comparisons are false) counts as in range.
    An empty input prints an explicit "n/a" message instead of dividing by zero.
    """
    total = 0
    oor = 0
    for value in value_list:
        total += 1
        if value < -1 or value > 1:
            oor += 1
    if total == 0:
        # Nothing to measure: avoid ZeroDivisionError and say so explicitly.
        print('Percent out of range: n/a (no values)')
        return
    print('Percent out of range: {}%'.format((oor*100)/total))
# Remove the columns that are not shared by all three releases, so the
# frames line up before merging. Column counts as loaded, with the extras:
#   2014 - 127 columns: AFFGEOID, TRACTCE, FID
#   2016 - 125 columns: FID
#   2018 - 124 columns: no extras
svi2014 = svi2014.drop(columns=['AFFGEOID', 'TRACTCE', 'FID'])
svi2016 = svi2016.drop(columns='FID')

In [39]:
# Join the three releases on FIPS (pandas' default inner join).
# Overlapping 2014/2016 columns receive the _2014 / _2016 suffixes; the 2018
# columns no longer collide with anything, so they keep their plain names.
svimain = (
    svi2014
    .merge(svi2016, on='FIPS', suffixes=('_2014', '_2016'))
    .merge(svi2018, on='FIPS')
)

In [40]:
# Rows that survived the inner merges on FIPS
svimain.shape[0]

72831

In [41]:
# Treat -999 as "undefined": turn it into NaN first ...
svimain = svimain.replace(-999, np.nan)
# ... then discard every row that has a NaN in any column
svimain = svimain.dropna(axis=0, how='any')

In [42]:
# Rows remaining once rows with undefined values are removed
svimain.shape[0]

71520

In [2]:
# Sorted list of every column name in the merged frame
maincols = sorted(svimain.columns.values.tolist())

In [44]:
# Create difference columns between releases for every tracked SVI variable.
#
# In svimain each variable exists three times: <VAR>_2014, <VAR>_2016 and the
# unsuffixed <VAR>, which is used as the 2018 value. For each variable three
# columns are added, in this order:
#   <VAR>_2016_2014_DIF = <VAR>_2016 - <VAR>_2014
#   <VAR>_2018_2016_DIF = <VAR>      - <VAR>_2016
#   <VAR>_2018_2014_DIF = <VAR>      - <VAR>_2014
#
# Measure stems, in the order their difference columns are appended.
# THEME* stems are the theme summaries; the others are individual measures.
diff_stems = [
    'POV',     # poverty
    'UNEMP',   # unemployment
    'PCI',     # per capita income
    'NOHSDP',  # no HS diploma
    'THEME1',  # overall socioeconomic theme
    'AGE65',   # ages 65 and older
    'AGE17',   # ages 17 and younger
    'DISABL',  # disability
    'SNGPNT',  # single parent households
    'THEME2',  # overall household composition and disability theme
    'MINRTY',  # minority
    'LIMENG',  # English "less than well"
    'THEME3',  # overall minority status and language theme
    'MUNIT',   # 10+ units
    'MOBILE',  # mobile home
    'CROWD',   # more people than rooms
    'NOVEH',   # household with no vehicle available
    'GROUPQ',  # institutionalized group quarters
    'THEME4',  # overall housing and transportation theme
    'THEMES',  # overall tract summary ranking
]

# Two passes over the stems: first the EP_* measures with the SPL_* themes,
# then the E_* measures with the RPL_* themes.
diff_variables = [
    (theme_prefix if stem.startswith('THEME') else measure_prefix) + stem
    for measure_prefix, theme_prefix in (('EP_', 'SPL_'), ('E_', 'RPL_'))
    for stem in diff_stems
]

# Fail before adding anything if an input column is absent, so svimain is
# never left with only part of the difference columns.
missing_columns = [
    column
    for variable in diff_variables
    for column in (variable + '_2014', variable + '_2016', variable)
    if column not in svimain.columns
]
if missing_columns:
    raise KeyError('svimain is missing columns needed for the difference columns: {}'.format(missing_columns))

for variable in diff_variables:
    svimain[variable + '_2016_2014_DIF'] = svimain[variable + '_2016'] - svimain[variable + '_2014']
    svimain[variable + '_2018_2016_DIF'] = svimain[variable] - svimain[variable + '_2016']
    svimain[variable + '_2018_2014_DIF'] = svimain[variable] - svimain[variable + '_2014']

In [45]:
# Share of rows whose overall-summary difference falls outside [-1, 1], per period
for diff_column in ('SPL_THEMES_2016_2014_DIF',
                    'SPL_THEMES_2018_2016_DIF',
                    'SPL_THEMES_2018_2014_DIF'):
    count_out_of_range(svimain[diff_column])

Percent out of range: 9.7581096196868%
Percent out of range: 9.198825503355705%
Percent out of range: 22.17281879194631%


In [46]:
# # Subset dataset
# svimain = svimain[['ST', 'STATE', 'ST_ABBR', 'STCNTY', 'COUNTY', 'FIPS', 'LOCATION', 'AREA_SQMI', 'EP_POV_2016_2014_DIF',
#                   'EP_POV_2018_2016_DIF', 'EP_POV_2018_2014_DIF','EP_UNEMP_2016_2014_DIF',
#                   'EP_UNEMP_2018_2016_DIF', 'EP_UNEMP_2018_2014_DIF','EP_PCI_2016_2014_DIF', 'EP_PCI_2018_2016_DIF',
#                   'EP_PCI_2018_2014_DIF', 'EP_NOHSDP_2016_2014_DIF', 'EP_NOHSDP_2018_2016_DIF', 'EP_NOHSDP_2018_2014_DIF',
#                   'SPL_THEME1_2016_2014_DIF', 'SPL_THEME1_2018_2016_DIF', 'SPL_THEME1_2018_2014_DIF',
#                   'EP_AGE65_2016_2014_DIF', 'EP_AGE65_2018_2016_DIF', 'EP_AGE65_2018_2014_DIF', 'EP_AGE17_2016_2014_DIF',
#                   'EP_AGE17_2018_2016_DIF', 'EP_AGE17_2018_2014_DIF', 'EP_DISABL_2016_2014_DIF', 'EP_DISABL_2018_2016_DIF',
#                   'EP_DISABL_2018_2014_DIF', 'EP_SNGPNT_2016_2014_DIF', 'EP_SNGPNT_2018_2016_DIF', 'EP_SNGPNT_2018_2014_DIF',
#                   'SPL_THEME2_2016_2014_DIF', 'SPL_THEME2_2018_2016_DIF', 'SPL_THEME2_2018_2014_DIF',
#                   'EP_MINRTY_2016_2014_DIF', 'EP_MINRTY_2018_2016_DIF', 'EP_MINRTY_2018_2014_DIF', 'EP_LIMENG_2016_2014_DIF',
#                   'EP_LIMENG_2018_2016_DIF', 'EP_LIMENG_2018_2014_DIF', 'SPL_THEME3_2016_2014_DIF', 'SPL_THEME3_2018_2016_DIF',
#                   'SPL_THEME3_2018_2014_DIF', 'EP_MUNIT_2016_2014_DIF', 'EP_MUNIT_2018_2016_DIF', 'EP_MUNIT_2018_2014_DIF',
#                   'EP_MOBILE_2016_2014_DIF', 'EP_MOBILE_2018_2016_DIF', 'EP_MOBILE_2018_2014_DIF', 'EP_CROWD_2016_2014_DIF',
#                   'EP_CROWD_2018_2016_DIF', 'EP_CROWD_2018_2014_DIF', 'EP_NOVEH_2016_2014_DIF', 'EP_NOVEH_2018_2016_DIF',
#                   'EP_NOVEH_2018_2014_DIF', 'EP_GROUPQ_2016_2014_DIF', 'EP_GROUPQ_2018_2016_DIF', 'EP_GROUPQ_2018_2014_DIF',
#                   'SPL_THEME4_2016_2014_DIF', 'SPL_THEME4_2018_2016_DIF', 'SPL_THEME4_2018_2014_DIF',
#                   'SPL_THEMES_2016_2014_DIF', 'SPL_THEMES_2018_2016_DIF', 'SPL_THEMES_2018_2014_DIF']]

# Export dataset
# NOTE(review): the subset above is commented out, so every column is written,
# and to_csv's default also writes the row index as the first column.
export_filename = 'svi_main_ep_spl.csv'
svimain.to_csv(export_filename)