In [4]:
# import python packages
import numpy as np
import pandas as pd
import os

In [5]:
directory = '.'
# os.walk yields a (dirpath, dirnames, filenames) triple for every folder it
# visits under `directory`; only the folder path itself is kept.
list_of_dirs = [dirpath for dirpath, _dirnames, _filenames in os.walk(directory)]

In [6]:
# Show every folder path collected by the walk (hidden folders such as .git are included).
list_of_dirs

['.',
 './.ipynb_checkpoints',
 './.git',
 './.git/logs',
 './.git/logs/refs',
 './.git/logs/refs/remotes',
 './.git/logs/refs/remotes/origin',
 './.git/logs/refs/heads',
 './.git/branches',
 './.git/hooks',
 './.git/info',
 './.git/objects',
 './.git/objects/76',
 './.git/objects/e5',
 './.git/objects/83',
 './.git/objects/pack',
 './.git/objects/2f',
 './.git/objects/15',
 './.git/objects/1a',
 './.git/objects/b2',
 './.git/objects/91',
 './.git/objects/b4',
 './.git/objects/9c',
 './.git/objects/a6',
 './.git/objects/b0',
 './.git/objects/4d',
 './.git/objects/11',
 './.git/objects/30',
 './.git/objects/53',
 './.git/objects/7c',
 './.git/objects/a7',
 './.git/objects/28',
 './.git/objects/1c',
 './.git/objects/21',
 './.git/objects/c4',
 './.git/objects/f8',
 './.git/objects/14',
 './.git/objects/2d',
 './.git/objects/2a',
 './.git/objects/info',
 './.git/objects/e7',
 './.git/objects/b5',
 './.git/objects/55',
 './.git/objects/06',
 './.git/objects/10',
 './.git/objects/52',
 './.

## Class to parse the PolicyMap datasets and look up estimates by state

In [83]:
class PM_Parser():
    """Load the four 2017 PolicyMap CSV files and expose their estimates per state.

    After construction, ``self.cumulative_data`` is a DataFrame with the columns
    ``state``, ``est_asthma_perc``, ``est_COPD_perc``, ``est_diabetes_perc`` and
    ``est_heartDisease_perc``.
    """

    # (file name, column to read from the CSV, column name used in cumulative_data)
    _DATASETS = (
        ('PolicyMapData_Asthma_2017.csv',
         'Estimated percent of adults reporting to have asthma in 2017.',
         'est_asthma_perc'),
        ('PolicyMapData_COPD_2017.csv',
         'Estimated percent of adults ever diagnosed with chronic obstruct',
         'est_COPD_perc'),
        ('PolicyMapData_Diabetes_2017.csv',
         'Estimated percent of adults ever diagnosed with diabetes in 2017',
         'est_diabetes_perc'),
        ('PolicyMapData_HeartDisease_2017.csv',
         'Estimated percent of adults ever diagnosed with heart disease in',
         'est_heartDisease_perc'),
    )

    # Number of leading rows kept from the combined table.
    # NOTE(review): presumably 50 states plus DC -- confirm against the CSVs.
    _N_ROWS = 51

    def __init__(self, path):
        """Read the four CSV files found in ``path`` and combine them.

        Parameters
        ----------
        path : str or os.PathLike
            Folder containing the ``PolicyMapData_*_2017.csv`` files. A trailing
            path separator is optional.

        Raises
        ------
        FileNotFoundError
            Propagated from ``pd.read_csv`` if a file is missing.
        KeyError
            If a file lacks the ``State`` column or its estimate column.
        """
        print('Initializing PM_Parser object, reading datasets from: %s'%path)
        # read CSV files for all four data sets
        frames = [self._read_dataset(path, filename, source_column, output_column)
                  for filename, source_column, output_column in self._DATASETS]

        # aggregate data state-wise into single dataframe
        # NOTE(review): the columns are combined by row position (the default
        # index from read_csv), not by state name; this assumes all four files
        # list the states in the same order -- confirm.
        columns = [frames[0]['state']]
        columns.extend(frame[output_column]
                       for frame, (_, _, output_column) in zip(frames, self._DATASETS))
        self.cumulative_data = pd.concat(columns, axis=1).iloc[0:self._N_ROWS]

    @staticmethod
    def _read_dataset(path, filename, source_column, output_column):
        """Read one CSV and return its state and estimate columns, renamed."""
        # os.path.join works whether or not `path` ends with a separator.
        raw = pd.read_csv(os.path.join(path, filename))
        return raw[['State', source_column]].rename(
            columns={'State': 'state', source_column: output_column})

    def index_by_state(self, state):
        """Return the rows of ``cumulative_data`` whose ``state`` equals ``state``.

        The original index labels are kept. An empty DataFrame is returned when
        no row matches.
        """
        data = self.cumulative_data
        # A boolean mask selects the rows directly, so column dtypes are kept
        # (masking with NaN and then dropping rows would upcast integer columns).
        return data[data['state'] == state]

        

## Print data for New York

In [84]:
# Build a parser over the CSV files in ./data/ and display the New York row.
path, state = './data/', 'New York'
pm_parser = PM_Parser(path)
pm_parser.index_by_state(state)

Initializing PM_Parser object, reading datasets from: ./data/


Unnamed: 0,state,est_asthma_perc,est_COPD_perc,est_diabetes_perc,est_heartDisease_perc
32,New York,9.2,5.3,10.5,3.9


## Print data for California

In [88]:
# Build a parser over the CSV files in ./data/ and display the California row.
path, state = './data/', 'California'
pm_parser = PM_Parser(path)
pm_parser.index_by_state(state)

Initializing PM_Parser object, reading datasets from: ./data/


Unnamed: 0,state,est_asthma_perc,est_COPD_perc,est_diabetes_perc,est_heartDisease_perc
4,California,7.9,4.5,10.5,2.8


## Print data for Illinois

In [89]:
# Build a parser over the CSV files in ./data/ and display the Illinois row.
path, state = './data/', 'Illinois'
pm_parser = PM_Parser(path)
pm_parser.index_by_state(state)

Initializing PM_Parser object, reading datasets from: ./data/


Unnamed: 0,state,est_asthma_perc,est_COPD_perc,est_diabetes_perc,est_heartDisease_perc
13,Illinois,8.2,6.7,11.0,4.0
