In [1]:
import pandas as pd
from pathlib import Path
# Show up to 200 columns when a DataFrame is rendered.
pd.options.display.max_columns = 200

# Enable pandas' copy-on-write mode for the whole session.
pd.set_option("mode.copy_on_write", True)

In [2]:
# Load the HRSA "Active Grant" extract into a DataFrame.
# Source file: https://data.hrsa.gov//DataDownload/DD_Files/EHB_ACTIVE_GRANT_FA_AGR.csv
# NOTE(review): the preview below shows 'DUNS Number' inferred as float;
# pass an explicit dtype= if identifier columns are ever needed as IDs.
ehb_active_path = Path("data") / "EHB_ACTIVE_GRANT_FA_AGR.csv"
ehb_active_df = pd.read_csv(filepath_or_buffer=ehb_active_path, encoding="utf-8")

# Preview the first two rows.
ehb_active_df.head(n=2)

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
0,2022,"ESPERANZA HEALTH CENTER, INC.",4417 N 6th St,Philadelphia,PA,19140-2319,H76,H76HA00725,725,2001/09/30,2024/12/31,HAB,HIV/AIDS,Ryan White Part C Outpatient EIS Program (H76),HRSA-25-052 announces the opportunity to apply...,Brendan F. Boyle,Philadelphia County,N,N,"Robert P. Casey, Jr.",John Fetterman,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",825732159.0,KLD1L3GC9NA5,-75.136916,40.019019,
1,2022,STAR COMMUNITY HEALTH INC,"520 E Broad St, Ste 108",Bethlehem,PA,18018-6330,CE1,CE1HS46454,46454,2022/08/01,2025/07/31,HSB,Healthcare Systems,Community Project Funding/Congressionally Dire...,This notice announces the opportunity to apply...,Susan Wild,Northampton County,N,N,"Robert P. Casey, Jr.",John Fetterman,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",116967999.0,DQC6BD3GQ1Z5,-75.366128,40.62206,


In [3]:
# Keep only the rows whose 'Award Year' is 2023.
ehb_active_2023_df = ehb_active_df.loc[ehb_active_df['Award Year'].eq(2023)]

# Preview the first two 2023 rows.
ehb_active_2023_df.head(n=2)

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
1808,2023,ASIAN SERVICES IN ACTION INC,370 E Market St,Akron,OH,44304-1526,H8H,H8HCS44946,44946,2021/09/01,2025/08/31,BPHC,Primary Health Care,FY 2021 Ending the HIV Epidemic - Primary Care...,,Emilia Strong Sykes,Summit County,N,N,Sherrod Brown,J. D. Vance,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",958980674.0,ZNWLBCD4KMS9,-81.505867,41.080739,
1809,2023,MAINE CHILDRENS HOME FOR LITTLE WANDERER,93 Silver St,Waterville,ME,04901-5923,CE1,CE1HS52190,52190,2023/09/30,2026/09/29,HSB,Healthcare Systems,Community Project Funding/Congressionally Dire...,This notice announces the opportunity to apply...,Chellie Pingree,Kennebec County,N,N,Susan M. Collins,"Angus S., Jr. King",2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",,M7S6J7ZJ5MB7,-69.637793,44.545158,


In [4]:
# Count distinct grant program names across the full extract.
# dropna=False keeps a missing name counted as its own value, as unique() does.
ehb_active_df['Grant Program Name'].nunique(dropna=False)

299

In [5]:
# Inspect how program names are formatted within one program area
# (each name ends with its activity code in parentheses).
names = ehb_active_df.loc[
    ehb_active_df['HRSA Program Area Name'].eq('Maternal and Child Health')
]
names['Grant Program Name'].unique()

array(['Catalysts for Infant Health Equity (U1V)',
       'Leadership Education  in Adolescent Health (LEAH) (T71)',
       'Healthy Start Initiative-Eliminating Racial/Ethnic Disparities (H49)',
       'Maternal and Child Health Public Health Catalyst Program (T1C)',
       'American Rescue Plan Act – Pediatric Mental Health Care Access New Area Expansion (U4A)',
       'Leadership Education in Neurodevelopmental and Related Disorders Training Program (T73)',
       'Sickle Cell Disease Newborn Screening Follow-up Program (D1J)',
       'MCH Leadership, Education, and Advancement in Undergraduate Pathways Program (T16)',
       'Healthy Tomorrows Partnership for Children Program (H17)',
       'Family Professional Partnership/CSHCN (H84)',
       'Universal Newborn Hearing Screening and Intervention (H61)',
       'MCHB State Systems Development Initiative (H18)',
       'Pediatric Mental Health Care Access Program (U4C)',
       'Early Childhood Comprehensive Systems: Health Integrat

In [6]:
# Build a condensed frame holding only the activity code, the program name
# and the program area.
code_for_program_df = names.loc[
    :, ['Grant Activity Code', 'Grant Program Name', 'HRSA Program Area Name']
]

code_for_program_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
15,U1V,Catalysts for Infant Health Equity (U1V),Maternal and Child Health
21,T71,Leadership Education in Adolescent Health (LE...,Maternal and Child Health
32,H49,Healthy Start Initiative-Eliminating Racial/Et...,Maternal and Child Health
33,T1C,Maternal and Child Health Public Health Cataly...,Maternal and Child Health
34,U4A,American Rescue Plan Act – Pediatric Mental He...,Maternal and Child Health
...,...,...,...
22663,H84,Family Professional Partnership/CSHCN (H84),Maternal and Child Health
22679,H61,Universal Newborn Hearing Screening and Interv...,Maternal and Child Health
22684,H84,Family Professional Partnership/CSHCN (H84),Maternal and Child Health
22689,H61,Universal Newborn Hearing Screening and Interv...,Maternal and Child Health


In [7]:
# Keep one row per 'Grant Activity Code': the first occurrence wins and
# every later repeat of the same code is discarded.
code_for_program_df = code_for_program_df.loc[
    ~code_for_program_df.duplicated(subset='Grant Activity Code', keep='first')
]

code_for_program_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
15,U1V,Catalysts for Infant Health Equity (U1V),Maternal and Child Health
21,T71,Leadership Education in Adolescent Health (LE...,Maternal and Child Health
32,H49,Healthy Start Initiative-Eliminating Racial/Et...,Maternal and Child Health
33,T1C,Maternal and Child Health Public Health Cataly...,Maternal and Child Health
34,U4A,American Rescue Plan Act – Pediatric Mental He...,Maternal and Child Health
...,...,...,...
11051,U1X,Supporting Maternal and Child Health Innovatio...,Maternal and Child Health
13364,U2L,HRSA-24-041: National Coordinating Center on T...,Maternal and Child Health
13366,US8,Center for Maternal and Child Health Medicaid ...,Maternal and Child Health
13406,UF5,Supporting Healthy Start Performance Project (...,Maternal and Child Health


In [8]:
# Drop rows that have a missing value in any of the three columns.
# dropna() returns a new DataFrame rather than modifying in place, so the
# result must be assigned back; otherwise nulls remain in the frame.
# Re-running this cell is safe: dropping nulls twice changes nothing.
code_for_program_df = code_for_program_df.dropna()

# Remove the column-width limit so the end of 'Grant Program Name' is visible.
pd.set_option('display.max_colwidth', None)

code_for_program_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
15,U1V,Catalysts for Infant Health Equity (U1V),Maternal and Child Health
21,T71,Leadership Education in Adolescent Health (LEAH) (T71),Maternal and Child Health
32,H49,Healthy Start Initiative-Eliminating Racial/Ethnic Disparities (H49),Maternal and Child Health
33,T1C,Maternal and Child Health Public Health Catalyst Program (T1C),Maternal and Child Health
34,U4A,American Rescue Plan Act – Pediatric Mental Health Care Access New Area Expansion (U4A),Maternal and Child Health
...,...,...,...
11051,U1X,Supporting Maternal and Child Health Innovation in States (U1X),Maternal and Child Health
13364,U2L,HRSA-24-041: National Coordinating Center on Transition (NCCT) (U2L),Maternal and Child Health
13366,US8,Center for Maternal and Child Health Medicaid Partnerships (US8),Maternal and Child Health
13406,UF5,Supporting Healthy Start Performance Project (UF5),Maternal and Child Health


In [9]:
# Strip the trailing "(<Grant Activity Code>)" from 'Grant Program Name'.
#
# The suffix is matched against each row's own activity code instead of
# blindly cutting a fixed number of characters, which means:
#   * the cell can be re-run safely (a name without the suffix is left as is),
#   * names that never carried the suffix are not truncated,
#   * the space that preceded the parenthesis is removed as well.

def _strip_activity_code(program_name, activity_code):
    """Return ``program_name`` without a trailing ``(<activity_code>)``.

    Parameters
    ----------
    program_name : object
        Program name as stored in the frame; non-string values (e.g. NaN)
        are returned unchanged.
    activity_code : object
        Activity code expected inside the trailing parentheses; if it is
        not a string the name is returned unchanged.

    Returns
    -------
    object
        The name with the suffix and the whitespace before it removed, or
        the original value when the suffix is not present.
    """
    if not isinstance(program_name, str) or not isinstance(activity_code, str):
        return program_name
    suffix = f"({activity_code})"
    trimmed = program_name.rstrip()
    if trimmed.endswith(suffix):
        return trimmed[:-len(suffix)].rstrip()
    return program_name


code_for_program_df['Grant Program Name'] = [
    _strip_activity_code(program_name, activity_code)
    for program_name, activity_code in zip(
        code_for_program_df['Grant Program Name'],
        code_for_program_df['Grant Activity Code'],
    )
]

code_for_program_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
15,U1V,Catalysts for Infant Health Equity,Maternal and Child Health
21,T71,Leadership Education in Adolescent Health (LEAH),Maternal and Child Health
32,H49,Healthy Start Initiative-Eliminating Racial/Ethnic Disparities,Maternal and Child Health
33,T1C,Maternal and Child Health Public Health Catalyst Program,Maternal and Child Health
34,U4A,American Rescue Plan Act – Pediatric Mental Health Care Access New Area Expansion,Maternal and Child Health
...,...,...,...
11051,U1X,Supporting Maternal and Child Health Innovation in States,Maternal and Child Health
13364,U2L,HRSA-24-041: National Coordinating Center on Transition (NCCT),Maternal and Child Health
13366,US8,Center for Maternal and Child Health Medicaid Partnerships,Maternal and Child Health
13406,UF5,Supporting Healthy Start Performance Project,Maternal and Child Health


In [10]:
# Count distinct program names left in the condensed lookup table.
# dropna=False keeps a missing name counted as its own value, as unique() does.
code_for_program_df['Grant Program Name'].nunique(dropna=False)

101

In [11]:
# Write the code-to-program lookup table to CSV; the row index is left out of the file.
code_for_program_df.to_csv(
    path_or_buf='data/grant_program_codes.csv',
    index=False,
)