In [11]:
import pandas as pd
from pathlib import Path
# Let wide frames render up to 200 columns instead of being elided.
pd.options.display.max_columns = 200

# Enable pandas copy-on-write mode for the rest of the session.
pd.set_option("mode.copy_on_write", True)

In [12]:
# Load the Active Grant CSV into a pandas DataFrame.
# Source file: https://data.hrsa.gov//DataDownload/DD_Files/EHB_ACTIVE_GRANT_FA_AGR.csv
ehb_active_path = Path("data/EHB_ACTIVE_GRANT_FA_AGR.csv")
ehb_active_df = pd.read_csv(filepath_or_buffer=ehb_active_path, encoding="utf-8")

# Show the loaded frame as the cell output.
ehb_active_df

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
0,2022,"ESPERANZA HEALTH CENTER, INC.",4417 N 6th St,Philadelphia,PA,19140-2319,H76,H76HA00725,725,2001/09/30,2024/12/31,HAB,HIV/AIDS,Ryan White Part C Outpatient EIS Program (H76),HRSA-25-052 announces the opportunity to apply...,Brendan F. Boyle,Philadelphia County,N,N,"Robert P. Casey, Jr.",John Fetterman,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",825732159.0,KLD1L3GC9NA5,-75.136916,40.019019,
1,2022,STAR COMMUNITY HEALTH INC,"520 E Broad St, Ste 108",Bethlehem,PA,18018-6330,CE1,CE1HS46454,46454,2022/08/01,2025/07/31,HSB,Healthcare Systems,Community Project Funding/Congressionally Dire...,This notice announces the opportunity to apply...,Susan Wild,Northampton County,N,N,"Robert P. Casey, Jr.",John Fetterman,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",116967999.0,DQC6BD3GQ1Z5,-75.366128,40.622060,
2,2022,LEWIS UNIVERSITY,1 University Pkwy,Romeoville,IL,60446-2200,D19,D19HP42035,42035,2021/07/01,2025/06/30,BHW,Health Workforce,Nursing Workforce Diversity (D19),,Lauren Underwood,Will County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",69964104.0,EHUHEAQXWAU5,-88.079771,41.601904,
3,2022,"OUTER CAPE HEALTH SERVICES, INC.",710 Route 28,Harwich Port,MA,02646,H80,H80CS00468,468,2002/02/01,2025/01/31,BPHC,Primary Health Care,Health Center Program (H80),To assist health centers in a Hurricane Helene...,William R. Keating,Barnstable County,N,N,Elizabeth Warren,Edward J. Markey,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",76575729.0,UEKHT333SBU7,-70.060154,41.670379,
4,2022,RHODE ISLAND COLLEGE,600 Mount Pleasant Ave,Providence,RI,02908-1940,M01,M01HP42514,42514,2021/09/01,2025/08/31,BHW,Health Workforce,Behavioral Health Workforce Education and Trai...,The purpose of the Behavioral Health Workforce...,Seth Magaziner,Providence County,N,N,Jack Reed,Sheldon Whitehouse,2024/11/05,No Link,,U.S. Government Entity,75707588.0,VM5MA47AM9F8,-71.466068,41.839428,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
22722,2022,WESTCHESTER ELLENVILLE INC,10 Healthy Way,Ellenville,NY,12428,G20,G20RH46028,46028,2022/08/01,2026/07/31,FORHP,Rural Health,Small Health Care Provider Quality Improvement...,,Patrick Ryan,Ulster County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",60545852.0,JSK2MWMTLXQ9,-74.379576,41.733184,
22723,2022,PHILADELPHIA FIGHT,1233 Locust St FL 5,Philadelphia,PA,19107-5461,H12,H12HA46117,46117,2022/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Brendan F. Boyle,Philadelphia County,N,N,"Robert P. Casey, Jr.",John Fetterman,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",785736596.0,REMRC15CK3H8,-75.161735,39.947929,
22724,2022,BOARD OF REGENTS TENNESSEE,1 Bridgestone Park,Nashville,TN,37214-2453,T29,T29HP46721,46721,2022/09/15,2025/09/14,BHW,Health Workforce,Community Health Worker Training Program (T29),This notice announces the opportunity to apply...,John W. Rose,Davidson County,N,N,Marsha Blackburn,Bill Hagerty,2024/11/05,No Link,,U.S. Government Entity,,JBG7T7RXQ2B7,-86.690607,36.166610,
22725,2022,THE UNIVERSITY OF SOUTH DAKOTA,414 E Clark St,Vermillion,SD,57069-2307,U77,U77HP26850,26850,2014/05/01,2027/08/31,BHW,Health Workforce,Area Health Education Centers (AHEC) Program (...,,Dusty Johnson,Clay County,N,N,John Thune,Mike Rounds,2024/11/05,No Link,,U.S. Government Entity,929930808.0,U9EDNSCHTBE7,-96.926563,42.782528,


In [13]:
# Tally how many grant rows fall under each 'HRSA Program Area Name' category
ehb_active_df.loc[:, 'HRSA Program Area Name'].value_counts()

HRSA Program Area Name
Primary Health Care            7159
Health Workforce               6385
Maternal and Child Health      2885
HIV/AIDS                       2676
Rural Health                   1921
Healthcare Systems             1434
Office of the Administrator     267
Name: count, dtype: int64

In [16]:
# Keep only the rows whose 'Award Year' is 2023
ehb_active_2023_df = ehb_active_df.loc[ehb_active_df['Award Year'].eq(2023)]

# Boolean mask: True where the program area is 'Maternal and Child Health'
key = ehb_active_2023_df["HRSA Program Area Name"].eq('Maternal and Child Health')
maternal_df = ehb_active_2023_df.loc[key]      # rows inside that program area
nonmaternal_df = ehb_active_2023_df.loc[~key]  # every other program area

In [17]:
# Search the rows outside 'Maternal and Child Health' for grant programs whose
# name contains a maternal/infant-related keyword (case-insensitive regex match).
# na=False counts a missing 'Grant Program Name' as "no match"; without it a NaN
# in that column ends up in the mask and the boolean indexing raises a ValueError.
missedstuff_df = nonmaternal_df[
    nonmaternal_df['Grant Program Name'].str.contains(
        'Infant|Maternal|Fetus|Unborn|Pregnan|Breast',
        regex=True,
        case=False,
        na=False,
    )
]

missedstuff_df

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
1823,2023,HOWARD BROWN HEALTH CENTER,4025 N Sheridan Rd,Chicago,IL,60613-2010,H12,H12HA24805,24805,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Janice D. Schakowsky,Cook County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",10911980.0,K4K7GLAR8QN1,-87.654510,41.955207,
1861,2023,"SUNSET PARK HEALTH COUNCIL, INC.",150 55th St,Brooklyn,NY,11220-2559,Q8M,Q8MCS49133,49133,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Daniel S. Goldman,Kings County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",785145843.0,DC4UE8MU2ZE8,-74.020541,40.646690,
1938,2023,MAINLINE HEALTH SYSTEMS INC,233 N Main St,Portland,AR,71663-9230,Q8M,Q8MCS49307,49307,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Bruce Westerman,Ashley County,N,N,John Boozman,Tom Cotton,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",119842946.0,JEKKQBGWTZS5,-91.511351,33.238906,
2017,2023,University of Florida,1523 Union Rd RM 207,Gainesville,FL,32611-1941,H12,H12HA24824,24824,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Kat Cammack,Alachua County,N,N,Marco Rubio,Rick Scott,2024/11/05,No Link,,U.S. Government Entity,969663814.0,NNFQH1JAPEP3,-82.342089,29.649732,
2018,2023,COUNTY OF INGHAM,5303 S Cedar St,Lansing,MI,48911-3800,H12,H12HA24806,24806,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Elissa Slotkin,Ingham County,N,N,Debbie Stabenow,Gary C. Peters,2024/11/05,No Link,,U.S. Government Entity,31875656.0,MNXZAXJQTMN6,-84.548038,42.681075,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
10091,2023,THE HEKTOEN INSTITUTE FOR MEDICAL RESEARCH,1339 S Wood St,Chicago,IL,60608-1204,H12,H12HA24803,24803,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Danny K. Davis,Cook County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",68625136.0,NRJ8QC6LM4T1,-87.671177,41.862765,
10100,2023,YOUR HEALTH CLINIC,1521 Baker Rd,Sherman,TX,75090-2409,H12,H12HA24844,24844,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Pat Fallon,Grayson County,N,N,John Cornyn,Ted Cruz,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",879477875.0,T6E1PLTJ3Q25,-96.596205,33.664001,
10116,2023,MARY HITCHCOCK MEMORIAL HOSPITAL,1 Medical Center Dr,Lebanon,NH,03756-1000,H12,H12HA31112,31112,2017/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Ann M. Kuster,Grafton County,N,N,Jeanne Shaheen,Margaret Wood Hassan,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",69910297.0,QYLXERHDAQL4,-72.273635,43.678113,
10184,2023,RESEARCH FOUNDATION FOR THE STATE UNIVERSITY O...,520 Lee Entrance STE 211,Amherst,NY,14228-2577,T34,T34HP42144,42144,2021/07/01,2026/06/30,BHW,Health Workforce,Primary Care Training and Enhancement-Communit...,,Timothy M Kennedy,Erie County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",38633251.0,LMCJKRFW5R81,-78.785538,43.002054,


In [18]:
# Keep just the first row seen for each distinct 'Grant Program Name', leaving one
# representative row (and its 'Grant Activity Code') per program found outside
# 'Maternal and Child Health'
missedstuff_df = missedstuff_df.loc[
    ~missedstuff_df.duplicated(subset='Grant Program Name', keep='first')
]

missedstuff_df

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
1823,2023,HOWARD BROWN HEALTH CENTER,4025 N Sheridan Rd,Chicago,IL,60613-2010,H12,H12HA24805,24805,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Janice D. Schakowsky,Cook County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",10911980.0,K4K7GLAR8QN1,-87.65451,41.955207,
1861,2023,"SUNSET PARK HEALTH COUNCIL, INC.",150 55th St,Brooklyn,NY,11220-2559,Q8M,Q8MCS49133,49133,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Daniel S. Goldman,Kings County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/05,No Link,,"Corporate Entity, Federal Tax Exempt",785145843.0,DC4UE8MU2ZE8,-74.020541,40.64669,
2046,2023,UNIVERSITY OF UTAH,201 Presidents Cir,Salt Lake City,UT,84112-9049,T34,T34HP42133,42133,2021/07/01,2026/06/30,BHW,Health Workforce,Primary Care Training and Enhancement-Communit...,,Blake D. Moore,Salt Lake County,N,N,Mike Lee,Mitt Romney,2024/11/05,No Link,,U.S. Government Entity,9095365.0,LL8GLEVH6MG3,-111.849426,40.765004,


In [19]:
# Narrow the frame to the three columns of interest
missedstuff_df = missedstuff_df.loc[
    :, ['Grant Activity Code', 'Grant Program Name', 'HRSA Program Area Name']
]

# Lift the column-width limit so the full 'Grant Program Name' text is shown
pd.options.display.max_colwidth = None

missedstuff_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
1823,H12,"Ryan White Title IV Women, Infants, Children, Youth and Affected Family Members AIDS Healthcare (H12)",HIV/AIDS
1861,Q8M,Quality Improvement Fund – Maternal Health (Q8M),Primary Health Care
2046,T34,Primary Care Training and Enhancement-Community Prevention and Maternal Health (T34),Health Workforce


In [20]:
# Remove the trailing "(XXX)" activity code from 'Grant Program Name'.
#
# The pattern is anchored to the end of the string and strips a three-character
# upper-case/digit code in parentheses together with the whitespace before it.
# Compared with slicing a fixed five characters off the end, this:
#   * leaves no trailing space behind (the separator before "(XXX)" is removed too),
#   * leaves names that do not end in such a code unchanged, so re-running the cell
#     does not keep eating characters from already-cleaned names.
missedstuff_df['Grant Program Name'] = missedstuff_df['Grant Program Name'].str.replace(
    r'\s*\([A-Z0-9]{3}\)\s*$', '', regex=True
)

missedstuff_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
1823,H12,"Ryan White Title IV Women, Infants, Children, Youth and Affected Family Members AIDS Healthcare",HIV/AIDS
1861,Q8M,Quality Improvement Fund – Maternal Health,Primary Health Care
2046,T34,Primary Care Training and Enhancement-Community Prevention and Maternal Health,Health Workforce


In [21]:
# Write Julia's df ('missedstuff_df') out as a .csv file, omitting the index column
missedstuff_df.to_csv(path_or_buf='data/missed_grant_program_codes.csv', index=False)