In [1]:
import pandas as pd
from pathlib import Path
pd.set_option("display.max_columns", 200)

pd.options.mode.copy_on_write = True

In [2]:
# Read in the Active Grant csv and store into Pandas DataFrame
# https://data.hrsa.gov//DataDownload/DD_Files/EHB_ACTIVE_GRANT_FA_AGR.csv (source file)
ehb_active_path = Path("data/EHB_ACTIVE_GRANT_FA_AGR.csv")
ehb_active_df = pd.read_csv(ehb_active_path, encoding = "utf-8")

ehb_active_df

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
0,2022,KITTITAS COUNTY HEALTH NETWORK,107 E Mountain View Ave,Ellensburg,WA,98926-3666,G28,G28RH46280,46280,2022/09/01,2026/08/31,FORHP,Rural Health,Rural Communities Opioid Response Program – Me...,,Kim Schrier,Kittitas County,N,N,Patty Murray,Maria Cantwell,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",116973065.0,NMV5T3LJ9L15,-120.545778,46.984584,
1,2022,UNIVERSITY OF HAWAII,2425 Campus Rd RM 1,Honolulu,HI,96822-2247,U1U,U1UTH42529,42529,2021/09/01,2025/08/31,OA,Office of the Administrator,Regional Telehealth Resource Centers (U1U),This notice announces the opportunity to apply...,Ed Case,Honolulu County,N,N,Brian Schatz,Mazie K. Hirono,2024/11/04,No Link,,U.S. Government Entity,965088057.0,NSCKLFSSABF2,-157.820846,21.299072,
2,2022,WEST VIRGINIA UNIVERSITY RESEARCH CORPORATION,886 Chestnut Ridge Rd,Morgantown,WV,26505-2742,T34,T34HP42152,42152,2021/07/01,2026/06/30,BHW,Health Workforce,Primary Care Training and Enhancement-Communit...,,Alexander X. Mooney,Monongalia County,N,N,"Joe Manchin, III",Shelley Moore Capito,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",191510239.0,M7PNRH24BBM8,-79.955362,39.658047,
3,2022,"TRIANGLE AREA NETWORK, INC",1495 N 7th St,Beaumont,TX,77702-1345,H80,H80CS28977,28977,2015/08/01,2025/05/31,BPHC,Primary Health Care,Health Center Program (H80),To assist health centers in a Hurricane Helene...,Brian Babin,Jefferson County,N,N,John Cornyn,Ted Cruz,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",609896378.0,W3TKCN3G3R45,-94.120531,30.095351,
4,2022,THE SICKLE CELL ASSOCIATION OF NEW JERSEY INC,72 Abington Ave,Newark,NJ,07104-1426,D1J,D1JMC42477,42477,2021/09/01,2026/08/31,MCHB,Maternal and Child Health,Sickle Cell Disease Newborn Screening Follow-u...,,Robert Menendez,Essex County,N,N,Robert Menendez,George S. Helmy,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",967686580.0,UNMTSNWJZM31,-74.173821,40.767664,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
22712,2022,MINNESOTA DEPARTMENT OF HEALTH,625 Robert St N,Saint Paul,MN,55155,T29,T29HP46683,46683,2022/09/15,2025/09/14,BHW,Health Workforce,Community Health Worker Training Program (T29),This notice announces the opportunity to apply...,Betty McCollum,Ramsey County,N,N,Amy Klobuchar,Tina Smith,2024/11/04,No Link,,U.S. Government Entity,804887321.0,DHQVY2WCVHC5,-93.097776,44.954403,
22713,2022,"UNIVERSITY OF CALIFORNIA, DAVIS","1850 Research Park Dr, Ste 300",Davis,CA,95618-6153,T08,T08HP39324,39324,2020/07/01,2025/06/30,BHW,Health Workforce,Scholarships for Disadvantaged Students (T08),,Mike Thompson,Yolo County,N,N,Alex Padilla,Laphonza R. Butler,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",47120084.0,TX2DAGQPENZ5,-121.729909,38.543755,
22714,2022,KENT COUNTY MEMORIAL HOSPITAL,455 Toll Gate Rd,Warwick,RI,02886-2759,D58,D58HP37575,37575,2020/07/01,2025/06/30,BHW,Health Workforce,Residency Training in Primary Care (D58),,Seth Magaziner,Kent County,N,N,Jack Reed,Sheldon Whitehouse,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",69855195.0,NPXGTX5G5C74,-71.478336,41.704736,
22715,2022,University of Illinois,809 S Marshfield Ave,Chicago,IL,60612-4305,U77,U77HP26847,26847,2014/05/01,2027/08/31,BHW,Health Workforce,Area Health Education Centers (AHEC) Program (...,,Danny K. Davis,Cook County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/04,No Link,,U.S. Government Entity,98987217.0,W8XEAJDKMXH3,-87.667728,41.870292,


In [3]:
# get counts of grants within categories, within 'HRSA Program Area Name'
ehb_active_df['HRSA Program Area Name'].value_counts()

HRSA Program Area Name
Primary Health Care            7159
Health Workforce               6375
Maternal and Child Health      2885
HIV/AIDS                       2676
Rural Health                   1921
Healthcare Systems             1434
Office of the Administrator     267
Name: count, dtype: int64

In [4]:
# isolate 2023 data
ehb_active_2023_df = ehb_active_df[(ehb_active_df['Award Year'] == 2023)]

# create a key to narrow results so we can exclude data from 'Maternal and Child Health'
key = ehb_active_2023_df["HRSA Program Area Name"] == 'Maternal and Child Health'
nonmaternal_df = ehb_active_2023_df[~key] # exclude
maternal_df = ehb_active_2023_df[key] # include

In [5]:
# utilize key with 'keywords'
missedstuff_df = nonmaternal_df[nonmaternal_df['Grant Program Name'].str.contains('Infant|Maternal|Fetus|Unborn|Pregnan|Breast', regex=True, case=False)]

missedstuff_df

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
60,2023,HOWARD BROWN HEALTH CENTER,4025 N Sheridan Rd,Chicago,IL,60613-2010,H12,H12HA24805,24805,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Janice D. Schakowsky,Cook County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",10911980.0,K4K7GLAR8QN1,-87.654510,41.955207,
98,2023,"SUNSET PARK HEALTH COUNCIL, INC.",150 55th St,Brooklyn,NY,11220-2559,Q8M,Q8MCS49133,49133,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Daniel S. Goldman,Kings County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",785145843.0,DC4UE8MU2ZE8,-74.020541,40.646690,
174,2023,MAINLINE HEALTH SYSTEMS INC,233 N Main St,Portland,AR,71663-9230,Q8M,Q8MCS49307,49307,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Bruce Westerman,Ashley County,N,N,John Boozman,Tom Cotton,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",119842946.0,JEKKQBGWTZS5,-91.511351,33.238906,
256,2023,University of Florida,1523 Union Rd RM 207,Gainesville,FL,32611-1941,H12,H12HA24824,24824,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Kat Cammack,Alachua County,N,N,Marco Rubio,Rick Scott,2024/11/04,No Link,,U.S. Government Entity,969663814.0,NNFQH1JAPEP3,-82.342089,29.649732,
257,2023,COUNTY OF INGHAM,5303 S Cedar St,Lansing,MI,48911-3800,H12,H12HA24806,24806,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Elissa Slotkin,Ingham County,N,N,Debbie Stabenow,Gary C. Peters,2024/11/04,No Link,,U.S. Government Entity,31875656.0,MNXZAXJQTMN6,-84.548038,42.681075,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
8393,2023,CHERRY STREET SERVICES INC,100 Cherry St SE,Grand Rapids,MI,49503-4526,Q8M,Q8MCS49108,49108,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Hillary J. Scholten,Kent County,N,N,Debbie Stabenow,Gary C. Peters,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",603136417.0,JFKSJFHNA2F1,-85.665816,42.959516,
8402,2023,YOUR HEALTH CLINIC,1521 Baker Rd,Sherman,TX,75090-2409,H12,H12HA24844,24844,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Pat Fallon,Grayson County,N,N,John Cornyn,Ted Cruz,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",879477875.0,T6E1PLTJ3Q25,-96.596205,33.664001,
8418,2023,MARY HITCHCOCK MEMORIAL HOSPITAL,1 Medical Center Dr,Lebanon,NH,03756-1000,H12,H12HA31112,31112,2017/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Ann M. Kuster,Grafton County,N,N,Jeanne Shaheen,Margaret Wood Hassan,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",69910297.0,QYLXERHDAQL4,-72.273635,43.678113,
8482,2023,RESEARCH FOUNDATION FOR THE STATE UNIVERSITY O...,520 Lee Entrance STE 211,Amherst,NY,14228-2577,T34,T34HP42144,42144,2021/07/01,2026/06/30,BHW,Health Workforce,Primary Care Training and Enhancement-Communit...,,Timothy M Kennedy,Erie County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",38633251.0,LMCJKRFW5R81,-78.785538,43.002054,


In [6]:
# drop duplicate rows within 'Grant Program Name' to isolate unique 'Grant Activity Code' not contained within 'Maternal and Child Health'
missedstuff_df = missedstuff_df.drop_duplicates(subset = ('Grant Program Name'))

missedstuff_df

Unnamed: 0,Award Year,Grantee Name,Grantee Address,Grantee City,Grantee State Abbreviation,Grantee ZIP Code,Grant Activity Code,Grant Number,Grant Serial Number,Project Period Start Date,Grant Project Period End Date,HRSA Program Area Code,HRSA Program Area Name,Grant Program Name,Uniform Data System Grant Program Description,U.S. Congressional Representative Name,Complete County Name,U.S. - Mexico Border 100 Kilometer Indicator,U.S. - Mexico Border County Indicator,Name of U.S. Senator Number One,Name of U.S. Senator Number Two,Data Warehouse Record Create Date,Abstract,Grant Program Description,Grantee Type Description,DUNS Number,Unique Entity Identifier,Geocoding Artifact Address Primary X Coordinate,Geocoding Artifact Address Primary Y Coordinate,Unnamed: 29
60,2023,HOWARD BROWN HEALTH CENTER,4025 N Sheridan Rd,Chicago,IL,60613-2010,H12,H12HA24805,24805,2012/08/01,2026/07/31,HAB,HIV/AIDS,"Ryan White Title IV Women, Infants, Children, ...",Funding under this program supports current RW...,Janice D. Schakowsky,Cook County,N,N,Richard J. Durbin,Tammy Duckworth,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",10911980.0,K4K7GLAR8QN1,-87.65451,41.955207,
98,2023,"SUNSET PARK HEALTH COUNCIL, INC.",150 55th St,Brooklyn,NY,11220-2559,Q8M,Q8MCS49133,49133,2023/06/01,2025/05/31,BPHC,Primary Health Care,Quality Improvement Fund – Maternal Health (Q8M),This notice announces the opportunity for curr...,Daniel S. Goldman,Kings County,N,N,Charles E. Schumer,Kirsten E. Gillibrand,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",785145843.0,DC4UE8MU2ZE8,-74.020541,40.64669,
266,2023,MERCY MEMORIAL HOSPITAL CORP,718 N Macomb St,Monroe,MI,48162-7815,T34,T34HP42141,42141,2021/07/01,2026/06/30,BHW,Health Workforce,Primary Care Training and Enhancement-Communit...,,Tim Walberg,Monroe County,N,N,Debbie Stabenow,Gary C. Peters,2024/11/04,No Link,,"Corporate Entity, Federal Tax Exempt",63716542.0,SMDJQG62LLC8,-83.389124,41.924996,


In [7]:
# create condensed df
missedstuff_df = missedstuff_df[['Grant Activity Code', 'Grant Program Name', 'HRSA Program Area Name']]

# widen columns in df to show the end of 'Grant Program Name'
pd.set_option('display.max_colwidth', None)

missedstuff_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
60,H12,"Ryan White Title IV Women, Infants, Children, Youth and Affected Family Members AIDS Healthcare (H12)",HIV/AIDS
98,Q8M,Quality Improvement Fund – Maternal Health (Q8M),Primary Health Care
266,T34,Primary Care Training and Enhancement-Community Prevention and Maternal Health (T34),Health Workforce


In [8]:
# Slice off 'Grant Activity Code' form 'Grant Program Name'
###***** don't run this cell more than once, it will contiuouly slice 5 from the end of the string, restart Kernel to restore values

missedstuff_df['Grant Program Name'] = missedstuff_df['Grant Program Name'].str.slice(0, -5)

missedstuff_df

Unnamed: 0,Grant Activity Code,Grant Program Name,HRSA Program Area Name
60,H12,"Ryan White Title IV Women, Infants, Children, Youth and Affected Family Members AIDS Healthcare",HIV/AIDS
98,Q8M,Quality Improvement Fund – Maternal Health,Primary Health Care
266,T34,Primary Care Training and Enhancement-Community Prevention and Maternal Health,Health Workforce


In [9]:
# export Julia's df to a .csv file 'missedstuff_df'
missedstuff_df.to_csv('data/output/missed_grant_program_codes.csv', index=False)