# Overview
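The purpose of this analysis is to count the unique synthetic beneficiaries (distinct `BENE_ID` values) in each claim type: inpatient, outpatient, carrier, DME, HHA, hospice, and SNF. The data used for this analysis can be downloaded from Data.gov. <br>
Note: Only claims whose `CLM_FROM_DT` falls in 2021 are included.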

#  Load libraries

In [1]:
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib

# Load data

In [2]:
def _load_claims(csv_path):
    """Read one pipe-delimited claims file into a DataFrame.

    low_memory=False is passed so pandas does not parse the file in
    internal chunks (chunked parsing can yield mixed-type columns).
    """
    return pd.read_csv(csv_path, sep="|", low_memory=False)


# One DataFrame per claim type; the shape is printed right after each load.
synthetic_inpatient_df = _load_claims('data/inpatient.csv')
print(f"inpatient shape {synthetic_inpatient_df.shape}")

synthetic_outpatient_df = _load_claims('data/outpatient.csv')
print(f"outpatient shape{synthetic_outpatient_df.shape}")

synthetic_carrier_df = _load_claims('data/carrier.csv')
print(f"carrier shape {synthetic_carrier_df.shape}")

synthetic_dme_df = _load_claims('data/dme.csv')
print(f"dme shape {synthetic_dme_df.shape}")

synthetic_hha_df = _load_claims('data/hha.csv')
print(f"hha shape {synthetic_hha_df.shape}")

synthetic_hospice_df = _load_claims('data/hospice.csv')
print(f"hospice shape {synthetic_hospice_df.shape}")

synthetic_snf_df = _load_claims('data/snf.csv')
print(f"snf shape {synthetic_snf_df.shape}")

inpatient shape (39123, 275)
outpatient shape(238718, 234)
carrier shape (1308798, 99)
dme shape (49146, 95)
hha shape (21645, 131)
hospice shape (97186, 129)
snf shape (359990, 230)


# Calculate the number of unique synthetic beneficiaries in 2021

In [3]:
# Claim-start years to keep (2021 only).
values = [2021]


def _restrict_to_years(claims_df, years):
    """Tag each claim with its start year and keep only the requested years.

    CLM_FROM_DT is converted to datetime and a CLM_FROM_YR column is added
    on the frame that is passed in; the returned frame holds only the rows
    whose CLM_FROM_YR is in ``years``.
    """
    claims_df['CLM_FROM_DT'] = pd.to_datetime(claims_df['CLM_FROM_DT'])
    claims_df['CLM_FROM_YR'] = claims_df['CLM_FROM_DT'].dt.year
    in_scope = claims_df.CLM_FROM_YR.isin(years)
    return claims_df[in_scope]


# Apply the same year filter to every claim type, in the original order.
synthetic_inpatient_df = _restrict_to_years(synthetic_inpatient_df, values)
synthetic_outpatient_df = _restrict_to_years(synthetic_outpatient_df, values)
synthetic_carrier_df = _restrict_to_years(synthetic_carrier_df, values)
synthetic_dme_df = _restrict_to_years(synthetic_dme_df, values)
synthetic_hha_df = _restrict_to_years(synthetic_hha_df, values)
synthetic_hospice_df = _restrict_to_years(synthetic_hospice_df, values)
synthetic_snf_df = _restrict_to_years(synthetic_snf_df, values)

# Report the count of distinct BENE_IDs for each service type.
claims_by_service = (
    ("inpatient", synthetic_inpatient_df),
    ("outpatient", synthetic_outpatient_df),
    ("carrier", synthetic_carrier_df),
    ("dme", synthetic_dme_df),
    ("hha", synthetic_hha_df),
    ("hospice", synthetic_hospice_df),
    ("snf", synthetic_snf_df),
)
for service_label, service_claims in claims_by_service:
    # Selecting with [['BENE_ID']] keeps a one-column frame, so nunique()
    # yields a Series and the printout includes the column name and dtype.
    print(f"{service_label} {service_claims[['BENE_ID']].nunique()}\n")

inpatient BENE_ID    1918
dtype: int64

outpatient BENE_ID    9326
dtype: int64

carrier BENE_ID    9411
dtype: int64

dme BENE_ID    4480
dtype: int64

hha BENE_ID    168
dtype: int64

hospice BENE_ID    300
dtype: int64

snf BENE_ID    411
dtype: int64

