In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline

# Project Objective
Investigate whether there is any measurable difference in progress based on the eligibility category. There are three options:
*Preliminary Analysis*
+ Developmental evaluation (delay)
+ Diagnosed condition
+ Diagnosed condition, developmental evaluation (by both delay and diagnosis)
1. Start by looking at overall progress by eligibility category (column AI of the "Elig Timeline Rpt 2018-2022" tab)
2. Factor in the time of service ("ECO with Exit21-22" tab)
3. Do the above comparison by POE as well (column A of the "ECO with Exit21-22")
*Additional Analysis*
Additional areas you can look into are listed below:
+ Does typical time of service differ for different eligibility categories?


In [None]:
# Open the TEIS workbook once so both sheets are parsed from the same handle.
workbook_path = "../Data/TEIS_NSS_Project_Data_10_2022.xlsx"
teis = pd.ExcelFile(workbook_path)

# nrows caps how many data rows are read from each sheet.
# NOTE(review): presumably these caps exclude trailing non-data rows — confirm against the workbook.
eco_21_22_exit = pd.read_excel(teis, sheet_name='ECO with Exit21-22', nrows=8633)
elig = pd.read_excel(teis, sheet_name='Elig Timeline Rpt 2018-2022', nrows=67611)

In [None]:
# Store CHILD_ID as a 64-bit integer so it can be used as a join key.
# Missing IDs are replaced with the sentinel 0 before the cast, because an
# int64 column cannot hold NaN.
# NOTE(review): rows with a missing ID all share the value 0 afterwards — confirm
# that no real child uses ID 0 before joining on this column.
eco_21_22_exit["CHILD_ID"] = eco_21_22_exit["CHILD_ID"].fillna(0).astype(np.int64)
eco_21_22_exit

In [None]:
# Number of eligibility records in each of the three initial eligibility
# categories. value_counts() is computed once, and reindex() reports 0 for a
# category that does not occur instead of raising KeyError.
elig_categories = [
    'Developmental Evaluation',
    'Diagnosed Condition',
    'Diagnosed Condition, Developmental Evaluation',
]
elig['Init. Elig. Category'].value_counts().reindex(elig_categories, fill_value=0)

In [None]:
# Keep only the child identifier and the initial eligibility category.
elig_columns = ['Child ID', 'Init. Elig. Category']
elig = elig.loc[:, elig_columns]

In [None]:
# Keep only the child identifier plus the date and duration columns used below.
eco_columns = [
    'CHILD_ID',
    'ECO_Entry_DATE',
    'ECO_Exit_DATE',
    'Exit Date',
    'Days btw Initial and Exit',
    'Days btw I-IFSP to Exit ECO',
]
eco_21_22_exit = eco_21_22_exit.loc[:, eco_columns]

In [None]:
# Rename the key column so it matches 'CHILD_ID' in the ECO sheet.
# Reassigning (rather than inplace=True) avoids mutating a frame that was
# produced by slicing another frame.
elig = elig.rename(columns={'Child ID': 'CHILD_ID'})

In [None]:
# Inner join: keep only children that appear in both the eligibility data and
# the ECO exit data, matched on CHILD_ID.
# NOTE(review): if a CHILD_ID occurs more than once on either side, the join
# produces one row per matching pair — confirm key uniqueness.
eco_exit_elig = elig.merge(eco_21_22_exit, on="CHILD_ID", how="inner")

In [None]:
# Display the merged eligibility / ECO exit frame for inspection.
eco_exit_elig

Compute the total number of days between ECO entry and ECO exit.

In [None]:
# Days elapsed between ECO entry and ECO exit, as a float number of days.
eco_span = eco_exit_elig['ECO_Exit_DATE'].sub(eco_exit_elig['ECO_Entry_DATE'])
eco_exit_elig['TOTAL DAYS IN ECO'] = eco_span / pd.Timedelta(days=1)

In [None]:
# Display the frame again to check the new 'TOTAL DAYS IN ECO' column.
eco_exit_elig

In [None]:
# Days elapsed between ECO entry and the 'Exit Date' column, as a float number of days.
entry_to_exit_span = eco_exit_elig['Exit Date'].sub(eco_exit_elig['ECO_Entry_DATE'])
eco_exit_elig['ECO_ENTRY to Exit Date'] = entry_to_exit_span / pd.Timedelta(days=1)

Filter out cases where the total time in ECO was less than 6 months (183 days), and drop rows where 'Days btw I-IFSP to Exit ECO' is negative.

In [None]:
# Keep rows with at least 183 days in ECO and a non-negative
# 'Days btw I-IFSP to Exit ECO'. Rows with a missing value in either column
# fail the comparison and are dropped.
min_days_in_eco = 183
long_enough = eco_exit_elig['TOTAL DAYS IN ECO'] >= min_days_in_eco
non_negative_ifsp = eco_exit_elig['Days btw I-IFSP to Exit ECO'] >= 0
eco_exit_elig = eco_exit_elig[long_enough & non_negative_ifsp]

In [None]:
# Display the frame after the duration filters have been applied.
eco_exit_elig

In [None]:
# Mean of each duration column per initial eligibility category.
# The columns are selected with a list: indexing a GroupBy with a bare tuple of
# names is deprecated in pandas 1.x and raises ValueError in pandas 2.x.
duration_columns = [
    "Days btw Initial and Exit",
    "Days btw I-IFSP to Exit ECO",
    "TOTAL DAYS IN ECO",
    "ECO_ENTRY to Exit Date",
]
eco_exit_elig.groupby('Init. Elig. Category', as_index=False)[duration_columns].mean()