In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
%matplotlib inline


#  Project Objective
Investigate whether there is any measurable difference in progress based on the eligibility category. There are three eligibility categories (the bulleted items below):
*Preliminary Analysis*
+ Developmental evaluation (delay)
+ Diagnosed condition
+ Diagnosed condition, developmental evaluation (by both delay and diagnosis)
1. Start by looking at overall progress by eligibility category (column AI of the "Elig Timeline Rpt 2018-2022" tab)
2. Factor in the time of service ("ECO with Exit21-22" tab)
3. Do the above comparison by POE as well (column A of the "ECO with Exit21-22" tab)
*Additional Analysis*
Additional areas you can look into are listed below:
+ Does typical time of service differ for different eligibility categories?
+ Do exit reasons vary by eligibility category? Do more children in one eligibility category age out compared to leaving for other reasons?
+ The "ECO with Exit21-22" tab contains the entry ECO scores (columns D, E, and F) and exit scores (columns H, I, and J). Analyze these scores by looking at the typical improvement seen for each entry rating compared to the time of service. What percentage of children entering with a score of 1 also exit with a score of 1? How many improve to a 2 or a 3? How does this vary by time of service?

In [None]:
# Load the two worksheets used in this analysis from the TEIS workbook.
# The path, sheet names and row limits are named so they can be reviewed and tuned in one place.
TEIS_WORKBOOK = "../Data/TEIS_NSS_Project_Data_10_2022.xlsx"
ECO_SHEET = "ECO with Exit21-22"
ELIG_SHEET = "Elig Timeline Rpt 2018-2022"
# Maximum number of data rows read from each sheet; anything below these rows is ignored.
# NOTE(review): presumably these limits cut off trailing non-data rows in the workbook — confirm against the file.
ECO_NROWS = 8633
ELIG_NROWS = 67611

# Open the workbook once and read both sheets through the same handle.
# NOTE(review): the ExcelFile handle stays open; call teis.close() once no further sheets are needed.
teis = pd.ExcelFile(TEIS_WORKBOOK)
eco = pd.read_excel(teis, sheet_name=ECO_SHEET, nrows=ECO_NROWS)
elig = pd.read_excel(teis, sheet_name=ELIG_SHEET, nrows=ELIG_NROWS)


In [None]:
# Preview the first rows of the ECO frame to sanity-check the load.
eco.head()

In [None]:
# Print a summary of the ECO frame: columns, non-null counts and dtypes.
eco.info()

In [None]:
# Print a summary of the eligibility frame: columns, non-null counts and dtypes.
elig.info()

In [None]:
# Preview the first rows of the eligibility frame.
elig.head()

In [None]:
# Per-column dtypes of the eligibility frame (also reported by elig.info()).
elig.dtypes

In [None]:
# Per-column dtypes of the ECO frame (also reported by eco.info()).
eco.dtypes

In [None]:
# Cast CHILD_ID to a plain int64 column.
# Missing IDs are replaced with 0 first because NaN cannot be stored in an int64 column.
# NOTE(review): 0 therefore acts as a "missing ID" sentinel — confirm that no real child
# has ID 0 and decide how such rows should be treated in the merge on CHILD_ID.
# astype performs the cast in one vectorized step instead of calling np.int64 per element.
eco["CHILD_ID"] = eco["CHILD_ID"].fillna(0).astype(np.int64)
# Display the frame to confirm the new dtype/values.
eco

In [None]:
# Number of rows whose initial eligibility category is exactly "Developmental Evaluation".
print(
    elig['Init. Elig. Category']
    .value_counts()
    .loc['Developmental Evaluation']
)

In [None]:
# Number of rows whose initial eligibility category is exactly "Diagnosed Condition".
print(
    elig['Init. Elig. Category']
    .value_counts()
    .loc['Diagnosed Condition']
)

In [None]:
# Number of rows whose initial eligibility category is exactly
# "Diagnosed Condition, Developmental Evaluation" (eligible by both routes).
print(
    elig['Init. Elig. Category']
    .value_counts()
    .loc['Diagnosed Condition, Developmental Evaluation']
)

In [None]:
# Keep only the district, the child ID and the initial eligibility category.
elig = elig.loc[:, ['District', 'Child ID', 'Init. Elig. Category']]

In [None]:
# Display the eligibility frame after it was trimmed to three columns.
elig

In [None]:
# Restrict the ECO frame to the identifiers, the entry/exit dates and the
# three entry and three exit scale columns.
eco = eco.loc[
    :,
    [
        'DISTRICT',
        'CHILD_ID',
        'ECO_Entry_DATE',
        'Ent SOCIAL_SCALE',
        'Ent KNOWLEDGE_SCALE',
        'Ent APPROPRIATE_ACTION_SCALE',
        'ECO_Exit_DATE',
        'Exit SOCIAL_SCALE',
        'Exit KNOWLEDGE_SCALE',
        'Exit APPROPRIATE_ACTION_SCALE',
    ],
]

In [None]:
# Display the ECO frame after it was trimmed to the selected columns.
eco

In [None]:
# Give the eligibility frame the same key column names as the ECO frame
# ('DISTRICT', 'CHILD_ID') so the two can be merged on them.
# Reassigning the result (rather than inplace=True) avoids mutating a frame that came
# from a column selection, which can raise SettingWithCopyWarning.
elig = elig.rename(columns={'District': 'DISTRICT', 'Child ID': 'CHILD_ID'})

In [None]:
# Outer-join the ECO scores with the eligibility categories on district and child ID,
# keeping rows that appear in only one of the two frames.
# NOTE(review): if elig holds several rows per (DISTRICT, CHILD_ID), the matching ECO rows
# will be repeated in the result — verify key uniqueness before aggregating.
eco_elig = eco.merge(elig, on=["DISTRICT", "CHILD_ID"], how="outer")

In [None]:
# Preview the first rows of the merged frame.
eco_elig.head()

In [None]:
# Preview the last rows of the merged frame.
eco_elig.tail()

In [None]:
# Print a summary of the merged frame; the non-null counts show how many rows
# have values in each of the ECO and eligibility columns after the outer join.
eco_elig.info()