In [None]:
#Importing Packages
import pandas as pd
from pathlib import Path
import openpyxl
import seaborn as sns
import matplotlib.pyplot as plt
from matplotlib import rcParams


In [None]:
# Load the Crisis v1 workbook (skipping the first two rows of the sheet),
# wrap the result in a DataFrame, and preview the first five records.
crisisv1 = pd.read_excel(
    '../data/NSSCrisisv.1.xlsx',
    skiprows=2,
)
crisisv1_df = pd.DataFrame(data=crisisv1)
crisisv1_df.head(n=5)

In [None]:
# Preview the last five rows of the v1 frame
crisisv1_df.tail()

In [None]:
#Viewing info about Crisis v1 Dataframe
crisisv1_df.info()

In [None]:
#Getting a sum of null values
# (one null count per column)
crisisv1_df.isnull().sum()

In [None]:
# Number of v1 rows with no postal code recorded
nullPostCodes = crisisv1_df.PostalCode.isnull().sum()
nullPostCodes 

In [None]:
# Number of v1 rows that do have a postal code; combined with the v2 count
# further down to form the denominator for the all-years postal code shares
nonNullPostCodesV1 = crisisv1_df.PostalCode.notnull().sum()
nonNullPostCodesV1 

In [None]:
# Cast the call start timestamp to text, slice its first four characters into a
# new call_year column (presumably the year, given the column name), and
# re-check the schema.
crisisv1_df['CallDateAndTimeStart'] = crisisv1_df['CallDateAndTimeStart'].astype(str)
crisisv1_df['call_year'] = crisisv1_df['CallDateAndTimeStart'].str.slice(0, 4)
crisisv1_df.info()

In [None]:
# Boolean mask selecting the v1 rows whose call_year string is '2020'
filter2020 = crisisv1_df['call_year'].isin(['2020'])
crisisZip2020 = crisisv1_df[filter2020]
crisisZip2020

In [None]:
# Number of 2020 v1 calls that have a postal code recorded
# (used further down as the denominator for the 2020 postal code shares)
nonNullPostCodesV1_2020 = crisisZip2020.PostalCode.notnull().sum()
nonNullPostCodesV1_2020 

In [None]:
# Same selection for call_year '2021'
filter2021 = crisisv1_df['call_year'].isin(['2021'])
crisisZip2021 = crisisv1_df[filter2021]
crisisZip2021

In [None]:
# Number of 2021 v1 calls that have a postal code recorded
# (used further down as the denominator for the 2021 postal code shares)
nonNullPostCodesV1_2021 = crisisZip2021.PostalCode.notnull().sum()
nonNullPostCodesV1_2021

In [None]:
# Preview what would remain if every row containing at least one null were dropped.
# dropna() returns a new frame and does not modify crisisv1_df, so info() is
# called on the returned frame to show the actual effect. crisisv1_df itself is
# deliberately left intact because later cells still rely on rows that contain nulls.
crisisv1_df.dropna().info()

In [None]:
#Viewing resulting dataframe
crisisv1_df

In [None]:
#Dropping all null value columns and viewing resulting info
# how='all' with axis=1 removes only columns in which every value is null;
# inplace=True mutates crisisv1_df, so re-running earlier cells will see the
# reduced column set
crisisv1_df.dropna(how='all', axis=1, inplace=True)
crisisv1_df.info()
 

In [None]:
#Viewing resulting dataframe
crisisv1_df

In [None]:
# Load the Crisis v2 workbook (skipping the first two rows of the sheet),
# wrap the result in a DataFrame, and preview the first five records.
crisisv2 = pd.read_excel(
    '../data/NSSCrisisv.2.xlsx',
    skiprows=2,
)
crisisv2_df = pd.DataFrame(data=crisisv2)
crisisv2_df.head(n=5)

In [None]:
# Preview the last five rows of the v2 frame
crisisv2_df.tail()

In [None]:
# Number of v2 rows with no postal code recorded
nullPostCodesV2 = crisisv2_df.PostalCode.isnull().sum()
nullPostCodesV2

In [None]:
# Number of v2 rows that do have a postal code; combined with the v1 count
# further down to form the denominator for the all-years postal code shares
nonNullPostCodesV2 = crisisv2_df.PostalCode.notnull().sum()
nonNullPostCodesV2

In [None]:
# Cast the call start timestamp to text, slice its first four characters into a
# new call_year column (presumably the year, given the column name), and
# re-check the schema.
crisisv2_df['CallDateAndTimeStart'] = crisisv2_df['CallDateAndTimeStart'].astype(str)
crisisv2_df['call_year'] = crisisv2_df['CallDateAndTimeStart'].str.slice(0, 4)
crisisv2_df.info()

In [None]:
# Boolean mask selecting the v2 rows whose call_year string is '2022'
filter2022 = crisisv2_df['call_year'].isin(['2022'])
crisisZip2022 = crisisv2_df[filter2022]
crisisZip2022

In [None]:
# Number of 2022 v2 calls that have a postal code recorded
# (used further down as the denominator for the 2022 postal code shares)
nonNullPostCodesV2_2022 = crisisZip2022.PostalCode.notnull().sum()
nonNullPostCodesV2_2022 

In [None]:
# Preview what would remain if every row containing at least one null were dropped.
# dropna() returns a new frame and does not modify crisisv2_df, so info() is
# called on the returned frame to show the actual effect. crisisv2_df itself is
# deliberately left intact because later cells still rely on rows that contain nulls.
crisisv2_df.dropna().info()

In [None]:
#Viewing resulting dataframe
crisisv2_df

In [None]:
#Dropping all null value columns and viewing resulting info
# how='all' with axis=1 removes only columns in which every value is null;
# inplace=True mutates crisisv2_df, so re-running earlier cells will see the
# reduced column set
crisisv2_df.dropna(how='all', axis=1, inplace=True)
crisisv2_df.info()

In [None]:
#Viewing resulting dataframe
crisisv2_df

In [None]:
#Concatenating the Crisis v1 and v2 Dataframes and viewing resulting dataframe
# ignore_index=True gives the combined frame a fresh 0..n-1 index. Without it
# each input keeps its own row labels, so the same labels appear twice in the
# result and label-based selection becomes ambiguous.
crisis1and2_df = pd.concat([crisisv1_df, crisisv2_df], ignore_index=True)
crisis1and2_df

In [None]:
# Schema and non-null counts of the combined frame
crisis1and2_df.info()

In [None]:
# Display the combined frame
crisis1and2_df

In [None]:
# Summary statistics of the combined frame
crisis1and2_df.describe()

In [None]:
# Keep every column whose label contains the substring 'Demographics'.
# filter(like=...) does the substring match on the string form of each label,
# so it also tolerates non-string column labels (the hand-built boolean list
# raised a TypeError on those).
demographics = crisis1and2_df.filter(like='Demographics', axis='columns')

In [None]:
# Non-null count for each selected demographics column
demographics.count()

In [None]:
# Call counts per caller age bracket, most frequent first.
topAgeBracket = crisis1and2_df['CRISIS Demographics - Age'].value_counts()
# Drops the eighth most frequent value by position.
# NOTE(review): presumably a non-bracket category; the position is data dependent,
# so confirm which label this removes and consider dropping it by name instead.
topAgeBracket = topAgeBracket.drop(topAgeBracket.index[7])
# Name the index and the value column explicitly rather than relying on the
# default column names produced by reset_index(), which differ between pandas
# versions ('index' vs. the original column name, and the counts column name).
# The resulting columns are always 'Age Bracket' and 'CRISIS Demographics - Age',
# which is what the bar plot cell expects.
topAgeBracket_df = (
    topAgeBracket
    .rename_axis('Age Bracket')
    .reset_index(name='CRISIS Demographics - Age')
    .sort_values(by='Age Bracket')
)
topAgeBracket_df


In [None]:
#Viridis
# Bar chart of call volume per age bracket.
# A single sns.set call is used because every sns.set call resets the theme to
# its defaults, so the earlier font_scale=10 was overwritten by the later
# sns.set(rc=...) and never took effect. Text sizes are set explicitly below.
sns.set(style='darkgrid', rc={"figure.figsize":(15,12)})
cmap = sns.color_palette('viridis')
ax = sns.barplot(x='Age Bracket', y='CRISIS Demographics - Age', data=topAgeBracket_df, palette=cmap)
plt.xlabel('Age Bracket', fontdict= {'fontsize':20, 'fontweight':'bold'})
plt.ylabel('Call Volume', fontdict= {'fontsize':20, 'fontweight':'bold'})
plt.title("Call Volume by Age Bracket",fontdict= { 'fontsize': 30, 'fontweight':'bold','verticalalignment': 'center'})
plt.xticks(fontsize=17, rotation=60)
# The trailing semicolon suppresses the text repr of the last call. It must sit
# on the statement itself because a line containing only ';' is a SyntaxError.
plt.yticks(fontsize=17);

#Gradient One
#sns.set(font_scale = 10)
#sns.set_style('darkgrid')
#sns.set(rc={"figure.figsize":(15,12)})
#cmap = sns.color_palette('light:#5A9')
#ax = sns.barplot(x='Age Bracket', y='CRISIS Demographics - Age', data=topAgeBracket_df, palette=cmap)
#cmap = sns.color_palette('viridis')
#plt.xlabel('Age Bracket', fontdict= {'fontsize':20, 'fontweight':'bold'})
#plt.ylabel('Call Volume', fontdict= {'fontsize':20, 'fontweight':'bold'})
#plt.title("Call Volume by Age Bracket",fontdict= { 'fontsize': 30, 'fontweight':'bold','verticalalignment': 'center'})
#plt.xticks(fontsize=17, rotation=60)
#plt.yticks(fontsize=17)
#;

#Gradient Two
#sns.set(font_scale = 10)
#sns.set_style('darkgrid')
#sns.set(rc={"figure.figsize":(15,12)})
#cmap = sns.color_palette('ch:s=.25,rot=-.25')
#ax = sns.barplot(x='Age Bracket', y='CRISIS Demographics - Age', data=topAgeBracket_df, palette=cmap)
#cmap = sns.color_palette('viridis')
#plt.xlabel('Age Bracket', fontdict= {'fontsize':20, 'fontweight':'bold'})
#plt.ylabel('Call Volume', fontdict= {'fontsize':20, 'fontweight':'bold'})
#plt.title("Call Volume by Age Bracket",fontdict= { 'fontsize': 30, 'fontweight':'bold','verticalalignment': 'center'})
#plt.xticks(fontsize=17, rotation=60)
#plt.yticks(fontsize=17)
#;

In [None]:
# Postal codes to exclude outright (two non-numeric, Canadian-format codes).
codes = ['K1A 0A1', 'V5K 0A1']
# .copy() makes the filtered result an independent frame, so the column
# assignment below does not raise SettingWithCopyWarning.
crisis1and2_df = crisis1and2_df[~crisis1and2_df['PostalCode'].isin(codes)].copy()
# Normalise postal codes to digit strings: missing values become the placeholder
# '0', and the int round-trip strips any decimal part (e.g. 37075.0 -> '37075').
# NOTE(review): astype(int) raises if any other non-numeric code is present, and
# it would strip leading zeros from codes that have them.
crisis1and2_df['PostalCode'] = (
    crisis1and2_df['PostalCode']
    .fillna(0)
    .astype(int)
    .astype(str)
)
crisis1and2_df['PostalCode'].dtypes

In [None]:
# Count callers per age bracket within each postal code and preview the first 20 rows.
highestAgeBracketCount = (
    crisis1and2_df
    .groupby('PostalCode')['CRISIS Demographics - Age']
    .value_counts()
)
highestAgeBracketCount_df = highestAgeBracketCount.to_frame()
highestAgeBracketCount_df.head(20)

In [None]:
# Number of non-null PostalCode entries in the combined frame
zipCount = crisis1and2_df['PostalCode'].count()
zipCount

In [None]:
# Getting counts of differing postal codes of callers
#postalCodes = crisis1and2_df['PostalCode'].unique() 
# One row per distinct postal code, ordered by call count (highest first)
postalCodeCount = crisis1and2_df['PostalCode'].value_counts().to_frame()
postalCodeCount


In [None]:
# Recompute the age bracket counts on the cleaned frame and show them as a table.
# The eighth most frequent value is removed by position, as in the earlier cell.
# Note that this rebinds topAgeBracket_df to a frame indexed by bracket.
topAgeBracket = crisis1and2_df['CRISIS Demographics - Age'].value_counts()
topAgeBracket = topAgeBracket.drop(labels=topAgeBracket.index[7])
topAgeBracket_df = topAgeBracket.to_frame()
topAgeBracket_df

In [None]:
#Getting Top 10 postal codes based on call volume across all years
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label before taking the top ten. Dropping "whatever is in first
# place" by position would discard a real postal code if the placeholder were
# not the most frequent value. errors='ignore' covers data with no missing codes.
postalCodeTop10_df = postalCodeCount.drop(index='0', errors='ignore').head(10)
postalCodeTop10_df


In [None]:
# Keep only the calls whose postal code is one of these ten hard-coded values
# (presumably the top ten by call volume found above; TODO confirm they are still current).
top10zip = crisis1and2_df[
    crisis1and2_df['PostalCode'].isin([
        '37075', '37115', '38012', '37211', '37138',
        '37013', '37857', '37207', '37238', '37130',
    ])
]
top10zip.head()

In [None]:
# Table of call counts with one row per postal code and one column per age bracket.
# Column order shown in the table (and used by any plot built from it).
ageBracketColumns = ['56-70', '70-85', '13-17', '41-55', '25-30', '18-24', '31-40']
top10zipAge = (
    top10zip.groupby('PostalCode')['CRISIS Demographics - Age']
    .value_counts(sort=True, ascending=True)
    # Postal code / bracket pairs with no calls become 0 instead of NaN.
    .unstack(fill_value=0)
    # reindex keeps only the listed brackets and adds an all-zero column for any
    # bracket absent from the data, where plain column selection raised KeyError.
    .reindex(columns=ageBracketColumns, fill_value=0)
    .astype(int)
)
top10zipAge

In [None]:
# Top 5 zip codes: keep only the calls from these five hard-coded postal codes
# (presumably the five busiest found above; TODO confirm they are still current).
top5zip = crisis1and2_df[
    crisis1and2_df['PostalCode'].isin(
        ['37075', '37115', '38012', '37211', '37138']
    )
]
top5zip.head()

In [None]:
#Number of callers in each age bracket for each of the top 5 zip codes
top5zipAge = top5zip.groupby('PostalCode')['CRISIS Demographics - Age'].value_counts()
# Two (postal code, age value) entries are removed by position.
# NOTE(review): the positions are data dependent; confirm which entries these are
# and consider dropping them by label instead.
top5zipAge = top5zipAge.drop(top5zipAge.index[5])
top5zipAge = top5zipAge.drop(top5zipAge.index[-3])
# Column order shown in the table and in the grouped bar chart built from it.
ageBracketColumns = ['56-70', '70-85', '13-17', '41-55', '25-30', '18-24', '31-40']
top5zipAge = (
    top5zipAge
    # Postal code / bracket pairs with no calls become 0 instead of NaN.
    .unstack(fill_value=0)
    # reindex keeps only the listed brackets and adds an all-zero column for any
    # bracket absent from the data, where plain column selection raised KeyError.
    .reindex(columns=ageBracketColumns, fill_value=0)
    .astype(int)
)
# Expose the postal code (the index) as a regular column as well.
top5zipAge['Postal Code'] = top5zipAge.index
top5zipAge


In [None]:
# Column dtypes of the top-5 age table
top5zipAge.dtypes

In [None]:
# Zip code reference table; 'zip' is read as a string so it can be matched
# against the string PostalCode column of the crisis data
zip2013 = pd.read_csv('../data/US Zip Codes from 2013 Government Data.csv', dtype={'zip': 'string'})
zip2013.head()

In [None]:
# Left join: every crisis record is kept, and the zip reference columns are
# attached where PostalCode matches zip
zipPlusCrisis1And2 = crisis1and2_df.merge(zip2013, left_on='PostalCode', right_on='zip', how='left')
zipPlusCrisis1And2

In [None]:
# Grouped bar chart: call volume per age bracket for each of the top 5 zip codes.
ax = top5zipAge.plot(kind='bar', figsize=(7, 5), cmap='viridis', rot=0, width=.8)
ax.legend(title='Age Bracket', bbox_to_anchor=(1,1), loc='upper left')
ax.set_title('Top 5 Zip Codes based on Call Volume per Age Bracket', fontsize=20)
ax.set_xlabel(xlabel='Zip Code', fontsize=12)
ax.set_ylabel('Call Volume', fontsize=12)
plt.xticks(rotation=60)
# Title and axis labels are set before tight_layout()/savefig() so the layout
# accounts for them and the saved image contains them.
plt.tight_layout()
plt.savefig('Top 5 Zip Codes based on Call Volume per Age Bracket')
plt.show()

In [None]:
#Top 3 zip codes
# Hard-coded postal codes (presumably the three busiest found above; TODO confirm)
top3zip = crisis1and2_df.loc[crisis1and2_df['PostalCode'].isin(['37075', '37115', '38012'])]
top3zip.head()

In [None]:
# Age bracket counts within each of the three postal codes
top3zipAge = top3zip.groupby('PostalCode')['CRISIS Demographics - Age'].value_counts()
# Removes the sixth entry by position.
# NOTE(review): position is data dependent; confirm which (postal code, age) entry this is
top3zipAge = top3zipAge.drop(top3zipAge.index[5])
top3zipAge

In [None]:
#Number of callers for each gender identity in the top 5 zip codes
# Long format: one row per (postal code, gender identity) pair
top5zipGendIdent = top5zip.groupby('PostalCode')['CRISIS Demographics - Gender Identity'].value_counts()
top5zipGendIdent

In [None]:
#Number of callers in each gender identity for each of the top 5 zip codes
# Wide format: one row per postal code and one column per gender identity.
top5zipGenderId = (
    top5zip.groupby('PostalCode')['CRISIS Demographics - Gender Identity']
    .value_counts()
    # Postal code / identity pairs with no calls become 0 instead of NaN.
    .unstack(fill_value=0)
    # reindex keeps only the listed identities and adds an all-zero column for any
    # that is absent from the data, where plain column selection raised KeyError.
    .reindex(columns=['Female', 'Male', 'Transgender'], fill_value=0)
    .astype(int)
)
top5zipGenderId

In [None]:
# Grouped bar chart: call volume per gender identity for each of the top 5 zip codes.
ax = top5zipGenderId.plot(kind='bar', figsize=(7, 5), cmap='viridis', rot=0, width=.8)
# Legend title spelling corrected (was 'Gender Indentity').
ax.legend(title='Gender Identity', bbox_to_anchor=(1,1), loc='upper left')
ax.set_title('Top 5 Zip Codes based on Call Volume per Gender Identity', fontsize=15)
ax.set_xlabel(xlabel='Zip Code', fontsize=12)
ax.set_ylabel('Call Volume', fontsize=12)
plt.xticks(rotation=60)
# Title and axis labels are set before tight_layout()/savefig() so the layout
# accounts for them and the saved image contains them.
plt.tight_layout()
plt.savefig('Top 5 Zip Codes based on Call Volume per Gender Identity')
plt.show()

In [None]:
#Number of callers in each military status for each of the top 5 zip codes
# Wide format: one row per postal code and one column per military status.
top5zipMilit = (
    top5zip.groupby('PostalCode')['CRISIS Demographics - Military']
    .value_counts()
    # Postal code / status pairs with no calls become 0 instead of NaN.
    .unstack(fill_value=0)
    # reindex keeps only the listed statuses and adds an all-zero column for any
    # that is absent from the data, where plain column selection raised KeyError.
    .reindex(
        columns=['3rd Party Calling about Veteran', 'Family of Military', 'Veteran'],
        fill_value=0,
    )
    .astype(int)
)
top5zipMilit

In [None]:
# Grouped bar chart: call volume per military status for each of the top 5 zip codes.
ax = top5zipMilit.plot(kind='bar', figsize=(7, 5), cmap='viridis', rot=0, width=.8)
ax.legend(title='Military Status', bbox_to_anchor=(1,1), loc='upper left')
ax.set_title('Top 5 Zip Codes based on Call Volume per Military Status', fontsize=15)
# set_xlabel expects text; passing False rendered the literal label "False".
# The axis is labelled the same way as the age and gender identity charts.
ax.set_xlabel(xlabel='Zip Code', fontsize=12)
ax.set_ylabel('Call Volume', fontsize=12)
plt.xticks(rotation=60)
# Title and axis labels are set before tight_layout()/savefig() so the layout
# accounts for them and the saved image contains them.
plt.tight_layout()
plt.savefig('Top 5 Zip Codes based on Call Volume per Military Status')
plt.show()

In [None]:
# Share of calls per military status, as a percentage of all non-null answers.
topMilitary = crisis1and2_df['CRISIS Demographics - Military'].value_counts(normalize=True) * 100
# Skip the two most frequent statuses (positional).
# NOTE(review): presumably non-military / unknown categories; confirm which labels
# these are. Percentages remain relative to the full set of answers.
topMilitary = topMilitary.iloc[2:]
# Name the index and the value column explicitly rather than relying on the
# default column names produced by reset_index(), which differ between pandas
# versions. The resulting columns are always 'Military Status' and
# 'CRISIS Demographics - Military', which is what the bar plot cell expects.
topMilitary_df = (
    topMilitary
    .rename_axis('Military Status')
    .reset_index(name='CRISIS Demographics - Military')
)
topMilitary_df





In [None]:
#Viridis
# Bar chart of the percentage of calls per military status.
# One sns.set call carries the style, figure size and font scale together; each
# separate sns.set call resets the theme settings it is not given.
sns.set(style='darkgrid', font_scale=10, rc={"figure.figsize":(45,30)})
# Define the palette before it is used so the cell does not depend on a cmap
# left over from an earlier cell.
cmap = sns.color_palette('viridis')
ax = sns.barplot(x='Military Status', y='CRISIS Demographics - Military', data=topMilitary_df, palette=cmap)
plt.xlabel('Military Status', fontdict= {'fontsize':70, 'fontweight':'bold'})
plt.ylabel('Call Volume', fontdict= {'fontsize':70, 'fontweight':'bold'})
plt.title("Call Volume by Military Status (Percentage)",fontdict= { 'fontsize': 80, 'fontweight':'bold','verticalalignment': 'center'})
plt.xticks(fontsize=60, rotation=60)
# The trailing semicolon suppresses the text repr of the last call. It must sit
# on the statement itself because a line containing only ';' is a SyntaxError.
plt.yticks(fontsize=60);

#Gradient One
#sns.set_style('darkgrid')
#sns.set(rc={"figure.figsize":(45,30)})
#sns.set(font_scale = 10)
#ax = sns.barplot(x='Military Status', y='CRISIS Demographics - Military', data=topMilitary_df, palette=cmap)
#cmap = sns.color_palette('light:#5A9')
#plt.xlabel('Military Status', fontdict= {'fontsize':70, 'fontweight':'bold'})
#plt.ylabel('Call Volume', fontdict= {'fontsize':70, 'fontweight':'bold'})
#plt.title("Call Volume by Military Status (Percentage)",fontdict= { 'fontsize': 80, 'fontweight':'bold','verticalalignment': 'center'})
#plt.xticks(fontsize=60, rotation=60)
#plt.yticks(fontsize=60)
#;

#Gradient Two
#sns.set_style('darkgrid')
#sns.set(rc={"figure.figsize":(45,30)})
#sns.set(font_scale = 10)
#ax = sns.barplot(x='Military Status', y='CRISIS Demographics - Military', data=topMilitary_df, palette=cmap)
#cmap = sns.color_palette('ch:s=.25,rot=-.25')
#plt.xlabel('Military Status', fontdict= {'fontsize':70, 'fontweight':'bold'})
#plt.ylabel('Call Volume', fontdict= {'fontsize':70, 'fontweight':'bold'})
#plt.title("Call Volume by Military Status (Percentage)",fontdict= { 'fontsize': 80, 'fontweight':'bold','verticalalignment': 'center'})
#plt.xticks(fontsize=60, rotation=60)
#plt.yticks(fontsize=60)
#;




In [None]:
# Per-postal-code breakdowns: each cell below filters crisis1and2_df to a single
# postal code and counts the values of one demographic column (age, gender
# identity or military status). The five postal codes match the hard-coded
# top-5 list used earlier.
#Value counts of gender identity - 37075
genIdentCountFor37075= crisis1and2_df[crisis1and2_df['PostalCode']=='37075']['CRISIS Demographics - Gender Identity'].value_counts()
genIdentCountFor37075

In [None]:
#Military count - 37075
militCountFor37075 = crisis1and2_df[crisis1and2_df['PostalCode']=='37075']['CRISIS Demographics - Military'].value_counts()
militCountFor37075

In [None]:
#Number of callers in each age bracket  - 37115
ageBracketCountFor37115 = crisis1and2_df[crisis1and2_df['PostalCode']=='37115']['CRISIS Demographics - Age'].value_counts()
ageBracketCountFor37115

In [None]:
#Value counts of gender identity - 37115
genIdentCountFor37115 = crisis1and2_df[crisis1and2_df['PostalCode']=='37115']['CRISIS Demographics - Gender Identity'].value_counts()
genIdentCountFor37115

In [None]:
#Military count - 37115
militCountFor37115 = crisis1and2_df[crisis1and2_df['PostalCode']=='37115']['CRISIS Demographics - Military'].value_counts()
militCountFor37115

In [None]:
#Number of callers in each age bracket - 38012
ageBracketCountFor38012 = crisis1and2_df[crisis1and2_df['PostalCode']=='38012']['CRISIS Demographics - Age'].value_counts()
ageBracketCountFor38012

In [None]:
#Value counts of gender identity - 38012
genIdentCountFor38012 = crisis1and2_df[crisis1and2_df['PostalCode']=='38012']['CRISIS Demographics - Gender Identity'].value_counts()
genIdentCountFor38012

In [None]:
#Military count - 38012
militCountFor38012 = crisis1and2_df[crisis1and2_df['PostalCode']=='38012']['CRISIS Demographics - Military'].value_counts()
militCountFor38012

In [None]:
#Number of callers in each age bracket  - 37211
ageBracketCountFor37211 = crisis1and2_df[crisis1and2_df['PostalCode']=='37211']['CRISIS Demographics - Age'].value_counts()
ageBracketCountFor37211

In [None]:
#Value counts of gender identity - 37211
genIdentCountFor37211 = crisis1and2_df[crisis1and2_df['PostalCode']=='37211']['CRISIS Demographics - Gender Identity'].value_counts()
genIdentCountFor37211

In [None]:
#Military count - 37211
militCountFor37211 = crisis1and2_df[crisis1and2_df['PostalCode']=='37211']['CRISIS Demographics - Military'].value_counts()
militCountFor37211

In [None]:
#Number of callers in each age bracket  - 37138
ageBracketCountFor37138 = crisis1and2_df[crisis1and2_df['PostalCode']=='37138']['CRISIS Demographics - Age'].value_counts()
ageBracketCountFor37138

In [None]:
#Value counts of gender identity - 37138
genIdentCountFor37138 = crisis1and2_df[crisis1and2_df['PostalCode']=='37138']['CRISIS Demographics - Gender Identity'].value_counts()
genIdentCountFor37138

In [None]:
#Military count - 37138
militCountFor37138 = crisis1and2_df[crisis1and2_df['PostalCode']=='37138']['CRISIS Demographics - Military'].value_counts()
militCountFor37138

In [None]:
# Total number of calls (v1 + v2) that had a postal code recorded.
# Both counts were taken from the raw frames, before the two non-numeric codes
# were removed and before missing codes were replaced by the '0' placeholder.
zipNonNulls = nonNullPostCodesV1 + nonNullPostCodesV2
zipNonNulls

In [None]:
#Share of call volume per zip code for all years
# Values are fractions of all calls that had a postal code (0-1, rounded to two
# decimals), not percentages on a 0-100 scale.
postalCodePerc = crisis1and2_df['PostalCode'].value_counts() / zipNonNulls
postalCodePerc_df = pd.DataFrame(postalCodePerc)
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label before taking the top ten. Dropping the first row by
# position would discard a real postal code if the placeholder were not the
# most frequent value.
postalCodeTop10Perc_df = round(postalCodePerc_df.drop(index='0', errors='ignore').head(10), 2)
postalCodeTop10Perc_df

In [None]:
# Records associated with the ten hard-coded postal codes across all years
# (presumably the top ten by call volume; TODO confirm they are still current).
crisisTop10Zip = crisis1and2_df[
    crisis1and2_df['PostalCode'].isin([
        '37075', '37115', '38012', '37211', '37138',
        '37013', '37857', '37207', '37238', '37130',
    ])
]
crisisTop10Zip


In [None]:
# Restrict the combined frame to calls whose call_year is '2020' and preview them.
# This rebinds filter2020 / crisisZip2020, which earlier held the v1-only selection.
filter2020 = crisis1and2_df['call_year'] == '2020'
crisisZip2020 = crisis1and2_df.loc[filter2020]
crisisZip2020.head()

In [None]:
# Ten postal codes with the most calls in 2020.
postalCodeCount2020 = crisisZip2020['PostalCode'].value_counts()
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label rather than assuming it is always the top row.
Top10_2020_df = pd.DataFrame(postalCodeCount2020.drop('0', errors='ignore').head(10))
Top10_2020_df

In [None]:
# Share of 2020 calls per postal code, as a fraction (0-1) of the 2020 calls
# that had a postal code recorded.
postalCodePerc2020 = crisisZip2020['PostalCode'].value_counts() / nonNullPostCodesV1_2020
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label rather than assuming it is always the top row.
Top10_2020Perc_df = pd.DataFrame(postalCodePerc2020.drop('0', errors='ignore').head(10))
Top10_2020Perc_df = round(Top10_2020Perc_df, 2)
Top10_2020Perc_df

In [None]:
# Restrict the combined frame to calls whose call_year is '2021' and preview them.
# This rebinds filter2021 / crisisZip2021, which earlier held the v1-only selection.
filter2021 = crisis1and2_df['call_year'] == '2021'
crisisZip2021 = crisis1and2_df.loc[filter2021]
crisisZip2021.head()

In [None]:
# Ten postal codes with the most calls in 2021.
postalCodeCount2021 = crisisZip2021['PostalCode'].value_counts()
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label rather than assuming it is always the top row.
Top10_2021_df = pd.DataFrame(postalCodeCount2021.drop('0', errors='ignore').head(10))
Top10_2021_df

In [None]:
# Share of 2021 calls per postal code, as a fraction (0-1) of the 2021 calls
# that had a postal code recorded.
postalCodePerc2021 = crisisZip2021['PostalCode'].value_counts() / nonNullPostCodesV1_2021
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label rather than assuming it is always the top row.
Top10_2021Perc_df = pd.DataFrame(postalCodePerc2021.drop('0', errors='ignore').head(10))
Top10_2021Perc_df = round(Top10_2021Perc_df, 2)
Top10_2021Perc_df

In [None]:
# Restrict the combined frame to calls whose call_year is '2022' and preview them.
# This rebinds filter2022 / crisisZip2022, which earlier held the v2-only selection.
filter2022 = crisis1and2_df['call_year'] == '2022'
crisisZip2022 = crisis1and2_df.loc[filter2022]
crisisZip2022.head()

In [None]:
# Ten postal codes with the most calls in 2022.
postalCodeCount2022 = crisisZip2022['PostalCode'].value_counts()
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label rather than assuming it is always the top row.
Top10_2022_df = pd.DataFrame(postalCodeCount2022.drop('0', errors='ignore').head(10))
Top10_2022_df

In [None]:
# Share of 2022 calls per postal code, as a fraction (0-1) of the 2022 calls
# that had a postal code recorded.
postalCodePerc2022 = crisisZip2022['PostalCode'].value_counts() / nonNullPostCodesV2_2022
# '0' is the placeholder written for missing postal codes during cleaning, so it
# is removed by label rather than assuming it is always the top row.
Top10_2022Perc_df = pd.DataFrame(postalCodePerc2022.drop('0', errors='ignore').head(10))
Top10_2022Perc_df = round(Top10_2022Perc_df, 2)
Top10_2022Perc_df

In [None]:
# Frequency tables, one column per cell: third-party location fields first,
# then the CRISIS and HOM AX demographic columns. value_counts() leaves out
# nulls, so each table covers only the calls where the field was filled in.
crisis1and2_df['ThirdPartyCity'].value_counts()

In [None]:
crisis1and2_df['ThirdPartyCounty'].value_counts()

In [None]:
crisis1and2_df['ThirdPartyStateProvince'].value_counts()

In [None]:
# Overwrites the column with its string form before counting.
# NOTE(review): missing values become the text 'nan' here and are therefore
# counted as a category; confirm that is intended.
crisis1and2_df['ThirdPartyPostalCode'] = crisis1and2_df['ThirdPartyPostalCode'].astype('str')
crisis1and2_df['ThirdPartyPostalCode'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Occupation'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Occupation'].value_counts()

In [None]:
crisis1and2_df['SUI AX Demographics - Name of Third Party'].value_counts()

In [None]:
# Getting counts of age brackets of callers
crisis1and2_df['CRISIS Demographics - Age'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Education Level'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Ethnicity'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Gender Identity'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Has a disability?'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Homeless?'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Income'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Marital Status'].value_counts()

In [None]:
crisis1and2_df['CRISIS Demographics - Military'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Age'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Education Level'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Ethnicity'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Gender'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Has a disability?'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Homeless?'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Marital Status'].value_counts()

In [None]:
crisis1and2_df['HOM AX Demographics - Military'].value_counts()

Open question: should columns FY, GL, GU, and GV also be treated as demographics columns?

In [None]:
# Frequency tables for the third-party risk assessment flags and the SUI AX
# demographic columns, one column per cell (nulls are left out by value_counts()).
crisis1and2_df['HOM AX Third-Party Risk Assessment Demographics - Does this risk assesment have different demographics than the caller? (Third-party Call)'].value_counts()

In [None]:
crisis1and2_df['SUI AX Demographics - Age'].value_counts()

In [None]:
crisis1and2_df['SUI AX Demographics - Ethnicity'].value_counts()

In [None]:
crisis1and2_df['SUI AX Demographics - Gender'].value_counts()

In [None]:
crisis1and2_df['SUI AX Demographics - Relationship to person at risk'].value_counts()

In [None]:
crisis1and2_df['SUI AX Third-Party Risk Assessment Demographics - SUI AX Does this risk assesment have different demographics than the caller? (Third-party Call)'].value_counts()

In [None]:
# NOTE(review): same column as two cells above, so this repeats that output
crisis1and2_df['SUI AX Demographics - Relationship to person at risk'].value_counts()
In [None]:
#Reading in Sheet 2020 of Call volume Excel File
# The first 10 rows of the sheet are skipped before the header is read
callVol2020 = pd.read_excel('../data/Contact center call volume_2020-2022.xlsx', sheet_name ='2020', skiprows=10)
callVol2020_df = pd.DataFrame(callVol2020)
callVol2020_df

In [None]:
#Reading in Sheet 2021 of Call volume Excel File
# The first 10 rows of the sheet are skipped before the header is read
callVol2021 = pd.read_excel('../data/Contact center call volume_2020-2022.xlsx', sheet_name ='2021', skiprows=10)
callVol2021_df = pd.DataFrame(callVol2021)
callVol2021_df

In [None]:
#Reading in Sheet 2022 of Call volume Excel File
# Only 7 rows are skipped here, versus 10 for the 2020 and 2021 sheets
# NOTE(review): presumably this sheet's table starts higher up; confirm against the workbook
callVol2022 = pd.read_excel('../data/Contact center call volume_2020-2022.xlsx', sheet_name ='2022', skiprows=7)
callVol2022_df = pd.DataFrame(callVol2022)
callVol2022_df
