In [1]:
import pandas as pd
import numpy as np
import plotly.express as px
pd.options.display.float_format = '{:.0f}'.format

In [2]:
nurse_df = pd.read_csv('https://raw.githubusercontent.com/datadesk/california-coronavirus-data/master/cdph-skilled-nursing-totals.csv')
nurse_df.head(5)

Unnamed: 0,date,staff_active_cases,patients_active_cases,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,staff_deaths_note,source_url
0,2021-07-31,451,188,51807,61935,242,9091,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
1,2021-07-30,420,134,51755,61908,242,9087,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
2,2021-07-29,401,142,51708,61886,242,9084,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
3,2021-07-28,397,121,51673,61854,241,9081,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
4,2021-07-27,381,103,51635,61842,241,9080,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...


In [3]:
nurse_df.drop(nurse_df.columns[[1, 2, 7, 8]], axis=1, inplace=True)
nurse_df['type'] = 'SN'
nurse_df

Unnamed: 0,date,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type
0,2021-07-31,51807,61935,242,9091,SN
1,2021-07-30,51755,61908,242,9087,SN
2,2021-07-29,51708,61886,242,9084,SN
3,2021-07-28,51673,61854,241,9081,SN
4,2021-07-27,51635,61842,241,9080,SN
...,...,...,...,...,...,...
423,2020-04-29,2594,3923,19,618,SN
424,2020-04-28,2323,3515,1,578,SN
425,2020-04-25,2329,3441,1,545,SN
426,2020-04-24,2099,3141,1,486,SN


In [4]:
today = nurse_df[(nurse_df['date'] == '2021-07-31')]
today.set_index('date', inplace=True)
today

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
2021-07-31,51807,61935,242,9091,SN


In [5]:
senior_df = pd.read_csv('https://raw.githubusercontent.com/datadesk/california-coronavirus-data/master/cdph-adult-and-senior-care-totals.csv')

In [6]:
senior_df

Unnamed: 0,date,confirmed_cases,deaths,active_cases,source_url
0,2021-07-27,43066,3749,307,https://www.cdss.ca.gov/Portals/9/Additional-R...
1,2021-07-14,42910,3747,181,https://www.cdss.ca.gov/Portals/9/Additional-R...
2,2021-07-12,42811,3746,97,https://www.cdss.ca.gov/Portals/9/Additional-R...
3,2021-06-21,42733,3744,59,https://www.cdss.ca.gov/Portals/9/Additional-R...
4,2021-05-31,42696,3744,89,https://www.cdss.ca.gov/Portals/9/Additional-R...
...,...,...,...,...,...
290,2020-05-02,1404,175,,https://www.cdss.ca.gov/Portals/9/Additional-R...
291,2020-05-01,1340,170,,https://www.cdss.ca.gov/Portals/9/Additional-R...
292,2020-04-29,1267,155,,https://www.cdss.ca.gov/Portals/9/Additional-R...
293,2020-04-28,1198,147,,https://www.cdss.ca.gov/Portals/9/Additional-R...


In [7]:
senior_df.drop(senior_df.columns[[3, 4]], axis=1, inplace=True)
senior_df['type'] = 'SC'
sc_today = senior_df[(senior_df['date'] == '2021-07-27')]
sc_today

Unnamed: 0,date,confirmed_cases,deaths,type
0,2021-07-27,43066,3749,SC


In [8]:
sc_today.set_index('date', inplace=True)
sc_today

Unnamed: 0_level_0,confirmed_cases,deaths,type
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
2021-07-27,43066,3749,SC


In [9]:
latest_df = pd.merge(today, sc_today, left_on=['date'], right_on=['date'])
latest_df

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type_x,confirmed_cases,deaths,type_y
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1


In [10]:
combined = today.merge(sc_today, how='outer', left_index=True, right_index=True)
combined

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type_x,confirmed_cases,deaths,type_y
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
2021-07-27,,,,,,43066.0,3749.0,SC
2021-07-31,51807.0,61935.0,242.0,9091.0,SN,,,


In [11]:
combined['patient_cases'] = combined["patients_confirmed_cases"] + combined["confirmed_cases"]
combined['patient_deaths'] = combined["patients_deaths"] + combined["deaths"]
combined

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type_x,confirmed_cases,deaths,type_y,patient_cases,patient_deaths
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
2021-07-27,,,,,,43066.0,3749.0,SC,,
2021-07-31,51807.0,61935.0,242.0,9091.0,SN,,,,,


In [12]:
combined2 = combined[['patient_cases', 'patient_deaths', 'staff_confirmed_cases', 'staff_deaths']]
combined2

Unnamed: 0_level_0,patient_cases,patient_deaths,staff_confirmed_cases,staff_deaths
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
2021-07-27,,,,
2021-07-31,,,51807.0,242.0
