In [1]:
import pandas as pd
import numpy as np
import plotly.express as px
pd.options.display.float_format = '{:.0f}'.format

In [2]:
nurse_df = pd.read_csv('https://raw.githubusercontent.com/datadesk/california-coronavirus-data/master/cdph-skilled-nursing-totals.csv')
nurse_df.head(5)

Unnamed: 0,date,staff_active_cases,patients_active_cases,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,staff_deaths_note,source_url
0,2021-05-04,128,64,50722,61422,229,9050,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
1,2021-05-03,125,63,50715,61409,229,9050,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
2,2021-05-01,120,53,50692,61388,229,9048,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
3,2021-04-30,132,54,50687,61386,229,9048,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...
4,2021-04-29,149,46,50678,61380,229,9047,,https://www.cdph.ca.gov/Programs/CID/DCDC/Page...


In [3]:
nurse_df.drop(nurse_df.columns[[1, 2, 7, 8]], axis=1, inplace=True)
nurse_df['type'] = 'SN'
nurse_df

Unnamed: 0,date,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type
0,2021-05-04,50722,61422,229,9050,SN
1,2021-05-03,50715,61409,229,9050,SN
2,2021-05-01,50692,61388,229,9048,SN
3,2021-04-30,50687,61386,229,9048,SN
4,2021-04-29,50678,61380,229,9047,SN
...,...,...,...,...,...,...
337,2020-04-29,2594,3923,19,618,SN
338,2020-04-28,2323,3515,1,578,SN
339,2020-04-25,2329,3441,1,545,SN
340,2020-04-24,2099,3141,1,486,SN


In [4]:
today = nurse_df[(nurse_df['date'] == '2021-05-04')]
today.set_index('date', inplace=True)
today

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
2021-05-04,50722,61422,229,9050,SN


In [5]:
senior_df = pd.read_csv('https://raw.githubusercontent.com/datadesk/california-coronavirus-data/master/cdph-adult-and-senior-care-totals.csv')

In [6]:
senior_df.drop(senior_df.columns[[3, 4]], axis=1, inplace=True)
senior_df['type'] = 'SC'
sc_today = senior_df[(senior_df['date'] == '2021-04-30')]
sc_today

Unnamed: 0,date,confirmed_cases,deaths,type
0,2021-04-30,42573,3739,SC


In [7]:
sc_today.set_index('date', inplace=True)
sc_today

Unnamed: 0_level_0,confirmed_cases,deaths,type
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
2021-04-30,42573,3739,SC


In [8]:
latest_df = pd.merge(today, sc_today, left_on=['date'], right_on=['date'])
latest_df

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type_x,confirmed_cases,deaths,type_y
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1


In [9]:
combined = today.merge(sc_today, how='outer', left_index=True, right_index=True)
combined

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type_x,confirmed_cases,deaths,type_y
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1
2021-04-30,,,,,,42573.0,3739.0,SC
2021-05-04,50722.0,61422.0,229.0,9050.0,SN,,,


In [10]:
combined['patient_cases'] = combined["patients_confirmed_cases"] + combined["confirmed_cases"]
combined['patient_deaths'] = combined["patients_deaths"] + combined["deaths"]
combined

Unnamed: 0_level_0,staff_confirmed_cases,patients_confirmed_cases,staff_deaths,patients_deaths,type_x,confirmed_cases,deaths,type_y,patient_cases,patient_deaths
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
2021-04-30,,,,,,42573.0,3739.0,SC,,
2021-05-04,50722.0,61422.0,229.0,9050.0,SN,,,,,


In [11]:
combined2 = combined[['patient_cases', 'patient_deaths', 'staff_confirmed_cases', 'staff_deaths']]
combined2

Unnamed: 0_level_0,patient_cases,patient_deaths,staff_confirmed_cases,staff_deaths
date,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
2021-04-30,,,,
2021-05-04,,,50722.0,229.0
