In [2]:
import pandas as pd
import numpy as np
from matplotlib import pyplot as plt
import datetime

### US Data

In [3]:
ilinet_data = pd.read_csv('F:/Pandemic-Database/Raw_Data/Influenza/ILINet.csv',
                         header= 1)

ilinet_data = ilinet_data[['REGION','YEAR','WEEK','ILITOTAL']]

ilinet_data.insert(0,'Microbe Family','Orthomyxovididae')
ilinet_data.insert(1,'Microbe Genus','Influenza A, B, and C Virus')
ilinet_data.insert(2,'Microbe Species', 'None' )
ilinet_data.insert(3,'Region', 'AMRO' )
ilinet_data.insert(4,'Country', 'United States' )
ilinet_data.insert(6,'Sub-Domain', np.nan )
ilinet_data.insert(7,'date', np.nan )
ilinet_data.insert(8,'type', 'ILI_Total')

ilinet_data = ilinet_data.rename(columns={'REGION':'Domain',
                                         'ILITOTAL':'number'})

ilinet_data['date'] = ilinet_data['YEAR'].astype(str) + '-' + ilinet_data['WEEK'].astype(str) + '-1'

ilinet_data['date'] = ilinet_data['date'].map(lambda x: datetime.datetime.strptime(x, "%Y-%W-%w").date())

ilinet_data = ilinet_data.drop(columns=['YEAR','WEEK'])

ilinet_data


Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,Domain,Sub-Domain,date,type,number
0,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alabama,,2010-10-04,ILI_Total,249
1,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alaska,,2010-10-04,ILI_Total,15
2,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Arizona,,2010-10-04,ILI_Total,172
3,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Arkansas,,2010-10-04,ILI_Total,18
4,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,California,,2010-10-04,ILI_Total,632
...,...,...,...,...,...,...,...,...,...,...
36828,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Wyoming,,2023-10-23,ILI_Total,68
36829,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Commonwealth of the Northern Mariana Islands,,2023-10-23,ILI_Total,X
36830,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Puerto Rico,,2023-10-23,ILI_Total,157
36831,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Virgin Islands,,2023-10-23,ILI_Total,22


In [4]:
len(set(ilinet_data['Domain']))

55

In [5]:
ilinet_data = ilinet_data.sort_values(by = ['Country','Domain','Sub-Domain','date'])

ilinet_data = ilinet_data[ilinet_data['number'] != 'X']

ilinet_data['number'] = ilinet_data['number'].astype(int)

ilinet_cumulative_data = ilinet_data.groupby(['Microbe Family','Microbe Genus','Microbe Species','Region','Country','Domain','date','type']).sum().groupby(level=5).cumsum().reset_index()
ilinet_cumulative_data['Sub-Domain'] = np.nan
ilinet_cumulative_data

Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,Domain,date,type,Sub-Domain,number
0,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alabama,2010-10-04,ILI_Total,,249
1,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alabama,2010-10-11,ILI_Total,,488
2,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alabama,2010-10-18,ILI_Total,,720
3,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alabama,2010-10-25,ILI_Total,,994
4,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Alabama,2010-11-01,ILI_Total,,1336
...,...,...,...,...,...,...,...,...,...,...
35935,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Wyoming,2023-09-25,ILI_Total,,33196
35936,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Wyoming,2023-10-02,ILI_Total,,33235
35937,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Wyoming,2023-10-09,ILI_Total,,33298
35938,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Wyoming,2023-10-16,ILI_Total,,33384


### World Data

In [6]:
world_ilinet_data = pd.read_csv('F:/Pandemic-Database/Raw_Data/Influenza/WHO_influenza.csv')
world_ilinet_data = world_ilinet_data.dropna(subset=['Cases of influenza-like illnesses'])
world_ilinet_data = world_ilinet_data[['Country','Day','Cases of influenza-like illnesses']]
world_ilinet_data = world_ilinet_data.reset_index(drop = True)
world_ilinet_data.insert(0,'Microbe Family','Orthomyxovididae')
world_ilinet_data.insert(1,'Microbe Genus','Influenza A, B, and C Virus')
world_ilinet_data.insert(2,'Microbe Species', 'None' )
world_ilinet_data.insert(3,'Region', np.nan )
world_ilinet_data.insert(5,'Domain', np.nan)
world_ilinet_data.insert(6,'Sub-Domain', np.nan)
world_ilinet_data.insert(8,'type', 'Cases')

world_ilinet_data = world_ilinet_data.rename(columns={'Day':'date',
                                                      'Cases of influenza-like illnesses': 'number'})

world_ilinet_data

Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,Domain,Sub-Domain,date,type,number
0,Orthomyxovididae,"Influenza A, B, and C Virus",,,Afghanistan,,,2016-03-14,Cases,494.0
1,Orthomyxovididae,"Influenza A, B, and C Virus",,,Afghanistan,,,2016-03-21,Cases,715.0
2,Orthomyxovididae,"Influenza A, B, and C Virus",,,Afghanistan,,,2016-03-28,Cases,704.0
3,Orthomyxovididae,"Influenza A, B, and C Virus",,,Afghanistan,,,2016-04-04,Cases,749.0
4,Orthomyxovididae,"Influenza A, B, and C Virus",,,Afghanistan,,,2016-04-11,Cases,651.0
...,...,...,...,...,...,...,...,...,...,...
68349,Orthomyxovididae,"Influenza A, B, and C Virus",,,Zambia,,,2021-11-29,Cases,1866.0
68350,Orthomyxovididae,"Influenza A, B, and C Virus",,,Zambia,,,2021-12-06,Cases,1394.0
68351,Orthomyxovididae,"Influenza A, B, and C Virus",,,Zambia,,,2021-12-13,Cases,1348.0
68352,Orthomyxovididae,"Influenza A, B, and C Virus",,,Zambia,,,2021-12-20,Cases,1513.0


In [7]:
country_to_region_dict = np.load('F:/Pandemic-Database/Internal/Intermediate_Data_Archive/Country_Region_Dict.npy',
                                 allow_pickle=True).item()

country_to_region_dict.update({'American Samoa':'AMRO',
'Anguilla':'AMRO',
'Bonaire Sint Eustatius and Saba':'AMRO',
'British Virgin Islands':'AMRO',
"Cayman Islands":'AMRO',
"Cote d'Ivoire":'AFRO',
'East Timor':'WPRO',
'French Polynesia':'WPRO',
'Kosovo':'EURO',
'Micronesia (country)':'WPRO',
'Montserrat':'AMRO',
'Northern Mariana Islands':'WPRO',
'Pitcairn':'WPRO',
'Sint Maarten (Dutch part)':'AMRO',
'Tokelau':'WPRO',
'Turks and Caicos Islands':'AMRO',
'Wallis and Futuna':'WPRO'})

np.save('F:/Pandemic-Database/Internal/Intermediate_Data_Archive/Country_Region_Dict.npy', country_to_region_dict)

In [8]:
world_ilinet_data['Region'] = world_ilinet_data['Country'].map(country_to_region_dict)
world_ilinet_data = world_ilinet_data.dropna(subset=['Region'])
world_ilinet_data['date'] = pd.to_datetime(world_ilinet_data['date']).dt.date
world_ilinet_data

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  world_ilinet_data['date'] = pd.to_datetime(world_ilinet_data['date']).dt.date


Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,Domain,Sub-Domain,date,type,number
0,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Afghanistan,,,2016-03-14,Cases,494.0
1,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Afghanistan,,,2016-03-21,Cases,715.0
2,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Afghanistan,,,2016-03-28,Cases,704.0
3,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Afghanistan,,,2016-04-04,Cases,749.0
4,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Afghanistan,,,2016-04-11,Cases,651.0
...,...,...,...,...,...,...,...,...,...,...
68349,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Zambia,,,2021-11-29,Cases,1866.0
68350,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Zambia,,,2021-12-06,Cases,1394.0
68351,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Zambia,,,2021-12-13,Cases,1348.0
68352,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Zambia,,,2021-12-20,Cases,1513.0


In [21]:
world_ilinet_data['number'] = world_ilinet_data['number'].astype(int)
world_ilinet_cumulative_data = world_ilinet_data.groupby(['Microbe Family','Microbe Genus','Microbe Species','Region','Country','date','type']).sum().groupby(level=4).cumsum().reset_index()
world_ilinet_cumulative_data['type'] = 'Cumulative_Cases'
world_ilinet_cumulative_data['Domain'] = np.nan
world_ilinet_cumulative_data['Sub-Domain'] = np.nan
world_ilinet_cumulative_data

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  world_ilinet_data['number'] = world_ilinet_data['number'].astype(int)


Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,date,type,Domain,Sub-Domain,number
0,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Cameroon,2012-01-02,Cumulative_Cases,,,86
1,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Cameroon,2012-01-09,Cumulative_Cases,,,86
2,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Cameroon,2012-01-16,Cumulative_Cases,,,86
3,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Cameroon,2012-01-23,Cumulative_Cases,,,86
4,Orthomyxovididae,"Influenza A, B, and C Virus",,AFRO,Cameroon,2012-01-30,Cumulative_Cases,,,86
...,...,...,...,...,...,...,...,...,...,...
66140,Orthomyxovididae,"Influenza A, B, and C Virus",,WPRO,Wallis and Futuna,2023-08-07,Cumulative_Cases,,,14492
66141,Orthomyxovididae,"Influenza A, B, and C Virus",,WPRO,Wallis and Futuna,2023-08-14,Cumulative_Cases,,,14507
66142,Orthomyxovididae,"Influenza A, B, and C Virus",,WPRO,Wallis and Futuna,2023-08-21,Cumulative_Cases,,,14536
66143,Orthomyxovididae,"Influenza A, B, and C Virus",,WPRO,Wallis and Futuna,2023-08-28,Cumulative_Cases,,,14570


In [7]:
world_ilinet_data.to_csv('F:/Pandemic-Database/Past_Pandemic_Time_Series_Data/Influenza/Influenza_World_Weekly_Cases.csv',
                        index = False)

FileNotFoundError: [Errno 2] No such file or directory: 'F:/Pandemic-Database/Past_Pandemic_Time_Series_Data/Influenza/Influenza_World_Weekly_Cases.csv'

### Combine Data

In [8]:
combined_data = pd.concat([world_ilinet_data,ilinet_data])
combined_data = combined_data.sort_values(by = ['date','Country'])
combined_data

Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,Domain,Sub-Domain,date,type,number
6875,Orthomyxovididae,"Influenza A, B, and C Virus",,EURO,Belgium,,,2009-01-05,Cases,396.0
37926,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Morocco,,,2009-01-05,Cases,3407.0
6876,Orthomyxovididae,"Influenza A, B, and C Virus",,EURO,Belgium,,,2009-01-12,Cases,992.0
37927,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Morocco,,,2009-01-12,Cases,3513.0
6877,Orthomyxovididae,"Influenza A, B, and C Virus",,EURO,Belgium,,,2009-01-19,Cases,1369.0
...,...,...,...,...,...,...,...,...,...,...
36828,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Wyoming,,2023-10-23,ILI_Total,68
36829,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Commonwealth of the Northern Mariana Islands,,2023-10-23,ILI_Total,X
36830,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Puerto Rico,,2023-10-23,ILI_Total,157
36831,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,Virgin Islands,,2023-10-23,ILI_Total,22


In [23]:
combined_cumulative_data = pd.concat([world_ilinet_cumulative_data,ilinet_cumulative_data])
combined_cumulative_data = combined_cumulative_data.sort_values(by = ['date','Country'])
combined_cumulative_data

Unnamed: 0,Microbe Family,Microbe Genus,Microbe Species,Region,Country,date,type,Domain,Sub-Domain,number
20830,Orthomyxovididae,"Influenza A, B, and C Virus",,EURO,Belgium,2009-01-05,Cumulative_Cases,,,396
16612,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Morocco,2009-01-05,Cumulative_Cases,,,3407
20831,Orthomyxovididae,"Influenza A, B, and C Virus",,EURO,Belgium,2009-01-12,Cumulative_Cases,,,1388
16613,Orthomyxovididae,"Influenza A, B, and C Virus",,EMRO,Morocco,2009-01-12,Cumulative_Cases,,,6920
20832,Orthomyxovididae,"Influenza A, B, and C Virus",,EURO,Belgium,2009-01-19,Cumulative_Cases,,,2757
...,...,...,...,...,...,...,...,...,...,...
33219,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,2023-10-23,ILI_Total,Virginia,,1380435
33899,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,2023-10-23,ILI_Total,Washington,,148734
34579,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,2023-10-23,ILI_Total,West Virginia,,123368
35259,Orthomyxovididae,"Influenza A, B, and C Virus",,AMRO,United States,2023-10-23,ILI_Total,Wisconsin,,106395


In [75]:
combined_data.to_csv('F:/Pandemic-Database/Past_Pandemic_Time_Series_Data/Influenza/Influenza_World_Domain_Weekly_Cases.csv',
                     index = False)

In [24]:
combined_cumulative_data.to_csv('F:/Pandemic-Database/Processed_Data/Influenza/Influenza_World_Domain_Weekly_CumCases.csv',
                     index = False)