## Import libraries

In [1]:
import pandas as pd
import os

## Get file names and country names

In [2]:
def get_country_names(csv_files):
    """Return the country name encoded in each CSV file name.

    The country name is the file name with its trailing ``.csv`` removed.
    Entries that do not end in ``.csv`` (for example ``.DS_Store`` or
    ``.ipynb_checkpoints`` returned by a directory listing) are skipped
    instead of raising ``ValueError``.

    Parameters
    ----------
    csv_files : iterable of str
        File names, typically the result of ``os.listdir``.

    Returns
    -------
    list of str
        Country names, in the same order as the matching input entries.
    """
    extension = '.csv'
    return [
        filename[:-len(extension)]
        for filename in csv_files
        if filename.endswith(extension)
    ]

In [3]:
# Path to dataset:
path = 'Google_Trends (COVID-19 Symptoms)'

# Get files: keep only the per-country CSVs. The merged file that this notebook
# writes later ('covid-19_Symptoms_latam.csv') lives in the same directory, so
# it is excluded here; otherwise a re-run would treat it as one more country.
csv_files = [
    filename
    for filename in os.listdir(path)
    if filename.endswith('.csv') and filename != 'covid-19_Symptoms_latam.csv'
]

# Get country names:
country_names = get_country_names(csv_files)

print(f'The countries in the directory are: {len(country_names)}')

The countries in the directory are: 32


## Read, rename and merge the CSV files

In [4]:
def read_file(country, directory='Google_Trends (COVID-19 Symptoms)'):
    """Load the COVID-19 symptoms trends CSV for one country.

    Parameters
    ----------
    country : str
        Country name; the file read is ``<directory>/<country>.csv``.
    directory : str, optional
        Folder containing the per-country CSV files. Defaults to the
        dataset folder used throughout this notebook.

    Returns
    -------
    pandas.DataFrame
        The file contents with the ``Week`` column converted to datetime.
    """
    csv_path = os.path.join(directory, f'{country}.csv')
    # The first line of the file is skipped; the column header is expected on
    # the line that follows it.
    df_trends = pd.read_csv(csv_path, skiprows=1)
    df_trends['Week'] = pd.to_datetime(df_trends['Week'])
    return df_trends

In [5]:
def rename_columns(df, country):
    """Rename symptom columns in place from ``'<name>: (...)'`` to ``'<name>_<country>'``.

    The ``Week`` column is left untouched. Every other column name is cut at
    the first ``': ('`` and suffixed with ``_<country>``.

    The full mapping is built before the frame is modified, so a malformed
    column name leaves ``df`` unchanged instead of half-renamed, and the
    rename itself happens in a single call rather than once per column.

    Parameters
    ----------
    df : pandas.DataFrame
        Frame to modify in place.
    country : str
        Suffix appended to each renamed column.

    Returns
    -------
    None

    Raises
    ------
    ValueError
        If a column other than ``Week`` does not contain ``': ('``.
    """
    marker = ': ('
    new_names = {}
    for column in df.columns:
        if column == 'Week':
            continue
        prefix, found, _ = column.partition(marker)
        if not found:
            raise ValueError(
                f"column {column!r} does not contain {marker!r}; cannot derive a name for {country!r}"
            )
        new_names[column] = prefix + '_' + country
    # In-place on purpose: callers rely on the frame they passed being mutated.
    df.rename(columns=new_names, inplace=True)

In [6]:
def merge_dataframes(country_names):
    """Combine the per-country trend frames into one wide frame keyed on ``Week``.

    Each country is loaded with ``read_file`` and its columns are suffixed via
    ``rename_columns``. The first country's frame is the base; every later one
    is left-joined onto it on ``Week``, so only the base frame's weeks are kept.

    Returns an empty DataFrame when ``country_names`` is empty.
    """
    combined = None
    for name in country_names:
        frame = read_file(name)
        rename_columns(frame, name)
        if combined is None:
            # First country: its frame becomes the left side of every merge.
            combined = frame
            continue
        combined = combined.merge(frame, how="left", on=["Week"])
    if combined is None:
        return pd.DataFrame()
    return combined

In [7]:
# Build the merged frame for every country found in the dataset directory.
latam_df = merge_dataframes(country_names)
# Bare last expression so the notebook renders the frame as the cell output.
latam_df

Unnamed: 0,Week,Fever_Antigua and Barbuda,Headache_Antigua and Barbuda,Cough_Antigua and Barbuda,Fever_Bahamas,Headache_Bahamas,Cough_Bahamas,Fever_Barbados,Headache_Barbados,Cough_Barbados,...,Cough_Guatemala,Fever_Honduras,Headache_Honduras,Cough_Honduras,Fever_Trinidad and Tobago,Headache_Trinidad and Tobago,Cough_Trinidad and Tobago,Fever_Cuba,Headache_Cuba,Cough_Cuba
0,2020-01-05,77,0,19,21,23,26,19,38,19,...,42,11,18,22,19,32,45,26,14,43
1,2020-01-12,55,46,0,17,49,46,19,33,24,...,32,14,13,22,39,43,39,22,17,27
2,2020-01-19,8,8,25,18,24,22,24,33,33,...,29,12,14,20,32,40,44,29,20,23
3,2020-01-26,38,30,8,21,27,34,24,38,24,...,36,13,27,25,42,59,44,33,24,24
4,2020-02-02,39,15,8,38,36,26,29,62,33,...,28,12,17,19,48,36,40,29,24,21
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
122,2022-05-08,10,19,48,35,21,28,16,22,33,...,25,15,14,23,57,71,61,33,10,36
123,2022-05-15,76,9,0,30,17,30,11,44,21,...,38,16,17,33,50,53,69,37,19,31
124,2022-05-22,10,39,29,25,32,49,8,28,35,...,34,20,18,22,49,56,64,43,11,36
125,2022-05-29,0,31,10,29,48,22,32,41,26,...,33,10,17,25,45,61,33,54,14,32


## Save the LATAM DataFrame to CSV

In [8]:
# Persist the merged frame without the row index. Note that the target is the
# same directory that os.listdir(path) scans for the per-country inputs.
latam_df.to_csv(f"{path}/covid-19_Symptoms_latam.csv", index=False)

## Read LATAM file

In [10]:
# Read the merged file back as a sanity check. The location is derived from
# `path` (the dataset directory defined earlier) instead of repeating the
# directory name as a second literal that could drift out of sync.
pd.read_csv(f"{path}/covid-19_Symptoms_latam.csv")

Unnamed: 0,Week,Fever_Antigua and Barbuda,Headache_Antigua and Barbuda,Cough_Antigua and Barbuda,Fever_Bahamas,Headache_Bahamas,Cough_Bahamas,Fever_Barbados,Headache_Barbados,Cough_Barbados,...,Cough_Guatemala,Fever_Honduras,Headache_Honduras,Cough_Honduras,Fever_Trinidad and Tobago,Headache_Trinidad and Tobago,Cough_Trinidad and Tobago,Fever_Cuba,Headache_Cuba,Cough_Cuba
0,2020-01-05,77,0,19,21,23,26,19,38,19,...,42,11,18,22,19,32,45,26,14,43
1,2020-01-12,55,46,0,17,49,46,19,33,24,...,32,14,13,22,39,43,39,22,17,27
2,2020-01-19,8,8,25,18,24,22,24,33,33,...,29,12,14,20,32,40,44,29,20,23
3,2020-01-26,38,30,8,21,27,34,24,38,24,...,36,13,27,25,42,59,44,33,24,24
4,2020-02-02,39,15,8,38,36,26,29,62,33,...,28,12,17,19,48,36,40,29,24,21
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
122,2022-05-08,10,19,48,35,21,28,16,22,33,...,25,15,14,23,57,71,61,33,10,36
123,2022-05-15,76,9,0,30,17,30,11,44,21,...,38,16,17,33,50,53,69,37,19,31
124,2022-05-22,10,39,29,25,32,49,8,28,35,...,34,20,18,22,49,56,64,43,11,36
125,2022-05-29,0,31,10,29,48,22,32,41,26,...,33,10,17,25,45,61,33,54,14,32
