In [1]:
import pandas as pd
from sqlalchemy import create_engine

In [2]:
# Symptoms table: read the cleaned CSV into the `symptoms` dataframe.
csv_file = "Cleaned_CSVs/Symptoms.csv"
symptoms = pd.read_csv(filepath_or_buffer=csv_file)
# Preview the first five rows as a quick sanity check of the load.
symptoms.head(n=5)

Unnamed: 0.1,Unnamed: 0,VAERS_ID,SYMPTOM1,SYMPTOM2,SYMPTOM3,SYMPTOM4,SYMPTOM5
0,0,916600,Dysphagia,Epiglottitis,,,
1,1,916601,Anxiety,Dyspnoea,,,
2,2,916602,Chest discomfort,Dysphagia,Pain in extremity,Visual impairment,
3,3,916603,Dizziness,Fatigue,Mobility decreased,,
4,4,916604,Injection site erythema,Injection site pruritus,Injection site swelling,Injection site warmth,


In [3]:
# Vaccine table: read the cleaned VAERSVAX CSV into the `vaersvax` dataframe.
csv_file = "Cleaned_CSVs/VAERSVAX.csv"
vaersvax = pd.read_csv(filepath_or_buffer=csv_file)
# Preview the first five rows as a quick sanity check of the load.
vaersvax.head(n=5)

Unnamed: 0.1,Unnamed: 0,VAERS_ID,Vaccine,Dose,Route,Site
0,0,916600,MODERNA,1,IM,LA
1,1,916601,MODERNA,1,IM,RA
2,2,916602,PFIZER\BIONTECH,1,IM,LA
3,4,916604,MODERNA,1,IM,LA
4,5,916606,MODERNA,1,IM,LA


In [4]:
# Report table: read the cleaned vaers_data CSV into the `vaersdata` dataframe.
csv_file = "Cleaned_CSVs/vaers_data.csv"
vaersdata = pd.read_csv(filepath_or_buffer=csv_file)
# Preview the first five rows as a quick sanity check of the load.
vaersdata.head(n=5)

Unnamed: 0.1,Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,SEX,SYMPTOM_TEXT,RECOVD,ALLERGIES
0,0,916600,01/01/2021,TX,33.0,F,Right side of epiglottis swelled up and hinder...,Y,Pcn and bee venom
1,1,916601,01/01/2021,CA,73.0,F,Approximately 30 min post vaccination administ...,Y,"""Dairy"""
2,2,916602,01/01/2021,WA,23.0,F,"About 15 minutes after receiving the vaccine, ...",U,Shellfish
3,3,916603,01/01/2021,WA,58.0,F,"extreme fatigue, dizziness,. could not lift my...",Y,"Diclofenac, novacaine, lidocaine, pickles, tom..."
4,4,916604,01/01/2021,TX,47.0,F,"Injection site swelling, redness, warm to the ...",N,Na


In [5]:
# Step 1 of 2: combine the symptom rows with the vaccine rows on "VAERS_ID".
# how="outer" keeps every VAERS_ID found in either frame; where one side has
# no matching row, that side's columns are left empty (NaN).
# Both inputs carry an "Unnamed: 0" column, so pandas suffixes them with
# "_x" (symptoms) and "_y" (vaersvax) in the result.
merged_outer_first = symptoms.merge(vaersvax, how="outer", on="VAERS_ID")
merged_outer_first

Unnamed: 0,Unnamed: 0_x,VAERS_ID,SYMPTOM1,SYMPTOM2,SYMPTOM3,SYMPTOM4,SYMPTOM5,Unnamed: 0_y,Vaccine,Dose,Route,Site
0,0,916600,Dysphagia,Epiglottitis,,,,0.0,MODERNA,1,IM,LA
1,1,916601,Anxiety,Dyspnoea,,,,1.0,MODERNA,1,IM,RA
2,2,916602,Chest discomfort,Dysphagia,Pain in extremity,Visual impairment,,2.0,PFIZER\BIONTECH,1,IM,LA
3,3,916603,Dizziness,Fatigue,Mobility decreased,,,,,,,
4,4,916604,Injection site erythema,Injection site pruritus,Injection site swelling,Injection site warmth,,4.0,MODERNA,1,IM,LA
...,...,...,...,...,...,...,...,...,...,...,...,...
48726,48105,1113920,Nasal discomfort,Night sweats,Platelet count,Platelet count decreased,Pyrexia,,,,,
48727,48106,1113920,Rash,SARS-CoV-2 test,,,,,,,,
48728,48107,1113963,Haemophagocytic lymphohistiocytosis,SARS-CoV-2 test,,,,,,,,
48729,48108,1115045,Death,,,,,,,,,


In [6]:
# Step 2 of 2: attach the report-level columns from `vaersdata` to the
# symptoms+vaccine frame, again as an outer merge keyed on "VAERS_ID" so that
# no VAERS_ID present in either input is dropped.
merged_outer_second = merged_outer_first.merge(vaersdata, how="outer", on="VAERS_ID")
merged_outer_second

Unnamed: 0.1,Unnamed: 0_x,VAERS_ID,SYMPTOM1,SYMPTOM2,SYMPTOM3,SYMPTOM4,SYMPTOM5,Unnamed: 0_y,Vaccine,Dose,Route,Site,Unnamed: 0,RECVDATE,STATE,AGE_YRS,SEX,SYMPTOM_TEXT,RECOVD,ALLERGIES
0,0,916600,Dysphagia,Epiglottitis,,,,0.0,MODERNA,1,IM,LA,0.0,01/01/2021,TX,33.0,F,Right side of epiglottis swelled up and hinder...,Y,Pcn and bee venom
1,1,916601,Anxiety,Dyspnoea,,,,1.0,MODERNA,1,IM,RA,1.0,01/01/2021,CA,73.0,F,Approximately 30 min post vaccination administ...,Y,"""Dairy"""
2,2,916602,Chest discomfort,Dysphagia,Pain in extremity,Visual impairment,,2.0,PFIZER\BIONTECH,1,IM,LA,2.0,01/01/2021,WA,23.0,F,"About 15 minutes after receiving the vaccine, ...",U,Shellfish
3,3,916603,Dizziness,Fatigue,Mobility decreased,,,,,,,,3.0,01/01/2021,WA,58.0,F,"extreme fatigue, dizziness,. could not lift my...",Y,"Diclofenac, novacaine, lidocaine, pickles, tom..."
4,4,916604,Injection site erythema,Injection site pruritus,Injection site swelling,Injection site warmth,,4.0,MODERNA,1,IM,LA,4.0,01/01/2021,TX,47.0,F,"Injection site swelling, redness, warm to the ...",N,Na
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
48726,48105,1113920,Nasal discomfort,Night sweats,Platelet count,Platelet count decreased,Pyrexia,,,,,,34117.0,03/19/2021,PA,83.0,F,positive COVID-19 test with no symptoms; Asymp...,Y,NKA
48727,48106,1113920,Rash,SARS-CoV-2 test,,,,,,,,,34117.0,03/19/2021,PA,83.0,F,positive COVID-19 test with no symptoms; Asymp...,Y,NKA
48728,48107,1113963,Haemophagocytic lymphohistiocytosis,SARS-CoV-2 test,,,,,,,,,34118.0,03/19/2021,MS,59.0,F,HLH (hemophagocyticlymphohistiocytosis); This ...,N,NKA
48729,48108,1115045,Death,,,,,,,,,,34119.0,03/19/2021,AZ,57.0,M,Death; A spontaneous report was received from ...,N,NKA


In [7]:
# Remove the leftover "Unnamed: 0*" helper columns that the three source
# frames brought into the merged result.
# drop(..., errors="ignore") replaces the original `del` statements so that
# re-running this cell is a no-op instead of raising KeyError once the
# columns have already been removed.
merged_outer_second = merged_outer_second.drop(
    columns=["Unnamed: 0_x", "Unnamed: 0_y", "Unnamed: 0"],
    errors="ignore",
)

In [8]:
# Reduce the merged frame to one row per report: for each VAERS_ID only the
# first row (in current row order) is kept; the original index labels are
# preserved.
# Reassigning the result (rather than inplace=True) keeps the step explicit
# and avoids mutating the frame object that earlier cells displayed.
# NOTE(review): reports that span several symptom rows (e.g. VAERS_ID 1113920
# in the merge output) lose every row after the first here, so those extra
# symptoms are discarded -- confirm this is intended.
merged_outer_second = merged_outer_second.drop_duplicates(subset="VAERS_ID", keep="first")
merged_outer_second

Unnamed: 0,VAERS_ID,SYMPTOM1,SYMPTOM2,SYMPTOM3,SYMPTOM4,SYMPTOM5,Vaccine,Dose,Route,Site,RECVDATE,STATE,AGE_YRS,SEX,SYMPTOM_TEXT,RECOVD,ALLERGIES
0,916600,Dysphagia,Epiglottitis,,,,MODERNA,1,IM,LA,01/01/2021,TX,33.0,F,Right side of epiglottis swelled up and hinder...,Y,Pcn and bee venom
1,916601,Anxiety,Dyspnoea,,,,MODERNA,1,IM,RA,01/01/2021,CA,73.0,F,Approximately 30 min post vaccination administ...,Y,"""Dairy"""
2,916602,Chest discomfort,Dysphagia,Pain in extremity,Visual impairment,,PFIZER\BIONTECH,1,IM,LA,01/01/2021,WA,23.0,F,"About 15 minutes after receiving the vaccine, ...",U,Shellfish
3,916603,Dizziness,Fatigue,Mobility decreased,,,,,,,01/01/2021,WA,58.0,F,"extreme fatigue, dizziness,. could not lift my...",Y,"Diclofenac, novacaine, lidocaine, pickles, tom..."
4,916604,Injection site erythema,Injection site pruritus,Injection site swelling,Injection site warmth,,MODERNA,1,IM,LA,01/01/2021,TX,47.0,F,"Injection site swelling, redness, warm to the ...",N,Na
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
48724,1113917,Dysphagia,Hernia,Obstruction,,,,,,,03/19/2021,FL,88.0,F,throat closure three weeks after second dose; ...,U,NKA
48725,1113920,Arrhythmia,Asymptomatic COVID-19,Chills,Coccidioidomycosis,Drug ineffective,,,,,03/19/2021,PA,83.0,F,positive COVID-19 test with no symptoms; Asymp...,Y,NKA
48728,1113963,Haemophagocytic lymphohistiocytosis,SARS-CoV-2 test,,,,,,,,03/19/2021,MS,59.0,F,HLH (hemophagocyticlymphohistiocytosis); This ...,N,NKA
48729,1115045,Death,,,,,,,,,03/19/2021,AZ,57.0,M,Death; A spontaneous report was received from ...,N,NKA
