## Importing the libraries

Using set_option(), we can change the default number of rows to be displayed.
the maximum number of rows and columns to display to unlimited, allowing the  full DataFrame to be displayed when printed.

In [6]:
import pandas as pd
import re
pd.set_option('display.max_columns', None)

## Importing the dataset

By default, Pandas has the low_memory=True argument. This means that the CSV file gets split up in multiple chunks and the guess is done for every chunk, resulting in a column with multiple dtypes. By setting the low_memory argument to False, you’re basically telling Pandas not to be efficient, and process the whole file, all at once.

Latin-1 is the same as 8859-1. Every character is encoded as a single byte. There are 191 characters total.

In [7]:
vdata = pd.read_csv('2022VAERSDATA.csv', encoding='latin1',low_memory=False)
vvax = pd.read_csv('2022VAERSVAX.csv',encoding='latin1',low_memory=False)
vsymp = pd.read_csv('2022VAERSSYMPTOMS.csv',encoding='latin1',low_memory=False)

# Checking data frames

Pandas head() method is used to return top n (5 by default) rows of a data frame or series.

In [8]:
vdata.head()

Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,CAGE_YR,CAGE_MO,SEX,RPT_DATE,SYMPTOM_TEXT,DIED,DATEDIED,L_THREAT,ER_VISIT,HOSPITAL,HOSPDAYS,X_STAY,DISABLE,RECOVD,VAX_DATE,ONSET_DATE,NUMDAYS,LAB_DATA,V_ADMINBY,V_FUNDBY,OTHER_MEDS,CUR_ILL,HISTORY,PRIOR_VAX,SPLTTYPE,FORM_VERS,TODAYS_DATE,BIRTH_DEFECT,OFC_VISIT,ER_ED_VISIT,ALLERGIES
0,1996873,01/01/2022,CA,,,,U,,This spontaneous report was received from a ph...,,,,,,,,,U,12/15/2021,12/15/2021,0.0,,UNK,,,,,,US0095075132112USA007320,2,12/31/2021,,,,
1,1996874,01/01/2022,,,,,U,,SUSPECTED CLINICAL VACCINATION FAILURE; SUSPEC...,,,,,,,,,U,,,,,UNK,,,,,,USJNJFOC20211263430,2,01/01/2022,,,,
2,1996875,01/01/2022,OH,,,,M,,SUSPECTED CLINICAL VACCINATION FAILURE; SUSPEC...,,,,,,,,,U,,12/28/2021,,Test Date: 20211230; Test Name: COVID-19 antig...,OTH,,,,,,USJNJFOC20211266010,2,01/01/2022,,,,
3,1996876,01/01/2022,MS,34.0,,,F,,Irregular menstrual cycle.; period extremely h...,,,,,,,,,N,08/18/2021,09/03/2021,16.0,,PVT,,ZOLOFT; ORTHO-TRI-CYCLEN LO,,Comments: List of non-encoded Patient Relevant...,,USPFIZER INC202101162241,2,12/31/2021,,,,
4,1996877,01/01/2022,CT,,,,F,,Breakthrough and heavy periods; longer period ...,,,,,,,,,N,03/26/2021,06/07/2021,73.0,Test Date: 20210921; Test Name: Nasal Swab; Re...,PVT,,ALDACTONE [SPIRONOLACTONE],,,,USPFIZER INC202101281356,2,12/31/2021,,,,


In [9]:
vvax.head()

Unnamed: 0,VAERS_ID,VAX_TYPE,VAX_MANU,VAX_LOT,VAX_DOSE_SERIES,VAX_ROUTE,VAX_SITE,VAX_NAME
0,1996873,HPV9,MERCK & CO. INC.,R017624,UNK,,,HPV (GARDASIL 9)
1,1996874,COVID19,JANSSEN,,1,OT,,COVID19 (COVID19 (JANSSEN))
2,1996875,COVID19,JANSSEN,204A21A,1,,,COVID19 (COVID19 (JANSSEN))
3,1996876,COVID19,PFIZER\BIONTECH,Fd8448,2,,LA,COVID19 (COVID19 (PFIZER-BIONTECH))
4,1996877,COVID19,PFIZER\BIONTECH,EP6955,1,,LA,COVID19 (COVID19 (PFIZER-BIONTECH))


In [10]:
vsymp.head()

Unnamed: 0,VAERS_ID,SYMPTOM1,SYMPTOMVERSION1,SYMPTOM2,SYMPTOMVERSION2,SYMPTOM3,SYMPTOMVERSION3,SYMPTOM4,SYMPTOMVERSION4,SYMPTOM5,SYMPTOMVERSION5
0,1996873,Expired product administered,24.1,No adverse event,24.1,,,,,,
1,1996874,Suspected COVID-19,24.1,Vaccination failure,24.1,,,,,,
2,1996875,SARS-CoV-2 test,24.1,Suspected COVID-19,24.1,Vaccination failure,24.1,,,,
3,1996876,Dysmenorrhoea,24.1,Heavy menstrual bleeding,24.1,Menstruation irregular,24.1,,,,
4,1996877,Heavy menstrual bleeding,24.1,Oligomenorrhoea,24.1,SARS-CoV-2 test negative,24.1,,,,


Pandas duplicated() method helps in analyzing duplicate values only. Counts duplicated VAERS ID.

In [11]:
tt = vsymp.duplicated(subset=['VAERS_ID'])
tt = tt.value_counts()
print(tt)

False    240841
True      81137
dtype: int64


The len() function returns the number of items in an object.

In [12]:
a = len(vdata)
b = len(vvax)
c = len(vsymp)
print(a,b,c)

240841 276445 321978


The value_counts() function is used to get a Series containing counts of unique values.

In [13]:
vt= vdata.duplicated(subset=["VAERS_ID"])
vt= (vt.value_counts())
vv= vvax.duplicated(subset=["VAERS_ID"])
vv= (vv.value_counts())
vs= vsymp.duplicated(subset=["VAERS_ID"])
vs= (vs.value_counts())
print(vt,'\n',vv,'\n',vs)

False    240841
dtype: int64 
 False    240841
True      35604
dtype: int64 
 False    240841
True      81137
dtype: int64


# Merging Data

Outer Merge returns all records from both the left or right dataframes. When rows in one dataframe do not match another dataframe, the merged dataframe will have NaN for the cells.  Use how=’outer’ in merge() to outer merge two dataframes in Pandas.

In [14]:
v1 = vdata.merge(vvax, on='VAERS_ID', how='outer')
v1

Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,CAGE_YR,CAGE_MO,SEX,RPT_DATE,SYMPTOM_TEXT,DIED,DATEDIED,L_THREAT,ER_VISIT,HOSPITAL,HOSPDAYS,X_STAY,DISABLE,RECOVD,VAX_DATE,ONSET_DATE,NUMDAYS,LAB_DATA,V_ADMINBY,V_FUNDBY,OTHER_MEDS,CUR_ILL,HISTORY,PRIOR_VAX,SPLTTYPE,FORM_VERS,TODAYS_DATE,BIRTH_DEFECT,OFC_VISIT,ER_ED_VISIT,ALLERGIES,VAX_TYPE,VAX_MANU,VAX_LOT,VAX_DOSE_SERIES,VAX_ROUTE,VAX_SITE,VAX_NAME
0,1996873,01/01/2022,CA,,,,U,,This spontaneous report was received from a ph...,,,,,,,,,U,12/15/2021,12/15/2021,0.0,,UNK,,,,,,US0095075132112USA007320,2,12/31/2021,,,,,HPV9,MERCK & CO. INC.,R017624,UNK,,,HPV (GARDASIL 9)
1,1996874,01/01/2022,,,,,U,,SUSPECTED CLINICAL VACCINATION FAILURE; SUSPEC...,,,,,,,,,U,,,,,UNK,,,,,,USJNJFOC20211263430,2,01/01/2022,,,,,COVID19,JANSSEN,,1,OT,,COVID19 (COVID19 (JANSSEN))
2,1996875,01/01/2022,OH,,,,M,,SUSPECTED CLINICAL VACCINATION FAILURE; SUSPEC...,,,,,,,,,U,,12/28/2021,,Test Date: 20211230; Test Name: COVID-19 antig...,OTH,,,,,,USJNJFOC20211266010,2,01/01/2022,,,,,COVID19,JANSSEN,204A21A,1,,,COVID19 (COVID19 (JANSSEN))
3,1996876,01/01/2022,MS,34.0,,,F,,Irregular menstrual cycle.; period extremely h...,,,,,,,,,N,08/18/2021,09/03/2021,16.0,,PVT,,ZOLOFT; ORTHO-TRI-CYCLEN LO,,Comments: List of non-encoded Patient Relevant...,,USPFIZER INC202101162241,2,12/31/2021,,,,,COVID19,PFIZER\BIONTECH,Fd8448,2,,LA,COVID19 (COVID19 (PFIZER-BIONTECH))
4,1996877,01/01/2022,CT,,,,F,,Breakthrough and heavy periods; longer period ...,,,,,,,,,N,03/26/2021,06/07/2021,73.0,Test Date: 20210921; Test Name: Nasal Swab; Re...,PVT,,ALDACTONE [SPIRONOLACTONE],,,,USPFIZER INC202101281356,2,12/31/2021,,,,,COVID19,PFIZER\BIONTECH,EP6955,1,,LA,COVID19 (COVID19 (PFIZER-BIONTECH))
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
276440,2541569,12/23/2022,,2.0,2.0,0.3,F,,No adverse event; Vaccine administered after b...,,,,,,,,,U,07/09/2022,07/09/2022,0.0,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,AS1414B,UNK,OT,,COVID19 (COVID19 (MODERNA))
276441,2541570,12/23/2022,,68.0,,,F,,No adverse event; lot that had been expired wa...,,,,,,,,,U,,,,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,O70H21A,UNK,OT,,COVID19 (COVID19 (MODERNA))
276442,2541571,12/23/2022,,79.0,,,M,,No adverse event; Expired vaccine used; This s...,,,,,,,,,U,,,,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,O70H21A,UNK,OT,,COVID19 (COVID19 (MODERNA))
276443,2541572,12/23/2022,,63.0,,,M,,no adverse event; expired vaccine used; This s...,,,,,,,,,U,,,,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,O70H21A,UNK,OT,,COVID19 (COVID19 (MODERNA))


In [15]:
VAERSM = v1.merge(vsymp, on ="VAERS_ID", how='outer')
VAERSM

Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,CAGE_YR,CAGE_MO,SEX,RPT_DATE,SYMPTOM_TEXT,DIED,DATEDIED,L_THREAT,ER_VISIT,HOSPITAL,HOSPDAYS,X_STAY,DISABLE,RECOVD,VAX_DATE,ONSET_DATE,NUMDAYS,LAB_DATA,V_ADMINBY,V_FUNDBY,OTHER_MEDS,CUR_ILL,HISTORY,PRIOR_VAX,SPLTTYPE,FORM_VERS,TODAYS_DATE,BIRTH_DEFECT,OFC_VISIT,ER_ED_VISIT,ALLERGIES,VAX_TYPE,VAX_MANU,VAX_LOT,VAX_DOSE_SERIES,VAX_ROUTE,VAX_SITE,VAX_NAME,SYMPTOM1,SYMPTOMVERSION1,SYMPTOM2,SYMPTOMVERSION2,SYMPTOM3,SYMPTOMVERSION3,SYMPTOM4,SYMPTOMVERSION4,SYMPTOM5,SYMPTOMVERSION5
0,1996873,01/01/2022,CA,,,,U,,This spontaneous report was received from a ph...,,,,,,,,,U,12/15/2021,12/15/2021,0.0,,UNK,,,,,,US0095075132112USA007320,2,12/31/2021,,,,,HPV9,MERCK & CO. INC.,R017624,UNK,,,HPV (GARDASIL 9),Expired product administered,24.1,No adverse event,24.1,,,,,,
1,1996874,01/01/2022,,,,,U,,SUSPECTED CLINICAL VACCINATION FAILURE; SUSPEC...,,,,,,,,,U,,,,,UNK,,,,,,USJNJFOC20211263430,2,01/01/2022,,,,,COVID19,JANSSEN,,1,OT,,COVID19 (COVID19 (JANSSEN)),Suspected COVID-19,24.1,Vaccination failure,24.1,,,,,,
2,1996875,01/01/2022,OH,,,,M,,SUSPECTED CLINICAL VACCINATION FAILURE; SUSPEC...,,,,,,,,,U,,12/28/2021,,Test Date: 20211230; Test Name: COVID-19 antig...,OTH,,,,,,USJNJFOC20211266010,2,01/01/2022,,,,,COVID19,JANSSEN,204A21A,1,,,COVID19 (COVID19 (JANSSEN)),SARS-CoV-2 test,24.1,Suspected COVID-19,24.1,Vaccination failure,24.1,,,,
3,1996876,01/01/2022,MS,34.0,,,F,,Irregular menstrual cycle.; period extremely h...,,,,,,,,,N,08/18/2021,09/03/2021,16.0,,PVT,,ZOLOFT; ORTHO-TRI-CYCLEN LO,,Comments: List of non-encoded Patient Relevant...,,USPFIZER INC202101162241,2,12/31/2021,,,,,COVID19,PFIZER\BIONTECH,Fd8448,2,,LA,COVID19 (COVID19 (PFIZER-BIONTECH)),Dysmenorrhoea,24.1,Heavy menstrual bleeding,24.1,Menstruation irregular,24.1,,,,
4,1996877,01/01/2022,CT,,,,F,,Breakthrough and heavy periods; longer period ...,,,,,,,,,N,03/26/2021,06/07/2021,73.0,Test Date: 20210921; Test Name: Nasal Swab; Re...,PVT,,ALDACTONE [SPIRONOLACTONE],,,,USPFIZER INC202101281356,2,12/31/2021,,,,,COVID19,PFIZER\BIONTECH,EP6955,1,,LA,COVID19 (COVID19 (PFIZER-BIONTECH)),Heavy menstrual bleeding,24.1,Oligomenorrhoea,24.1,SARS-CoV-2 test negative,24.1,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
375745,2541569,12/23/2022,,2.0,2.0,0.3,F,,No adverse event; Vaccine administered after b...,,,,,,,,,U,07/09/2022,07/09/2022,0.0,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,AS1414B,UNK,OT,,COVID19 (COVID19 (MODERNA)),Expired product administered,25.1,No adverse event,25.1,,,,,,
375746,2541570,12/23/2022,,68.0,,,F,,No adverse event; lot that had been expired wa...,,,,,,,,,U,,,,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,O70H21A,UNK,OT,,COVID19 (COVID19 (MODERNA)),Expired product administered,25.1,No adverse event,25.1,,,,,,
375747,2541571,12/23/2022,,79.0,,,M,,No adverse event; Expired vaccine used; This s...,,,,,,,,,U,,,,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,O70H21A,UNK,OT,,COVID19 (COVID19 (MODERNA)),Expired product administered,25.1,No adverse event,25.1,,,,,,
375748,2541572,12/23/2022,,63.0,,,M,,no adverse event; expired vaccine used; This s...,,,,,,,,,U,,,,,UNK,,,,,,"USMODERNATX, INC.MOD20226",2,12/23/2022,,,,,COVID19,MODERNA,O70H21A,UNK,OT,,COVID19 (COVID19 (MODERNA)),Expired product administered,25.1,No adverse event,25.1,,,,,,


Checks for duplicated data after merge

In [16]:
test = VAERSM.duplicated(subset=["VAERS_ID"])
test.value_counts()

False    240841
True     134909
dtype: int64

Checks all cloumns in dataframe

In [17]:
VAERSM.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 375750 entries, 0 to 375749
Data columns (total 52 columns):
 #   Column           Non-Null Count   Dtype  
---  ------           --------------   -----  
 0   VAERS_ID         375750 non-null  int64  
 1   RECVDATE         375750 non-null  object 
 2   STATE            311582 non-null  object 
 3   AGE_YRS          332973 non-null  float64
 4   CAGE_YR          296842 non-null  float64
 5   CAGE_MO          7581 non-null    float64
 6   SEX              375750 non-null  object 
 7   RPT_DATE         184 non-null     object 
 8   SYMPTOM_TEXT     375288 non-null  object 
 9   DIED             16665 non-null   object 
 10  DATEDIED         15475 non-null   object 
 11  L_THREAT         9316 non-null    object 
 12  ER_VISIT         36 non-null      object 
 13  HOSPITAL         79730 non-null   object 
 14  HOSPDAYS         55068 non-null   float64
 15  X_STAY           236 non-null     object 
 16  DISABLE          14984 non-null   obje

# Searching for symptom 

Searching for myocarditis symptom

The re.IGNORECASE allows the regular expression to become case-insensitive

A Regular Expression (RegEx) is a sequence of characters that defines a search pattern.

na: fill value for missing values. The default depends on dtype of the array. 

In [18]:
found = VAERSM[VAERSM['SYMPTOM_TEXT'].str.contains('myocarditis',na=False, flags=re.IGNORECASE, regex=True)]
found

Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,CAGE_YR,CAGE_MO,SEX,RPT_DATE,SYMPTOM_TEXT,DIED,DATEDIED,L_THREAT,ER_VISIT,HOSPITAL,HOSPDAYS,X_STAY,DISABLE,RECOVD,VAX_DATE,ONSET_DATE,NUMDAYS,LAB_DATA,V_ADMINBY,V_FUNDBY,OTHER_MEDS,CUR_ILL,HISTORY,PRIOR_VAX,SPLTTYPE,FORM_VERS,TODAYS_DATE,BIRTH_DEFECT,OFC_VISIT,ER_ED_VISIT,ALLERGIES,VAX_TYPE,VAX_MANU,VAX_LOT,VAX_DOSE_SERIES,VAX_ROUTE,VAX_SITE,VAX_NAME,SYMPTOM1,SYMPTOMVERSION1,SYMPTOM2,SYMPTOMVERSION2,SYMPTOM3,SYMPTOMVERSION3,SYMPTOM4,SYMPTOMVERSION4,SYMPTOM5,SYMPTOMVERSION5
346,1997198,01/01/2022,MD,56.0,56.0,,M,,Onset of headache and neck pain 10/10 over 1 m...,,,,,,,,,U,10/26/2021,10/26/2021,0.0,ECG telemetry showing SVT,OTH,,famotidine but have not been taking,,,flu vaccine 15 years ago but only neuropathy a...,,2,01/01/2022,,Y,,Penicillin,COVID19,JANSSEN,,UNK,,,COVID19 (COVID19 (JANSSEN)),Cardiac telemetry abnormal,24.1,Dyspnoea,24.1,Fatigue,24.1,Headache,24.1,Insomnia,24.1
347,1997198,01/01/2022,MD,56.0,56.0,,M,,Onset of headache and neck pain 10/10 over 1 m...,,,,,,,,,U,10/26/2021,10/26/2021,0.0,ECG telemetry showing SVT,OTH,,famotidine but have not been taking,,,flu vaccine 15 years ago but only neuropathy a...,,2,01/01/2022,,Y,,Penicillin,COVID19,JANSSEN,,UNK,,,COVID19 (COVID19 (JANSSEN)),Myocarditis,24.1,Neck pain,24.1,Palpitations,24.1,Supraventricular tachycardia,24.1,,
384,1997216,01/01/2022,OH,43.0,43.0,,M,,Thirteen days after I received this dose of th...,,,,,,,,,U,05/29/2021,06/11/2021,13.0,The following labs were drawn and measured: CB...,PUB,,"Flecainide, metoprolol, cabergoline, cetirizne...",,Idiopathic ventricular fibrillation,,,2,01/01/2022,,Y,,,COVID19,JANSSEN,1808982,1,SYR,AR,COVID19 (COVID19 (JANSSEN)),Blood magnesium,24.1,Blood thyroid stimulating hormone,24.1,Full blood count,24.1,Metabolic function test,24.1,Ventricular fibrillation,24.1
458,1997256,01/01/2022,MT,15.0,15.0,,M,,"chest pain on 12/20/21 intermittently, then co...",,,,,Y,1.0,,,Y,12/27/2021,12/30/2021,3.0,"elevated troponin, elevated CRP; nml d-dimer",PHM,,none,none,none,,,2,01/01/2022,,,,none,COVID19,PFIZER\BIONTECH,ED0809,1,IM,LA,COVID19 (COVID19 (PFIZER-BIONTECH)),C-reactive protein increased,24.1,Chest pain,24.1,Fibrin D dimer normal,24.1,Myocarditis,24.1,Troponin increased,24.1
479,1997273,01/01/2022,CA,18.0,18.0,,M,,The patient developed low grade fevers 24 hour...,,,Y,,Y,5.0,,,N,12/21/2021,12/23/2021,2.0,"all 2021: Troponin-I: 12/26 .51 ug/ml, 12/26 ...",PVT,,"Flovent 44 mcg, 2 puffs twice daily, vitamin C...",subjective sensation of dyspnea since COVID 10...,History of COVID 10/15/21,,,2,12/30/2021,,,Y,none,COVID19,PFIZER\BIONTECH,FJ1620,3,IM,RA,COVID19 (COVID19 (PFIZER-BIONTECH)),Abnormal faeces,24.1,Alanine aminotransferase increased,24.1,Aspartate aminotransferase increased,24.1,Blood fibrinogen increased,24.1,Blood lactate dehydrogenase increased,24.1
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
375371,2540525,12/22/2022,VA,64.0,64.0,,M,,"sudden cardiac arrest, ems response, transport...",,,,,Y,7.0,,,Y,10/14/2022,11/06/2022,23.0,,UNK,,,none,none,,,2,12/22/2022,,Y,,none,COVID19-2,MODERNA,,1,IM,LA,COVID19 (COVID19 (MODERNA BIVALENT)),Cardiac arrest,25.1,Cardiac dysfunction,25.1,Cardiac pacemaker insertion,25.1,Endotracheal intubation,25.1,Implantable defibrillator insertion,25.1
375372,2540525,12/22/2022,VA,64.0,64.0,,M,,"sudden cardiac arrest, ems response, transport...",,,,,Y,7.0,,,Y,10/14/2022,11/06/2022,23.0,,UNK,,,none,none,,,2,12/22/2022,,Y,,none,COVID19-2,MODERNA,,1,IM,LA,COVID19 (COVID19 (MODERNA BIVALENT)),Intensive care,25.1,Myocarditis,25.1,,,,,,
375454,2540650,12/22/2022,MI,54.0,54.0,,F,,Date of Admission: 10/19/2022 Date of Discharg...,,,,,Y,,,,Y,05/25/2021,10/19/2022,512.0,"10/19 Covid-19, Flu, RSV by NAA, Detected",UNK,,,,,,,2,,,,,,COVID19,PFIZER\BIONTECH,EW0191,2,,,COVID19 (COVID19 (PFIZER-BIONTECH)),COVID-19,25.1,Influenza virus test positive,25.1,Respiratory syncytial virus test positive,25.1,SARS-CoV-2 test positive,25.1,,
375562,2541334,12/23/2022,,,,,M,,HEART FAILURE; This spontaneous report receive...,Y,,,,,,,,N,,,,,UNK,,,,,,USJNJFOC20221245816,2,12/22/2022,,,,,COVID19,JANSSEN,,1,,,COVID19 (COVID19 (JANSSEN)),Cardiac failure,25.1,,,,,,,,


Remove duplicate data. You don't remove duplicates at the beginning because an individual can file multiple results and a particular symptom could be reported on the final file

Pandas drop_duplicates() method helps in removing duplicates from the Pandas Dataframe In Python.

In [19]:
refine = found.drop_duplicates(subset=['VAERS_ID'],keep='first')
refine

Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,CAGE_YR,CAGE_MO,SEX,RPT_DATE,SYMPTOM_TEXT,DIED,DATEDIED,L_THREAT,ER_VISIT,HOSPITAL,HOSPDAYS,X_STAY,DISABLE,RECOVD,VAX_DATE,ONSET_DATE,NUMDAYS,LAB_DATA,V_ADMINBY,V_FUNDBY,OTHER_MEDS,CUR_ILL,HISTORY,PRIOR_VAX,SPLTTYPE,FORM_VERS,TODAYS_DATE,BIRTH_DEFECT,OFC_VISIT,ER_ED_VISIT,ALLERGIES,VAX_TYPE,VAX_MANU,VAX_LOT,VAX_DOSE_SERIES,VAX_ROUTE,VAX_SITE,VAX_NAME,SYMPTOM1,SYMPTOMVERSION1,SYMPTOM2,SYMPTOMVERSION2,SYMPTOM3,SYMPTOMVERSION3,SYMPTOM4,SYMPTOMVERSION4,SYMPTOM5,SYMPTOMVERSION5
346,1997198,01/01/2022,MD,56.0,56.0,,M,,Onset of headache and neck pain 10/10 over 1 m...,,,,,,,,,U,10/26/2021,10/26/2021,0.0,ECG telemetry showing SVT,OTH,,famotidine but have not been taking,,,flu vaccine 15 years ago but only neuropathy a...,,2,01/01/2022,,Y,,Penicillin,COVID19,JANSSEN,,UNK,,,COVID19 (COVID19 (JANSSEN)),Cardiac telemetry abnormal,24.1,Dyspnoea,24.1,Fatigue,24.1,Headache,24.1,Insomnia,24.1
384,1997216,01/01/2022,OH,43.0,43.0,,M,,Thirteen days after I received this dose of th...,,,,,,,,,U,05/29/2021,06/11/2021,13.0,The following labs were drawn and measured: CB...,PUB,,"Flecainide, metoprolol, cabergoline, cetirizne...",,Idiopathic ventricular fibrillation,,,2,01/01/2022,,Y,,,COVID19,JANSSEN,1808982,1,SYR,AR,COVID19 (COVID19 (JANSSEN)),Blood magnesium,24.1,Blood thyroid stimulating hormone,24.1,Full blood count,24.1,Metabolic function test,24.1,Ventricular fibrillation,24.1
458,1997256,01/01/2022,MT,15.0,15.0,,M,,"chest pain on 12/20/21 intermittently, then co...",,,,,Y,1.0,,,Y,12/27/2021,12/30/2021,3.0,"elevated troponin, elevated CRP; nml d-dimer",PHM,,none,none,none,,,2,01/01/2022,,,,none,COVID19,PFIZER\BIONTECH,ED0809,1,IM,LA,COVID19 (COVID19 (PFIZER-BIONTECH)),C-reactive protein increased,24.1,Chest pain,24.1,Fibrin D dimer normal,24.1,Myocarditis,24.1,Troponin increased,24.1
479,1997273,01/01/2022,CA,18.0,18.0,,M,,The patient developed low grade fevers 24 hour...,,,Y,,Y,5.0,,,N,12/21/2021,12/23/2021,2.0,"all 2021: Troponin-I: 12/26 .51 ug/ml, 12/26 ...",PVT,,"Flovent 44 mcg, 2 puffs twice daily, vitamin C...",subjective sensation of dyspnea since COVID 10...,History of COVID 10/15/21,,,2,12/30/2021,,,Y,none,COVID19,PFIZER\BIONTECH,FJ1620,3,IM,RA,COVID19 (COVID19 (PFIZER-BIONTECH)),Abnormal faeces,24.1,Alanine aminotransferase increased,24.1,Aspartate aminotransferase increased,24.1,Blood fibrinogen increased,24.1,Blood lactate dehydrogenase increased,24.1
643,1997414,01/01/2022,CA,50.0,50.0,,M,,Cardiac arrest Myocarditis,,,Y,,Y,7.0,,,N,12/23/2021,12/24/2021,1.0,,PVT,,,Seasonal asthma Seasonal allergies,Seasonal allergies Sesonal Asthma,,,2,01/01/2022,,,Y,,COVID19,PFIZER\BIONTECH,FL3197,3,IM,LA,COVID19 (COVID19 (PFIZER-BIONTECH)),Cardiac arrest,24.1,Myocarditis,24.1,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
375361,2540253,12/22/2022,,5.0,,,F,,myocarditis; Initial information received on 1...,Y,,,,,,,,N,,,,,UNK,,,,,,USSA2022SA513796,2,12/21/2022,,,,,FLUX,UNKNOWN MANUFACTURER,,UNK,OT,,INFLUENZA (SEASONAL) (NO BRAND NAME),Death,25.1,Myocarditis,25.1,,,,,,
375371,2540525,12/22/2022,VA,64.0,64.0,,M,,"sudden cardiac arrest, ems response, transport...",,,,,Y,7.0,,,Y,10/14/2022,11/06/2022,23.0,,UNK,,,none,none,,,2,12/22/2022,,Y,,none,COVID19-2,MODERNA,,1,IM,LA,COVID19 (COVID19 (MODERNA BIVALENT)),Cardiac arrest,25.1,Cardiac dysfunction,25.1,Cardiac pacemaker insertion,25.1,Endotracheal intubation,25.1,Implantable defibrillator insertion,25.1
375454,2540650,12/22/2022,MI,54.0,54.0,,F,,Date of Admission: 10/19/2022 Date of Discharg...,,,,,Y,,,,Y,05/25/2021,10/19/2022,512.0,"10/19 Covid-19, Flu, RSV by NAA, Detected",UNK,,,,,,,2,,,,,,COVID19,PFIZER\BIONTECH,EW0191,2,,,COVID19 (COVID19 (PFIZER-BIONTECH)),COVID-19,25.1,Influenza virus test positive,25.1,Respiratory syncytial virus test positive,25.1,SARS-CoV-2 test positive,25.1,,
375562,2541334,12/23/2022,,,,,M,,HEART FAILURE; This spontaneous report receive...,Y,,,,,,,,N,,,,,UNK,,,,,,USJNJFOC20221245816,2,12/22/2022,,,,,COVID19,JANSSEN,,1,,,COVID19 (COVID19 (JANSSEN)),Cardiac failure,25.1,,,,,,,,


# Symptom Display

In [20]:
pd.set_option('display.max_colwidth', None)

In [21]:
refine[['VAERS_ID','SYMPTOM_TEXT']]

Unnamed: 0,VAERS_ID,SYMPTOM_TEXT
346,1997198,"Onset of headache and neck pain 10/10 over 1 minute which resolved after 2 days After 4 days developed myocarditis with SVT with several bouts of heart rate to 140's and SVT on ECG telemetry. Palpitations, insomnia, Dyspnea, shortness of breath, fatigue, headaches. Gradually resolving over last few months."
384,1997216,"Thirteen days after I received this dose of the Janssen COVID vaccine my Automated Internal Cardiac Defibrillator fired twice as I was experiencing ventricular fibrillation. This was not a new condition to me (hence the AICD) but it was the first time being shocked in over 2.5 years, and I have not been shocked since then. The labs run that day show no electrolyte imbalance nor any other common cause that might explain why I was shocked. I know the Janssen vaccine may cause myocarditis, a common symptom of which is cardiac arrhythmias. I did ask my electrophysiology cardiologist before my vaccination if it was safe for me to do so, and he agreed the risk was worth it. I did not think at the time I was shocked that it might be vaccine-related. I have since asked my EP cardiologist several times if there was any data gathered that might answer the question of whether or not I had myocarditis on June 11, 2021. No one will answer that question."
458,1997256,"chest pain on 12/20/21 intermittently, then continued through the night into the early morning on 12/31/21. Seen in the ED with chest pain and had elevated troponin 10K, peak was 12K and elevated crp. Nml d-dimer. Admission for myocarditis overnight stay"
479,1997273,"The patient developed low grade fevers 24 hours after his flu vaccine and pfizer booster. Approx 48 hours after the vaccines, his fevers started spiking to tmax 103.7. He was treated at home until 12/26 with alternating ibuprofen and tylenol until 12/26 when, upon discussion with his primary care doc, me, he went to the ER. In ER noted to be hypotensive, tachycardic, and w fever. Also developed vomiting. Given fluids and ceftriaxone. Noted to have elevated troponin, crp, ldh. Normal chest xray. EKG with mild t wave abnormalities which resolved on second EKG. Normal bedside echo. Stabilized, sent to ICU for monitoring. Labs generally improved. Formal Echo normal. On 12/27 developed GI bleed w melanotic stool. sent for EGD and colonoscopy which showed possible mallory weiss tear/gastritis. Placed on protonix and received blood transfusion for drop of hemoglobin from 13 to 8. Advanced diet slowly. Meanwhile ebv serology came back igm positive, heterophile neg. CMV igm also positive. NO EBV DNA found. Patient stablized well with down trending troponins and inflammatory markers Hemoglobin stable able to eat and drink Discharged home on protonix and carafate on 12/30/21 Ultimately diagnosed with EBV and hyperinflammatory state. No Misc given self resolving fever and downtrending inflammation without treatement. No myocarditis given normal echo, ekgs, and normal cardiac MRI. It was felt that the elevated troponins were due to cross reactivity with EBV."
643,1997414,Cardiac arrest Myocarditis
...,...,...
375361,2540253,"myocarditis; Initial information received on 16-Dec-2022 regarding an unsolicited valid serious case received from a consumer/non-hcp received from social media page. This case involves a 5 years old female patient who experienced myocarditis after receiving vaccine influenza vaccine. It is unknown if the patient had any medical history, concomitant disease or risk factor. The patient's past medical history, medical treatment(s), vaccination(s) and family history were not provided. On an unknown date, the patient received an unknown dose (units unspecified) of suspect influenza vaccine produced by unknown manufacturer (formulation; strength; lot number and expiry date not reported) via unknown route in unknown administration site for prophylactic vaccination. On an unknown date the patient had a serious event of myocarditis (unknown latency) following the administration of influenza vaccine. It was unknown if there were lab data/results available. Action taken was not applicable. It was not reported if the patient received a corrective treatment for the event. At time of reporting, the outcome was Fatal for the event. No autopsy was done. The cause of death was reported as Myocarditis. This event was assessed as medically significant and was leading to death.; Sender's Comments: Sanofi company comment for information received on 21-Dec-2022: This case involves a 5 years old female patient who experienced myocarditis after receiving vaccine influenza vaccine. The causal role of the company suspect vaccine cannot be assessed based on the temporal relevance. The time to onset is not reported with the role of the vaccine. Further information regarding concurrent condition during vaccination, previous vaccination, tolerance, allergic history, laboratory investigations , autopsy results excluding alternative etiologies for the reported event are needed to fully assess this case. Based on the data provided, the role of vaccine cannot be assessed.; Reported Cause(s) of Death: myocarditis"
375371,2540525,"sudden cardiac arrest, ems response, transported to hospital, intubation and restore heart function, four days in ccu, diagnosis myocarditis from the booster, left ventricle 35 percent function, pacemaker and defibrillator installed, one week in hospital discharged with medication and restrictions"
375454,2540650,Date of Admission: 10/19/2022 Date of Discharge: 10/26/2022 Active Hospital Problems Diagnosis o Heart failure (CMS/HCC) o Stress-induced cardiomyopathy o COVID-19 o Myocarditis (CMS/HCC) o HLD o Coronary artery disease involving native coronary artery of native heart without angina pectoris o HTN
375562,2541334,"HEART FAILURE; This spontaneous report received from a consumer via a company representative via social media concerned a 18 year old male of an unspecified race and ethnicity. The patient's weight, height, and medical history were not reported. The patient received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, and batch number were not reported, expiry: unknown) dose was not reported, 1 total, start therapy date were not reported for covid-19 prophylaxis. The batch number was not reported. Per procedure, no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patient died from heart failure. It was unspecified if an autopsy was performed. The reporter stated that ""No, you do not have the data. Because injuries are not being reported into VAERS. I had 1 coworker whose lips and tongue went numb after his vaccine, and he nearly died. 2 others had severe tinnitus. One had hands so painful he sat there rubbing them nearly crying. Another had he and his wife both experiencing numb hands with loss of grip. Another coworker's wife has myocarditis. My supervisor's daughter had her 18 year old best friend die of heart failure after his vaccine. These adverse events are not rare, look in every comment section about Covid vaccines. And do not give me that ""anecdotal"" stuff. Big pharma can not hide behind that lie forever "". The action taken with covid-19 vaccine ad26.cov2.s was not applicable. This report was serious (Death). This case, from the same reporter is linked to 20221243340, 20221243356, 20221243261, 20221243606, 20221245881 and 20221245969.; Sender's Comments: V0: 20221245816- Heart failure. The event has an unknown/unclear temporal relationship, is unlabeled, and has unknown scientific plausibility. There is no information on any other factors potentially associated with the event. Therefore, the WHO Causality is considered indeterminate. The company causality is considered unassessable.; Reported Cause(s) of Death: HEART FAILURE"


# Searching for death

In [22]:
pd.set_option('display.max_colwidth', None)

Pandas provide many methods to filter a Data frame and Dataframe.query() is one of them.

In [23]:
rr = VAERSM.query('DIED=="Y"')
rr

Unnamed: 0,VAERS_ID,RECVDATE,STATE,AGE_YRS,CAGE_YR,CAGE_MO,SEX,RPT_DATE,SYMPTOM_TEXT,DIED,DATEDIED,L_THREAT,ER_VISIT,HOSPITAL,HOSPDAYS,X_STAY,DISABLE,RECOVD,VAX_DATE,ONSET_DATE,NUMDAYS,LAB_DATA,V_ADMINBY,V_FUNDBY,OTHER_MEDS,CUR_ILL,HISTORY,PRIOR_VAX,SPLTTYPE,FORM_VERS,TODAYS_DATE,BIRTH_DEFECT,OFC_VISIT,ER_ED_VISIT,ALLERGIES,VAX_TYPE,VAX_MANU,VAX_LOT,VAX_DOSE_SERIES,VAX_ROUTE,VAX_SITE,VAX_NAME,SYMPTOM1,SYMPTOMVERSION1,SYMPTOM2,SYMPTOMVERSION2,SYMPTOM3,SYMPTOMVERSION3,SYMPTOM4,SYMPTOMVERSION4,SYMPTOM5,SYMPTOMVERSION5
606,1997395,01/01/2022,MS,59.0,59.0,,M,,"Hospitalized for fever, seizure, pneumonia 9/3/21 Death by cardiac arrest from blood clot on September 16, 2021",Y,09/16/2021,,,Y,13.0,,,N,08/20/2021,09/01/2021,12.0,,PVT,,Insulin,,Diabetes,,,2,01/01/2022,,,Y,,COVID19,MODERNA,059EZIA,1,IM,UN,COVID19 (COVID19 (MODERNA)),Cardiac arrest,24.1,Death,24.1,Pneumonia,24.1,Pyrexia,24.1,Seizure,24.1
607,1997395,01/01/2022,MS,59.0,59.0,,M,,"Hospitalized for fever, seizure, pneumonia 9/3/21 Death by cardiac arrest from blood clot on September 16, 2021",Y,09/16/2021,,,Y,13.0,,,N,08/20/2021,09/01/2021,12.0,,PVT,,Insulin,,Diabetes,,,2,01/01/2022,,,Y,,COVID19,MODERNA,059EZIA,1,IM,UN,COVID19 (COVID19 (MODERNA)),Thrombosis,24.1,,,,,,,,
669,1997432,01/01/2022,PA,29.0,29.0,,M,,"Soon after getting J&J Booster, Patient started complaining about shortness of breath that would come and go. On 12/22/2021 he was feeling like ""crap"" and thought it was COVID and was waiting to get tested. We found him dead in his apartment, and the autopsy revealed pulmonary thrombo embolism.",Y,12/23/2021,,,,,,,N,12/02/2021,12/06/2021,4.0,autopsy on 12/27/2021,PHM,,the only thing he took was acid reducer over the counter medication.,,,,,2,01/01/2022,,,,"Cats, ashtma",COVID19,JANSSEN,213D21A,1,UN,UN,COVID19 (COVID19 (JANSSEN)),Autopsy,24.1,Death,24.1,Dyspnoea,24.1,Feeling abnormal,24.1,Pulmonary embolism,24.1
826,2501714,01/01/2022,,80.0,78.0,,M,,Narrative: hospice pt,Y,04/26/2021,,,,,,,U,02/16/2021,04/24/2021,67.0,,OTH,,,,,,,2,01/01/2022,,Y,Y,,COVID19,PFIZER\BIONTECH,,UNK,,,COVID19 (COVID19 (PFIZER-BIONTECH)),Death,25.1,,,,,,,,
901,2504173,01/01/2022,,89.0,87.0,,M,,Narrative: hospice pt,Y,05/24/2021,,,,,,,U,02/02/2021,05/24/2021,111.0,,OTH,,,,,,,2,01/01/2022,,Y,Y,,COVID19,PFIZER\BIONTECH,,UNK,,,COVID19 (COVID19 (PFIZER-BIONTECH)),Death,25.1,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
375550,2541324,12/23/2022,,,,,U,,"DIED; This spontaneous report received from a consumer via a company representative through social media concerned multiple patients of an unspecified age, sex, race and ethnicity. The patient's weight, height, and medical history were not reported. The patients received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, and batch number were not reported, expiry: unknown) dose not reported,1 total, administered on an unspecified date for covid-19 prophylaxis. The batch number was not reported. Per procedure, no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patients died from unknown cause of death after they were fully vaccinated. It was unspecified if an autopsy was performed. The reporter stated that, ""They were right the only people that I know who have died are fully vaccinated"". The action taken with covid-19 vaccine ad26.cov2.s was not applicable. This report was serious (Death).; Sender's Comments: V0-20221243109-Died. Insufficient information is available to make a causality assessment. Therefore, this event is considered unclassifiable.; Reported Cause(s) of Death: UNKNOWN CAUSE OF DEATH",Y,,,,,,,,N,,,,,UNK,,,,,,USJNJFOC20221243109,2,12/22/2022,,,,,COVID19,JANSSEN,,1,,,COVID19 (COVID19 (JANSSEN)),Death,25.1,,,,,,,,
375554,2541326,12/23/2022,,,,,M,,"ENDED UP PASSING AWAY; GOT WORSE AND WORSE; This spontaneous report received from a consumer via a company representative via social media concerned a male of unspecified age, race and ethnicity. The patient's weight, height, and medical history were not reported. The patient received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, batch number and expiry were not reported) dose, start therapy date were not reported, 1 total, administered for covid-19 prophylaxis. The batch number was not reported. Per procedure no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patient got worse and worse and on an unspecified date patient ended up passing away. It was reported that ""My husband got thanks j j shot too years ago and then he got worse and worse and ended up passing away"". On an unspecified date, the patient died from unknown cause of death. It was unknown whether an autopsy was performed. The action taken with covid-19 vaccine ad26.cov2.s was not applicable. The outcome of got worse and worse was not reported and on an unspecified date the patient ended up passing away. This report was serious (Death).; Sender's Comments: V0: 20221243958-Ended up passing away. Insufficient information is available to make a causality assessment. Therefore, this event is considered unclassifiable.; Reported Cause(s) of Death: UNKNOWN CAUSE OF DEATH",Y,,,,,,,,N,,,,,UNK,,,,,,USJNJFOC20221243958,2,12/22/2022,,,,,COVID19,JANSSEN,,1,,,COVID19 (COVID19 (JANSSEN)),Death,25.1,General physical health deterioration,25.1,,,,,,
375562,2541334,12/23/2022,,,,,M,,"HEART FAILURE; This spontaneous report received from a consumer via a company representative via social media concerned a 18 year old male of an unspecified race and ethnicity. The patient's weight, height, and medical history were not reported. The patient received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, and batch number were not reported, expiry: unknown) dose was not reported, 1 total, start therapy date were not reported for covid-19 prophylaxis. The batch number was not reported. Per procedure, no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patient died from heart failure. It was unspecified if an autopsy was performed. The reporter stated that ""No, you do not have the data. Because injuries are not being reported into VAERS. I had 1 coworker whose lips and tongue went numb after his vaccine, and he nearly died. 2 others had severe tinnitus. One had hands so painful he sat there rubbing them nearly crying. Another had he and his wife both experiencing numb hands with loss of grip. Another coworker's wife has myocarditis. My supervisor's daughter had her 18 year old best friend die of heart failure after his vaccine. These adverse events are not rare, look in every comment section about Covid vaccines. And do not give me that ""anecdotal"" stuff. Big pharma can not hide behind that lie forever "". The action taken with covid-19 vaccine ad26.cov2.s was not applicable. This report was serious (Death). This case, from the same reporter is linked to 20221243340, 20221243356, 20221243261, 20221243606, 20221245881 and 20221245969.; Sender's Comments: V0: 20221245816- Heart failure. The event has an unknown/unclear temporal relationship, is unlabeled, and has unknown scientific plausibility. There is no information on any other factors potentially associated with the event. Therefore, the WHO Causality is considered indeterminate. The company causality is considered unassessable.; Reported Cause(s) of Death: HEART FAILURE",Y,,,,,,,,N,,,,,UNK,,,,,,USJNJFOC20221245816,2,12/22/2022,,,,,COVID19,JANSSEN,,1,,,COVID19 (COVID19 (JANSSEN)),Cardiac failure,25.1,,,,,,,,
375647,2541439,12/23/2022,NY,75.0,75.0,,M,,Cardiac arrest/heart attack,Y,02/10/2022,,,,,,,N,09/11/2021,02/01/2022,143.0,,PVT,,Unknown,NONE,Was cleared of COPD by doctor,,,2,12/23/2022,,,,NONE,COVID19,PFIZER\BIONTECH,FC3183,1,IM,,COVID19 (COVID19 (PFIZER-BIONTECH)),Cardiac arrest,25.1,Myocardial infarction,25.1,,,,,,


Removing duplicate data

In [24]:
pd.set_option('display.max_colwidth', None)
r = rr.drop_duplicates(subset=['VAERS_ID'],keep='first')
r[['VAERS_ID','SYMPTOM_TEXT']]


Unnamed: 0,VAERS_ID,SYMPTOM_TEXT
606,1997395,"Hospitalized for fever, seizure, pneumonia 9/3/21 Death by cardiac arrest from blood clot on September 16, 2021"
669,1997432,"Soon after getting J&J Booster, Patient started complaining about shortness of breath that would come and go. On 12/22/2021 he was feeling like ""crap"" and thought it was COVID and was waiting to get tested. We found him dead in his apartment, and the autopsy revealed pulmonary thrombo embolism."
826,2501714,Narrative: hospice pt
901,2504173,Narrative: hospice pt
977,2504256,Narrative: Hospice pt
...,...,...
375550,2541324,"DIED; This spontaneous report received from a consumer via a company representative through social media concerned multiple patients of an unspecified age, sex, race and ethnicity. The patient's weight, height, and medical history were not reported. The patients received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, and batch number were not reported, expiry: unknown) dose not reported,1 total, administered on an unspecified date for covid-19 prophylaxis. The batch number was not reported. Per procedure, no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patients died from unknown cause of death after they were fully vaccinated. It was unspecified if an autopsy was performed. The reporter stated that, ""They were right the only people that I know who have died are fully vaccinated"". The action taken with covid-19 vaccine ad26.cov2.s was not applicable. This report was serious (Death).; Sender's Comments: V0-20221243109-Died. Insufficient information is available to make a causality assessment. Therefore, this event is considered unclassifiable.; Reported Cause(s) of Death: UNKNOWN CAUSE OF DEATH"
375554,2541326,"ENDED UP PASSING AWAY; GOT WORSE AND WORSE; This spontaneous report received from a consumer via a company representative via social media concerned a male of unspecified age, race and ethnicity. The patient's weight, height, and medical history were not reported. The patient received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, batch number and expiry were not reported) dose, start therapy date were not reported, 1 total, administered for covid-19 prophylaxis. The batch number was not reported. Per procedure no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patient got worse and worse and on an unspecified date patient ended up passing away. It was reported that ""My husband got thanks j j shot too years ago and then he got worse and worse and ended up passing away"". On an unspecified date, the patient died from unknown cause of death. It was unknown whether an autopsy was performed. The action taken with covid-19 vaccine ad26.cov2.s was not applicable. The outcome of got worse and worse was not reported and on an unspecified date the patient ended up passing away. This report was serious (Death).; Sender's Comments: V0: 20221243958-Ended up passing away. Insufficient information is available to make a causality assessment. Therefore, this event is considered unclassifiable.; Reported Cause(s) of Death: UNKNOWN CAUSE OF DEATH"
375562,2541334,"HEART FAILURE; This spontaneous report received from a consumer via a company representative via social media concerned a 18 year old male of an unspecified race and ethnicity. The patient's weight, height, and medical history were not reported. The patient received covid-19 vaccine ad26.cov2.s (suspension for injection, route of admin, and batch number were not reported, expiry: unknown) dose was not reported, 1 total, start therapy date were not reported for covid-19 prophylaxis. The batch number was not reported. Per procedure, no follow-up will be requested for this case. No concomitant medications were reported. On an unspecified date, the patient died from heart failure. It was unspecified if an autopsy was performed. The reporter stated that ""No, you do not have the data. Because injuries are not being reported into VAERS. I had 1 coworker whose lips and tongue went numb after his vaccine, and he nearly died. 2 others had severe tinnitus. One had hands so painful he sat there rubbing them nearly crying. Another had he and his wife both experiencing numb hands with loss of grip. Another coworker's wife has myocarditis. My supervisor's daughter had her 18 year old best friend die of heart failure after his vaccine. These adverse events are not rare, look in every comment section about Covid vaccines. And do not give me that ""anecdotal"" stuff. Big pharma can not hide behind that lie forever "". The action taken with covid-19 vaccine ad26.cov2.s was not applicable. This report was serious (Death). This case, from the same reporter is linked to 20221243340, 20221243356, 20221243261, 20221243606, 20221245881 and 20221245969.; Sender's Comments: V0: 20221245816- Heart failure. The event has an unknown/unclear temporal relationship, is unlabeled, and has unknown scientific plausibility. There is no information on any other factors potentially associated with the event. Therefore, the WHO Causality is considered indeterminate. The company causality is considered unassessable.; Reported Cause(s) of Death: HEART FAILURE"
375647,2541439,Cardiac arrest/heart attack


# Number of unique VAERS ID

In [25]:
VID = VAERSM.drop_duplicates(subset=['VAERS_ID'],keep='first')
print(len(VID))

240841


# Number of individuals with "stroke" listed as a symptom after receiving a vaccine

In [26]:
stst = VID[VID['SYMPTOM_TEXT'].str.contains('stroke',na=False, flags=re.IGNORECASE, regex=True)]
print(len(stst))


2099


# Number of individuals with "lymph node" listed as a symptom after receiving a vaccine

In [27]:
lnln = VID[VID['SYMPTOM_TEXT'].str.contains('lymph node',na=False, flags=re.IGNORECASE, regex=True)]
print(len(lnln))

3709


# Number of individuals with "heart attack" listed as a symptom after receiving a vaccine

In [28]:
htht = VID[VID['SYMPTOM_TEXT'].str.contains('heart attack',na=False, flags=re.IGNORECASE, regex=True)]
print(len(htht))

981


# Number of individuals with "myocarditis" listed as a symptom after receiving a vaccine

In [29]:
mymy = VID[VID['SYMPTOM_TEXT'].str.contains('myocarditis',na=False, flags=re.IGNORECASE, regex=True)]
print(len(mymy))



1028


# Number of individuals with "blood clot" listed as a symptom after receiving a vaccine

In [30]:
bcbc = VID[VID['SYMPTOM_TEXT'].str.contains('blood clot',na=False, flags=re.IGNORECASE, regex=True)]
print(len(bcbc))

1713


# Number of individuals who were hospitalised after receiving a vaccine

In [31]:
hh = VID.query('HOSPITAL=="Y"')
print(len(hh))

28225


# Number of individuals who received a Moderna vaccine


In [32]:
mdmd = VID[VID['VAX_MANU'].str.contains('MODERNA',na=False, flags=re.IGNORECASE, regex=True)]
print(len(mdmd))

88443


# Number of Moderna doses were received for the Moderna vaccine 

In [33]:
# Calculate the total number of doses of the MODERNA COVID-19 vaccine that have been administered
mdnd = len(VID[(VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'] == 'MODERNA')])

# Print the total number of doses of the MODERNA COVID-19 vaccine that have been administered
print(mdnd)

82529


# Number of individuals who received the Moderna vaccine and died

In [34]:
mdde = VID[VID['VAX_MANU'].str.contains('MODERNA',na=False, flags=re.IGNORECASE, regex=True) & (VID['DIED'] == 'Y')]
print(f'Number of individuals who died after receiving the PFIZER/BIONTECH COVID-19 vaccine: {len(mdde)}')

Number of individuals who died after receiving the PFIZER/BIONTECH COVID-19 vaccine: 2758


# Probability of death after taking a Moderna vaccine

In [35]:
print(len(mdde)/len(mdmd))

0.031183926370656808


# Number of individuals who received a PFIZER\BIONTECH vaccine

In [36]:
pfbn = VID[VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE))]
print(f'Number of individuals who received the Pfizer/Biontech COVID-19 vaccine: {len(pfbn)}')

Number of individuals who received the Pfizer/Biontech COVID-19 vaccine: 108929


# Number of individuals who received the PFIZER\BIONTECH vaccine and died

In [37]:
pfbnde = VID[VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE)) & (VID['DIED'] == 'Y')]
print(f'Number of individuals who died after receiving the PFIZER/BIONTECH COVID-19 vaccine: {len(pfbnde)}')

Number of individuals who died after receiving the PFIZER/BIONTECH COVID-19 vaccine: 2730


# Probability of death after taking a Pzifer/Biontech vaccine 

In [38]:
print(len(pfbnde)/len(pfbn))

0.025062196476604025


# Number of individuals with "disabled" listed as a symptom after receiving a vaccine

In [39]:
dd = VID.query('DISABLE=="Y"')
print(len(dd))

5299


# Number of individual birth defects after receiving a vaccine

In [40]:
bde = VID.query('BIRTH_DEFECT=="Y"')
print(len(bde))

141


# Number of individuals who received a COVID vaccine 

In [41]:
cv19 = VID[VID['VAX_TYPE'].str.contains('COVID19',na=False, flags=re.IGNORECASE, regex=True)]
print(len(cv19))

207411


# Number of individual males

In [42]:
mm = VID.query('SEX=="M"')
print(len(mm))

87106


# Number of indvidual females

In [43]:
ff = VID.query('SEX=="F"')
print(len(ff))

134582


# Number of individual undisclosed genders

In [44]:
other_genders = VID[~VID['SEX'].isin(['M', 'F'])]
print(f'Number of individuals with a gender that is not "M" or "F": {len(other_genders)}')

Number of individuals with a gender that is not "M" or "F": 19153


# Number of individuals who died who received a vaccine

In [45]:
print(len(r))

6378


# Mean age of individuals who have died

In [46]:
mean_age_of_deaths = VID[VID['DIED'] == 'Y']['AGE_YRS'].mean()
print(f'Mean age of deaths: {mean_age_of_deaths}')

Mean age of deaths: 73.68455412907703


# Median age of individuals who have died

In [47]:
median_age_of_deaths = VID[VID['DIED'] == 'Y']['AGE_YRS'].median()
print(f'Median age of deaths: {median_age_of_deaths}')

Median age of deaths: 76.0


# Standard deviation of the age of individuals who have died

In [48]:
std_age_of_deaths = VID[VID['DIED'] == 'Y']['AGE_YRS'].std()
print(f'Standard deviation of age of deaths: {std_age_of_deaths}')

Standard deviation of age of deaths: 15.306238683167143


# Calculate the minimum and maximum ages of individuals who have died

In [49]:
min_age_of_deaths = VID[VID['DIED'] == 'Y']['AGE_YRS'].min()
max_age_of_deaths = VID[VID['DIED'] == 'Y']['AGE_YRS'].max()
print(f'Min age of deaths: {min_age_of_deaths}, Max age of deaths: {max_age_of_deaths}')

Min age of deaths: 0.08, Max age of deaths: 107.0


# The probability of individuals who were hospitalised after receiving a vaccine

In [50]:
hv = len(hh)/len(VID)
print(hv)

0.11719350110653917


# The probability of individuals who were disabled after receiving a vaccine

In [51]:
dv = len(dd)/len(VID)
print(dv)

0.0220020677542445


# The probability of individuals with "myocarditis" listed as a symptom after receiving vaccine

In [52]:
mv = len(mymy)/len(VID)
print(mv)

0.004268376231621692


# The probability of death given that the individual received a vaccine  

In [53]:
print(len(r)/len(VID))

0.026482201950664547


# Number of individuals with "stroke" listed as a symptom after receiving the COVID-19 vaccine

In [54]:
# Calculate the number of individuals with "stroke" listed as a symptom after receiving the COVID-19 vaccine
cvst = VID[(VID['SYMPTOM_TEXT'].str.contains('stroke',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19')]
print(f'Number of individuals with "stroke" listed as a symptom after receiving the COVID-19 vaccine: {len(cvst)}')



Number of individuals with "stroke" listed as a symptom after receiving the COVID-19 vaccine: 1912


# Number of individuals with "lymph node" listed as a symptom after receiving the COVID-19 vaccine

In [55]:
# Calculate the number of individuals with "lymph node" listed as a symptom after receiving the COVID-19 vaccine
cvln = VID[(VID['SYMPTOM_TEXT'].str.contains('lymph node',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19')]
print(f'Number of individuals with "lymph node" listed as a symptom after receiving the COVID-19 vaccine: {len(cvln)}')

Number of individuals with "lymph node" listed as a symptom after receiving the COVID-19 vaccine: 3266


# Number of individuals with "heart attack" listed as a symptom after receiving the COVID-19 vaccine

In [56]:
# Calculate the number of individuals with "heart attack" listed as a symptom after receiving the COVID-19 vaccine
cvha = VID[(VID['SYMPTOM_TEXT'].str.contains('heart attack',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19')]
print(f'Number of individuals with "heart attack" listed as a symptom after receiving the COVID-19 vaccine: {len(cvha)}')

Number of individuals with "heart attack" listed as a symptom after receiving the COVID-19 vaccine: 891


# Number of individuals with "myocarditis" listed as a symptom after receiving the COVID-19 vaccine

In [57]:
# Calculate the number of individuals with "myocarditis" listed as a symptom after receiving the COVID-19 vaccine
cvma = VID[(VID['SYMPTOM_TEXT'].str.contains('myocarditis',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19')]
print(f'Number of individuals with "myocarditis" listed as a symptom after receiving the COVID-19 vaccine: {len(cvma)}')

Number of individuals with "myocarditis" listed as a symptom after receiving the COVID-19 vaccine: 967


# Number of individuals with "blood clot" listed as a symptom after receiving the COVID-19 vaccine

In [58]:
# Calculate the number of individuals with "blood clot" listed as a symptom after receiving the COVID-19 vaccine
cvbc = VID[(VID['SYMPTOM_TEXT'].str.contains('blood clot',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19')]
print(f'Number of individuals with "blood clot" listed as a symptom after receiving the COVID-19 vaccine: {len(cvbc)}')

Number of individuals with "blood clot" listed as a symptom after receiving the COVID-19 vaccine: 1631


# Number of individuals with "stroke" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine

In [59]:
# Calculate the number of individuals with "stroke" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine
cvstpf = VID[(VID['SYMPTOM_TEXT'].str.contains('stroke',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE)))]
print(f'Number of individuals with "stroke" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: {len(cvstpf)}')

Number of individuals with "stroke" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: 923


# Number of individuals with "stroke" listed as a symptom after receiving the Moderna COVID-19 vaccine

In [60]:
# Calculate the number of individuals with "stroke" listed as a symptom after receiving the Moderna COVID-19 vaccine
cvstma = VID[(VID['SYMPTOM_TEXT'].str.contains('stroke',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('MODERNA', flags=re.IGNORECASE)))]
print(f'Number of individuals with "stroke" listed as a symptom after receiving the Moderna COVID-19 vaccine: {len(cvstma)}')

Number of individuals with "stroke" listed as a symptom after receiving the Moderna COVID-19 vaccine: 769


# Number of individuals with "lymph nodes" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine

In [61]:
# Calculate the number of individuals with "lymph nodes" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine
cvlnpf = VID[(VID['SYMPTOM_TEXT'].str.contains('lymph node',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE)))]
print(f'Number of individuals with "lymph node" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: {len(cvlnpf)}')

Number of individuals with "lymph node" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: 2095


# Number of individuals with "lymph node" listed as a symptom after receiving the Moderna COVID-19 vaccine

In [62]:
# Calculate the number of individuals with "lymph node" listed as a symptom after receiving the Moderna COVID-19 vaccine
cvlnma = VID[(VID['SYMPTOM_TEXT'].str.contains('lymph node',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('MODERNA', flags=re.IGNORECASE)))]
print(f'Number of individuals with "lymph node" listed as a symptom after receiving the Moderna COVID-19 vaccine: {len(cvlnma)}')

Number of individuals with "lymph node" listed as a symptom after receiving the Moderna COVID-19 vaccine: 1092


# Number of individuals with "heart attack" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine

In [63]:
# Calculate the number of individuals with "heart attack" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine
cvhapf = VID[(VID['SYMPTOM_TEXT'].str.contains('heart attack',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE)))]
print(f'Number of individuals with "heart attack" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: {len(cvhapf)}')

Number of individuals with "heart attack" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: 493


# Number of individuals with "heart attack" listed as a symptom after receiving the Moderna COVID-19 vaccine

In [64]:
# Calculate the number of individuals with "heart attack" listed as a symptom after receiving the Moderna COVID-19 vaccine
cvhama = VID[(VID['SYMPTOM_TEXT'].str.contains('heart attack',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('MODERNA', flags=re.IGNORECASE)))]
print(f'Number of individuals with "heart attack" listed as a symptom after receiving the Moderna COVID-19 vaccine: {len(cvhama)}')

Number of individuals with "heart attack" listed as a symptom after receiving the Moderna COVID-19 vaccine: 307


# Number of individuals with "myocarditis" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine

In [65]:
# Calculate the number of individuals with "myocarditis" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine
cvmypf = VID[(VID['SYMPTOM_TEXT'].str.contains('myocarditis',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE)))]
print(f'Number of individuals with "myocarditis" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: {len(cvmypf)}')

Number of individuals with "myocarditis" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: 530


# Number of individuals with "myocarditis" listed as a symptom after receiving the Moderna COVID-19 vaccine

In [66]:
# Calculate the number of individuals with "myocarditis" listed as a symptom after receiving the Moderna COVID-19 vaccine
cvmyma = VID[(VID['SYMPTOM_TEXT'].str.contains('myocarditis',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('MODERNA', flags=re.IGNORECASE)))]
print(f'Number of individuals with "myocarditis" listed as a symptom after receiving the Moderna COVID-19 vaccine: {len(cvmyma)}')

Number of individuals with "myocarditis" listed as a symptom after receiving the Moderna COVID-19 vaccine: 381


# Number of individuals with "blood clot" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine

In [67]:
# Calculate the number of individuals with "blood clot" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine
cvbcpf = VID[(VID['SYMPTOM_TEXT'].str.contains('blood clot',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('PFIZER\\\\BIONTECH', flags=re.IGNORECASE)))]
print(f'Number of individuals with "blood clot" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: {len(cvbcpf)}')

Number of individuals with "blood clot" listed as a symptom after receiving the Pfizer/Biontech COVID-19 vaccine: 748


# Number of individuals with "blood clot" listed as a symptom after receiving the Moderna COVID-19 vaccine

In [68]:
# Calculate the number of individuals with "blood clot" listed as a symptom after receiving the Moderna COVID-19 vaccine
cvbcma = VID[(VID['SYMPTOM_TEXT'].str.contains('blood clot',na=False, flags=re.IGNORECASE, regex=True)) & (VID['VAX_TYPE'] == 'COVID19') & (VID['VAX_MANU'].str.contains(re.compile('MODERNA', flags=re.IGNORECASE)))]
print(f'Number of individuals with "blood clot" listed as a symptom after receiving the Moderna COVID-19 vaccine: {len(cvbcma)}')

Number of individuals with "blood clot" listed as a symptom after receiving the Moderna COVID-19 vaccine: 541


# Number of individuals who died after receiving the COVID-19 vaccine

In [69]:
cvde = VID[(VID['VAX_TYPE'] == 'COVID19') & (VID['DIED'] == 'Y')]
# Print the number of individuals who died after receiving the COVID-19 vaccine
print(f'Number of individuals who died after receiving the COVID-19 vaccine: {len(cvde)}')

Number of individuals who died after receiving the COVID-19 vaccine: 6088


# The probability of individuals aquiring a "stroke" after receiving a COVID-19 vaccine

In [70]:
print(len(cvst)/len(cv19))

0.009218411752510716


# The probability of individuals aquiring a "lymph node" after receiving a COVID-19 vaccine

In [71]:
print(len(cvln)/len(cv19))

0.01574651296218619


# The probability of individuals aquiring a "heart attack" after receiving a COVID-19 vaccine

In [72]:
print(len(cvha)/len(cv19))

0.004295818447430464


# The probability of individuals aquiring a "myocarditis" after receiving a COVID-19 vaccine

In [73]:
print(len(cvma)/len(cv19))

0.004662240671902647


# The probability of individuals aquiring a "blood clot" after receiving a COVID-19 vaccine

In [74]:
print(len(cvbc)/len(cv19))

0.007863613790975407


# The probability of dying after receiving the COVID-19 vaccine

In [75]:
print(len(cvde)/len(cv19))

0.029352348718245415
