# This file outlines the framework for the project described below.
### It contains one block of code per year that cleans and merges that year's data so that everything can be combined into a single file for analysis. This code will serve as an outline for automating the cleaning and merging with a for loop.

This project covers the data wrangling of VAERS vaccine reports from 1990 to 2022. Vaccine injuries are reported to the CDC and the FDA via VAERS, an early warning system used to detect potential safety problems with vaccines.

The data used can be found at https://vaers.hhs.gov/data.html

The data consists of 3 files for each year since 1990: YEARVAERSVAX, YEARVAERSDATA and YEARVAERSSYMPTOMS (where YEAR is the four-digit year, e.g. 1990VAERSDATA). For the purpose of this analysis I did not find the data in VAERSSYMPTOMS to be quantifiable, so that data was dropped.

In [2]:
import pandas as pd

# 1990:

### Import the data sets

In [106]:
# Load the 1990 VAERSDATA file, decoding it as Windows-1252 (cp1252).
vaersdata90 = pd.read_csv(
    'C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1990/1990VAERSDATA.csv',
    encoding='cp1252',
)

In [107]:
# Load the 1990 VAERSVAX file, decoding it as Windows-1252 (cp1252).
vaersvax90 = pd.read_csv(
    'C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1990/1990VAERSVAX.csv',
    encoding='cp1252',
)

### Condense the two data sets down to useful information for analysis

In [108]:
# Columns kept from the VAERSVAX table; VAERS_ID is the key used for the merge below.
vax_columns = ['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']
vax90 = vaersvax90[vax_columns]

In [109]:
# Columns kept from the VAERSDATA table; VAERS_ID is the key used for the merge below.
data_columns = ['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']
data90 = vaersdata90[data_columns]

### Merge the condensed datasets

In [110]:
# Join the vaccine rows to their report rows on the shared VAERS_ID key
# (no `how` is given, so pandas uses its default join type).
vaers1990 = vax90.merge(data90, on='VAERS_ID')

In [111]:
# Tag every row of the merged 1990 table with its year so rows stay
# identifiable once the years are concatenated.
vaers1990 = vaers1990.assign(Year=1990)

### Save the merged dataset for the year with UTF-8 encoding

In [112]:
# Save the merged 1990 table to its own per-year file, encoded as UTF-8.
vaers1990.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1990.csv', encoding = 'utf-8')

# 1991:

### Import the data sets

In [113]:
vaersdata91 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1991/1991VAERSDATA.csv',encoding = 'cp1252')

In [114]:
vaersvax91 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1991/1991VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [115]:
vax91 = vaersvax91[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [116]:
data91 = vaersdata91[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [117]:
vaers1991 = pd.merge(vax91, data91, on= 'VAERS_ID')

In [118]:
# The combined datasets do not have a variable to identify them by year.
# This adds the respective year to each file that is combined by year.
vaers1991['Year'] = 1991

In [119]:
# Saving the progress of each year combined file
vaers1991.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1991.csv', encoding = 'utf-8')

In [120]:
# Concatenating the newly combined year onto the cumulative DataFrame
vaers90_91 = pd.concat([vaers1990, vaers1991])

# 1992:

### Import the data sets

In [121]:
vaersdata92 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1992/1992VAERSDATA.csv',encoding = 'cp1252')

In [122]:
vaersvax92 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1992/1992VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [123]:
vax92 = vaersvax92[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [124]:
data92 = vaersdata92[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [125]:
vaers1992 = pd.merge(vax92, data92, on= 'VAERS_ID')

In [126]:
vaers1992['Year'] = 1992

In [127]:
vaers1992.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1992.csv', encoding = 'utf-8')

In [128]:
vaers90_92 = pd.concat([vaers90_91, vaers1992])

# 1993:

### Import the data sets

In [129]:
vaersdata93 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1993/1993VAERSDATA.csv',encoding = 'cp1252')

In [130]:
vaersvax93 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1993/1993VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [131]:
vax93 = vaersvax93[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [132]:
data93 = vaersdata93[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [133]:
vaers1993 = pd.merge(vax93, data93, on= 'VAERS_ID')

In [134]:
vaers1993['Year'] = 1993

In [135]:
vaers1993.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1993.csv', encoding = 'utf-8')

In [136]:
vaers90_93 = pd.concat([vaers90_92, vaers1993])

# 1994:

### Import the data sets

In [137]:
vaersdata94 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1994/1994VAERSDATA.csv',encoding = 'cp1252')

In [138]:
vaersvax94 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1994/1994VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [139]:
vax94 = vaersvax94[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [140]:
data94 = vaersdata94[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [141]:
vaers1994 = pd.merge(vax94, data94, on= 'VAERS_ID')

In [142]:
vaers1994['Year'] = 1994

In [143]:
vaers1994.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1994.csv', encoding = 'utf-8')

In [144]:
vaers90_94 = pd.concat([vaers90_93, vaers1994])

# 1995:

### Import the data sets

In [145]:
vaersdata95 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1995/1995VAERSDATA.csv',encoding = 'cp1252')

In [146]:
vaersvax95 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1995/1995VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [147]:
vax95 = vaersvax95[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [148]:
data95 = vaersdata95[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [149]:
vaers1995 = pd.merge(vax95, data95, on= 'VAERS_ID')

In [150]:
# Tag every row of the merged 1995 table with its own year.
vaers1995['Year'] = 1995

In [151]:
vaers1995.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1995.csv', encoding = 'utf-8')

In [152]:
vaers90_95 = pd.concat([vaers90_94, vaers1995])

# 1996:

### Import the data sets

In [153]:
vaersdata96 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1996/1996VAERSDATA.csv',encoding = 'cp1252')

In [154]:
vaersvax96 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1996/1996VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [155]:
vax96 = vaersvax96[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [156]:
data96 = vaersdata96[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [157]:
vaers1996 = pd.merge(vax96, data96, on= 'VAERS_ID')

In [158]:
vaers1996['Year'] = 1996

In [159]:
vaers1996.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1996.csv', encoding = 'utf-8')

In [160]:
vaers90_96 = pd.concat([vaers90_95, vaers1996])

# 1997:

### Import the data sets

In [161]:
vaersdata97 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1997/1997VAERSDATA.csv',encoding = 'cp1252')

In [162]:
vaersvax97 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1997/1997VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [163]:
vax97 = vaersvax97[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [164]:
data97 = vaersdata97[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [165]:
vaers1997 = pd.merge(vax97, data97, on= 'VAERS_ID')

In [166]:
vaers1997['Year'] = 1997

In [167]:
vaers1997.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1997.csv', encoding = 'utf-8')

In [168]:
vaers90_97 = pd.concat([vaers90_96, vaers1997])

# 1998:

### Import the data sets

In [169]:
vaersdata98 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1998/1998VAERSDATA.csv',encoding = 'cp1252')

In [170]:
vaersvax98 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1998/1998VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [171]:
vax98 = vaersvax98[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [172]:
data98 = vaersdata98[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [173]:
vaers1998 = pd.merge(vax98, data98, on= 'VAERS_ID')

In [174]:
vaers1998['Year'] = 1998

In [175]:
vaers1998.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1998.csv', encoding = 'utf-8')

In [176]:
vaers90_98 = pd.concat([vaers90_97, vaers1998])

# 1999:

### Import the data sets

In [177]:
vaersdata99 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1999/1999VAERSDATA.csv',encoding = 'cp1252')

In [178]:
vaersvax99 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/1999/1999VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [179]:
vax99 = vaersvax99[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [180]:
data99 = vaersdata99[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [181]:
vaers1999 = pd.merge(vax99, data99, on= 'VAERS_ID')

In [182]:
vaers1999['Year'] = 1999

In [183]:
vaers1999.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers1999.csv', encoding = 'utf-8')

In [184]:
vaers90_99 = pd.concat([vaers90_98, vaers1999])

# 2000:

### Import the data sets

In [185]:
vaersdata00 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2000/2000VAERSDATA.csv',encoding = 'cp1252')

In [186]:
vaersvax00 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2000/2000VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [187]:
vax00 = vaersvax00[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [188]:
data00 = vaersdata00[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [189]:
vaers2000 = pd.merge(vax00, data00, on= 'VAERS_ID')

In [190]:
vaers2000['Year'] = 2000

In [191]:
vaers2000.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2000.csv', encoding = 'utf-8')

In [192]:
vaers90_00 = pd.concat([vaers90_99, vaers2000])

# 2001:

### Import the data sets

In [193]:
vaersdata01 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2001/2001VAERSDATA.csv',encoding = 'cp1252')

In [194]:
vaersvax01 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2001/2001VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [195]:
vax01 = vaersvax01[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [196]:
data01 = vaersdata01[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [197]:
vaers2001 = pd.merge(vax01, data01, on= 'VAERS_ID')

In [198]:
vaers2001['Year'] = 2001

In [199]:
vaers2001.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2001.csv', encoding = 'utf-8')

In [200]:
vaers90_01 = pd.concat([vaers90_00, vaers2001])

# 2002:

### Import the data sets

In [201]:
vaersdata02 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2002/2002VAERSDATA.csv',encoding = 'cp1252')

In [202]:
vaersvax02 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2002/2002VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [203]:
vax02 = vaersvax02[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [204]:
data02 = vaersdata02[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [205]:
vaers2002 = pd.merge(vax02, data02, on= 'VAERS_ID')

In [206]:
vaers2002['Year'] = 2002

In [207]:
vaers2002.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2002.csv', encoding = 'utf-8')

In [208]:
vaers90_02 = pd.concat([vaers90_01, vaers2002])

# 2003:

### Import the data sets

In [209]:
vaersdata03 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2003/2003VAERSDATA.csv',encoding = 'cp1252')

In [210]:
vaersvax03 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2003/2003VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [211]:
vax03 = vaersvax03[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [212]:
data03 = vaersdata03[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [213]:
vaers2003 = pd.merge(vax03, data03, on= 'VAERS_ID')

In [214]:
vaers2003['Year'] = 2003

In [215]:
vaers2003.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2003.csv', encoding = 'utf-8')

In [216]:
vaers90_03 = pd.concat([vaers90_02, vaers2003])

# 2004:

### Import the data sets

In [217]:
vaersdata04 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2004/2004VAERSDATA.csv',encoding = 'cp1252')

In [218]:
vaersvax04 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2004/2004VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [219]:
vax04 = vaersvax04[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [220]:
data04 = vaersdata04[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [221]:
vaers2004 = pd.merge(vax04, data04, on= 'VAERS_ID')

In [222]:
vaers2004['Year'] = 2004

In [223]:
vaers2004.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2004.csv', encoding = 'utf-8')

In [224]:
vaers90_04 = pd.concat([vaers90_03, vaers2004])

# 2005:

### Import the data sets

In [225]:
vaersdata05 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2005/2005VAERSDATA.csv',encoding = 'cp1252')

In [226]:
vaersvax05 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2005/2005VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [227]:
vax05 = vaersvax05[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [228]:
data05 = vaersdata05[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [229]:
vaers2005 = pd.merge(vax05, data05, on= 'VAERS_ID')

In [230]:
vaers2005['Year'] = 2005

In [231]:
vaers2005.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2005.csv', encoding = 'utf-8')

In [232]:
vaers90_05 = pd.concat([vaers90_04, vaers2005])

# 2006:

### Import the data sets

In [233]:
vaersdata06 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2006/2006VAERSDATA.csv',encoding = 'cp1252')

In [234]:
vaersvax06 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2006/2006VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [235]:
vax06 = vaersvax06[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [236]:
data06 = vaersdata06[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [237]:
vaers2006 = pd.merge(vax06, data06, on= 'VAERS_ID')

In [238]:
vaers2006['Year'] = 2006

In [239]:
vaers2006.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2006.csv', encoding = 'utf-8')

In [240]:
vaers90_06 = pd.concat([vaers90_05, vaers2006])

# 2007:

### Import the data sets

In [241]:
vaersdata07 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2007/2007VAERSDATA.csv',encoding = 'cp1252')

In [242]:
vaersvax07 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2007/2007VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [243]:
vax07 = vaersvax07[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [244]:
data07 = vaersdata07[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [245]:
vaers2007 = pd.merge(vax07, data07, on= 'VAERS_ID')

In [246]:
vaers2007['Year'] = 2007

In [247]:
vaers2007.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2007.csv', encoding = 'utf-8')

In [248]:
vaers90_07 = pd.concat([vaers90_06, vaers2007])

# 2008:

### Import the data sets

In [249]:
vaersdata08 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2008/2008VAERSDATA.csv',encoding = 'cp1252')

In [250]:
vaersvax08 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2008/2008VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [251]:
vax08 = vaersvax08[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [252]:
data08 = vaersdata08[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [253]:
vaers2008 = pd.merge(vax08, data08, on= 'VAERS_ID')

In [254]:
vaers2008['Year'] = 2008

In [255]:
vaers2008.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2008.csv', encoding = 'utf-8')

In [256]:
vaers90_08 = pd.concat([vaers90_07, vaers2008])

# 2009:

### Import the data sets

In [257]:
vaersdata09 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2009/2009VAERSDATA.csv',encoding = 'cp1252')

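# NOTE(review): the notebook export echoed the statement above at this point, which looks like the tail of a warning raised by this read (possibly a pandas DtypeWarning) - confirm, and if so consider passing dtype= or low_memory=False.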


In [258]:
vaersvax09 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2009/2009VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [259]:
vax09 = vaersvax09[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [260]:
data09 = vaersdata09[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [261]:
vaers2009 = pd.merge(vax09, data09, on= 'VAERS_ID')

In [262]:
vaers2009['Year'] = 2009

In [263]:
vaers2009.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2009.csv', encoding = 'utf-8')

In [264]:
vaers90_09 = pd.concat([vaers90_08, vaers2009])

# 2010:

### Import the data sets

In [265]:
vaersdata10 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2010/2010VAERSDATA.csv',encoding = 'cp1252')

In [266]:
vaersvax10 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2010/2010VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [267]:
vax10 = vaersvax10[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [268]:
data10 = vaersdata10[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [269]:
vaers2010 = pd.merge(vax10, data10, on= 'VAERS_ID')

In [270]:
vaers2010['Year'] = 2010

In [271]:
vaers2010.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2010.csv', encoding = 'utf-8')

In [272]:
vaers90_10 = pd.concat([vaers90_09, vaers2010])

# 2011:

### Import the data sets

In [273]:
vaersdata11 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2011/2011VAERSDATA.csv',encoding = 'cp1252')

In [274]:
vaersvax11 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2011/2011VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [275]:
vax11 = vaersvax11[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [276]:
data11 = vaersdata11[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [277]:
vaers2011 = pd.merge(vax11, data11, on= 'VAERS_ID')

In [278]:
vaers2011['Year'] = 2011

In [279]:
vaers2011.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2011.csv', encoding = 'utf-8')

In [280]:
vaers90_11 = pd.concat([vaers90_10, vaers2011])

# 2012:

### Import the data sets

In [281]:
vaersdata12 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2012/2012VAERSDATA.csv',encoding = 'cp1252')

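# NOTE(review): the notebook export echoed the statement above at this point, which looks like the tail of a warning raised by this read (possibly a pandas DtypeWarning) - confirm, and if so consider passing dtype= or low_memory=False.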


In [282]:
vaersvax12 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2012/2012VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [283]:
vax12 = vaersvax12[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [284]:
data12 = vaersdata12[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [285]:
vaers2012 = pd.merge(vax12, data12, on= 'VAERS_ID')

In [286]:
vaers2012['Year'] = 2012

In [287]:
vaers2012.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2012.csv', encoding = 'utf-8')

In [288]:
vaers90_12 = pd.concat([vaers90_11, vaers2012])

# 2013:

### Import the data sets

In [289]:
vaersdata13 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2013/2013VAERSDATA.csv',encoding = 'cp1252')

In [290]:
vaersvax13 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2013/2013VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [291]:
vax13 = vaersvax13[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [292]:
data13 = vaersdata13[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [293]:
vaers2013 = pd.merge(vax13, data13, on= 'VAERS_ID')

In [294]:
vaers2013['Year'] = 2013

In [295]:
vaers2013.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2013.csv', encoding = 'utf-8')

In [296]:
vaers90_13 = pd.concat([vaers90_12, vaers2013])

# 2014:

### Import the data sets

In [297]:
vaersdata14 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2014/2014VAERSDATA.csv',encoding = 'cp1252')

In [298]:
vaersvax14 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2014/2014VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [299]:
vax14 = vaersvax14[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [300]:
data14 = vaersdata14[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [301]:
vaers2014 = pd.merge(vax14, data14, on= 'VAERS_ID')

In [302]:
vaers2014['Year'] = 2014

In [303]:
vaers2014.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2014.csv', encoding = 'utf-8')

In [304]:
vaers90_14 = pd.concat([vaers90_13, vaers2014])

# 2015:

### Import the data sets

In [305]:
vaersdata15 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2015/2015VAERSDATA.csv',encoding = 'cp1252')

In [306]:
vaersvax15 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2015/2015VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [307]:
vax15 = vaersvax15[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [308]:
data15 = vaersdata15[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [309]:
vaers2015 = pd.merge(vax15, data15, on= 'VAERS_ID')

In [310]:
vaers2015['Year'] = 2015

In [311]:
vaers2015.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2015.csv', encoding = 'utf-8')

In [312]:
vaers90_15 = pd.concat([vaers90_14, vaers2015])

# 2016:

### Import the data sets

In [313]:
vaersdata16 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2016/2016VAERSDATA.csv',encoding = 'cp1252')

In [314]:
vaersvax16 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2016/2016VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [315]:
vax16 = vaersvax16[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [316]:
data16 = vaersdata16[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [317]:
vaers2016 = pd.merge(vax16, data16, on= 'VAERS_ID')

In [318]:
vaers2016['Year'] = 2016

In [319]:
vaers2016.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2016.csv', encoding = 'utf-8')

In [320]:
vaers90_16 = pd.concat([vaers90_15, vaers2016])

# 2017:

### Import the data sets

In [321]:
vaersdata17 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2017/2017VAERSDATA.csv',encoding = 'cp1252')

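# NOTE(review): the notebook export echoed the statement above at this point, which looks like the tail of a warning raised by this read (possibly a pandas DtypeWarning) - confirm, and if so consider passing dtype= or low_memory=False.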


In [322]:
vaersvax17 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2017/2017VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [323]:
vax17 = vaersvax17[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [324]:
data17 = vaersdata17[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [325]:
vaers2017 = pd.merge(vax17, data17, on= 'VAERS_ID')

In [326]:
vaers2017['Year'] = 2017

In [327]:
vaers2017.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2017.csv', encoding = 'utf-8')

In [328]:
vaers90_17 = pd.concat([vaers90_16, vaers2017])

# 2018:

### Import the data sets

In [329]:
vaersdata18 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2018/2018VAERSDATA.csv',encoding = 'cp1252')

In [330]:
vaersvax18 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2018/2018VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [331]:
vax18 = vaersvax18[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [332]:
data18 = vaersdata18[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [333]:
vaers2018 = pd.merge(vax18, data18, on= 'VAERS_ID')

In [334]:
vaers2018['Year'] = 2018

In [335]:
vaers2018.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2018.csv', encoding = 'utf-8')

In [336]:
vaers90_18 = pd.concat([vaers90_17, vaers2018])

# 2019:

### Import the data sets

In [337]:
vaersdata19 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2019/2019VAERSDATA.csv',encoding = 'cp1252')

In [338]:
vaersvax19 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2019/2019VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [339]:
vax19 = vaersvax19[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [340]:
data19 = vaersdata19[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [341]:
vaers2019 = pd.merge(vax19, data19, on= 'VAERS_ID')

In [342]:
vaers2019['Year'] = 2019

In [343]:
vaers2019.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2019.csv', encoding = 'utf-8')

In [344]:
vaers90_19 = pd.concat([vaers90_18, vaers2019])

# 2020:

### Import the data sets

In [345]:
vaersdata20 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2020/2020VAERSDATA.csv',encoding = 'cp1252')

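# NOTE(review): the notebook export echoed the statement above at this point, which looks like the tail of a warning raised by this read (possibly a pandas DtypeWarning) - confirm, and if so consider passing dtype= or low_memory=False.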


In [346]:
vaersvax20 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2020/2020VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [347]:
vax20 = vaersvax20[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [348]:
data20 = vaersdata20[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [349]:
vaers2020 = pd.merge(vax20, data20, on= 'VAERS_ID')

In [350]:
vaers2020['Year'] = 2020

In [351]:
vaers2020.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2020.csv', encoding = 'utf-8')

In [352]:
vaers90_20 = pd.concat([vaers90_19, vaers2020])

# 2021:

### Import the data sets

In [3]:
# Load the 2021 VAERSDATA file, decoding it as Windows-1252 (cp1252) like
# every other VAERS file read in this notebook.
vaersdata21 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2021/2021VAERSDATA.csv',encoding = 'cp1252')

FileNotFoundError: [Errno 2] No such file or directory: 'C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2021/2021VAERSDATA.csv'

In [None]:
vaersvax21 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2021/2021VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [None]:
vax21 = vaersvax21[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [None]:
data21 = vaersdata21[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [None]:
vaers2021 = pd.merge(vax21, data21, on= 'VAERS_ID')

In [None]:
vaers2021['Year'] = 2021

In [None]:
vaers2021.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2021.csv', encoding = 'utf-8')

In [None]:
vaers90_21 = pd.concat([vaers90_20, vaers2021])

# 2022:

### Import the data sets

In [None]:
vaersdata22 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2022/2022VAERSDATA.csv',encoding = 'cp1252')

In [None]:
vaersvax22 = pd.read_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS-data/2022/2022VAERSVAX.csv',encoding = 'cp1252')

### Condense the two data sets down to useful information for analysis

In [None]:
vax22 = vaersvax22[['VAERS_ID', 'VAX_TYPE', 'VAX_MANU', 'VAX_LOT', 'VAX_NAME']]

In [None]:
data22 = vaersdata22[['VAERS_ID', 'AGE_YRS', 'STATE', 'SYMPTOM_TEXT', 'DIED', 'ER_VISIT']]

### Merge the condensed datasets

In [None]:
vaers2022 = pd.merge(vax22, data22, on= 'VAERS_ID')

In [None]:
vaers2022['Year'] = 2022

In [None]:
vaers2022.to_csv('C:/Users/chris/Desktop/WozU_Data_Science/VAERS_CleanData/vaers2022.csv', encoding = 'utf-8')

In [None]:
vaers90_22 = pd.concat([vaers90_21, vaers2022])