## Final Report 
### Imports

In [36]:
# Imports

# Display plots directly in the notebook instead of in a new window
%matplotlib inline

# Import libraries
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import patsy
import statsmodels.api as sm
import os 
from nltk.sentiment.vader import SentimentIntensityAnalyzer 

### Reading in the UC School csv files

In [2]:
# Read in Berekeley
df_ucb = pd.read_csv(os.path.join('Datasets', 'UC_Berkeley.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Read in Davis
df_ucd = pd.read_csv(os.path.join('Datasets', 'UC_Davis.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'text':'str', 'school':'str'})

# Read in Irvine
#df_uci = pd.read_csv(os.path.join('Datasets', 'UC_Irvine.csv'), 
#                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Read in Los Angeles
df_ucla = pd.read_csv(os.path.join('Datasets', 'UC_Los_Angeles.csv'), 
                      dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Read in Merced
df_ucm = pd.read_csv(os.path.join('Datasets', 'UC_Merced.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'content':'str', 'school':'str'})

# Read in Riverside
#df_ucr = pd.read_csv(os.path.join('Datasets', 'UC_Riverside.csv'), 
#                     dtype={'date': 'str', 'word_count':'str', 'school':'str'})

# Read in San Diego
df_ucsd = pd.read_csv(os.path.join('Datasets', 'UC_San_Diego.csv'), 
                      dtype={'date': 'str', 'word_count':'str', 'school':'str'})

# Read in Santa Barbra
df_ucsb = pd.read_csv(os.path.join('Datasets', 'UC_Santa_Barbara.csv'),
                      dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Read in Santa Cruz
df_ucsc = pd.read_csv(os.path.join('Datasets', 'UC_Santa_Cruz.csv'), 
                      dtype={'date': 'str', 'word_count':int, 'content':'str', 'school':'str'})


### Take a look at UC Berkeley 

In [3]:
# Adding a 'state' column and setting its default value to 'CA'
df_ucb['state'] = 'CA'

# Dropping the 'link' column associated with each update
df_ucb = df_ucb.drop(['link'], axis =1)

# Reordering the columns into a more readable format
df_ucb = df_ucb[['date','school','state','content','word_count']]

# Printing dataframe so we can view all entries
print(df_ucb.to_string())

           date    school state                                            content  word_count
0     18-May-20  Berkeley    CA  We are writing today to share news about budge...         397
1     16-May-20  Berkeley    CA  Members of the remarkable and resilient gradua...        1368
2     14-May-20  Berkeley    CA  A simulated Commencement 2020 will take place ...        2291
3     12-May-20  Berkeley    CA  Last Tuesday, our campus participated in #Givi...         887
4     12-May-20  Berkeley    CA  There are two major budget concerns Chancellor...         354
5      6-May-20  Berkeley    CA  We are writing today to provide an update on o...         680
6      6-May-20  Berkeley    CA  We understand that many faculty, staff, and st...         605
7      4-May-20  Berkeley    CA  Tomorrow is #GivingTuesdayNow, a new global da...         394
8   29-April-20  Berkeley    CA  The Bay Area’s shelter-in-place order has been...         247
9   23-April-20  Berkeley    CA  In response to co

### Take a look at UC Davis 

In [4]:
# Renaming text column to content
df_ucd = df_ucd.rename(columns = {'text':'content'})

# Adding a 'state' column and setting its default value to 'CA'
df_ucd['state'] = 'CA'

# Reordering the columns into a more readable format
df_ucd = df_ucd[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_ucd.to_string())

         date school state                                            content
0   31-Jan-20  Davis    CA  Fight it like the flu\nUpdated 5 p.m. Jan. 31 ...
1    1-Feb-20  Davis    CA  Yolo County info page\nYolo County, in which t...
2    3-Feb-20  Davis    CA  Screening at airports\nUpdated 9 p.m. Feb. 3  ...
3    7-Feb-20  Davis    CA  No reports of coronavirus\nUpdated 11:30 a.m. ...
4   10-Feb-20  Davis    CA  UC Davis Live\nUpdated Feb. 10 Watch UC Davis ...
5   13-Feb-20  Davis    CA  Travel FAQ\nUpdated 11:30 p.m. Feb. 13  Global...
6   25-Feb-20  Davis    CA  New travel notices\nUpdated 6:55 p.m. Feb. 25 ...
7   27-Feb-20  Davis    CA  Level 3 countries off-limits\nUpdated 7 a.m. F...
8   27-Feb-20  Davis    CA  COVID-19 patient\nUpdated 7:50 a.m. Feb. 27  I...
9   27-Feb-20  Davis    CA  3 in isolation\nUpdated 3 p.m. Feb. 27  Chance...
10  27-Feb-20  Davis    CA  Media availability\nUpdated 4 p.m. Feb. 27  UC...
11  28-Feb-20  Davis    CA  Reject xenophobia\nUpdated 10 a.m. F

### Take a look at UC Irvine 

In [5]:
# Take a look at Irvine
#df_uci['state'] = 'CA'
#df_uci.head()

### Take a look at UC Los Angeles 

In [6]:
# Adding a 'state' column and setting its default value to 'CA'
df_ucla['state'] = 'CA'

# Reordering the columns into a more readable format
df_ucla = df_ucla[['date','school','state','word_count']]

# Printing dataframe so we can view all entries
print(df_ucla.to_string())

         date       school state  word_count
0   23-Jan-20  Los Angeles    CA         318
1   31-Jan-20  Los Angeles    CA         434
2    4-Feb-20  Los Angeles    CA         402
3   20-Feb-20  Los Angeles    CA         370
4   27-Feb-20  Los Angeles    CA         220
5    2-Mar-20  Los Angeles    CA         402
6    4-Mar-20  Los Angeles    CA         635
7    5-Mar-20  Los Angeles    CA         223
8    6-Mar-20  Los Angeles    CA         495
9    6-Mar-20  Los Angeles    CA         241
10   6-Mar-20  Los Angeles    CA          81
11   7-Mar-20  Los Angeles    CA         468
12  10-Mar-20  Los Angeles    CA         759
13  12-Mar-20  Los Angeles    CA         401
14  12-Mar-20  Los Angeles    CA        1260
15  13-Mar-20  Los Angeles    CA         203
16  13-Mar-20  Los Angeles    CA        1727
17  14-Mar-20  Los Angeles    CA        2111
18  16-Mar-20  Los Angeles    CA         335
19  16-Mar-20  Los Angeles    CA         443
20  17-Mar-20  Los Angeles    CA         850
21  17-Mar

### Take a look at UC Merced 

In [7]:
# Adding a 'state' column and setting its default value to 'CA'
df_ucm['state'] = 'CA'

# Reordering the columns into a more readable format
df_ucm = df_ucm[['date','school','state','content', 'word_count']]

# Printing dataframe so we can view all entries
print(df_ucm.to_string())

         date  school state                                            content  word_count
0    4-Feb-20  Merced    CA  Coronavirus Update\nFebruary 4, 2020\nInformat...         190
1   28-Feb-20  Merced    CA  UPDATE: What You Need to Know About COVID-19\n...         457
2    6-Mar-20  Merced    CA  COVID-19: Protect Yourself and Each Other\nMar...         468
3    8-Mar-20  Merced    CA  COVID-19: University Travel Guidance\nMarch 8,...         411
4    9-Mar-20  Merced    CA  COVID-19 Instructional Continuity\nMarch 9, 20...         489
5   10-Mar-20  Merced    CA  COVID-19: Update on Academic Operations\nMarch...         191
6   10-Mar-20  Merced    CA  COVID-19 and Research Continuity at UC Merced\...         650
7   10-Mar-20  Merced    CA  COVID-19 Live Webinar Tomorrow\nMarch 10, 2020...         309
8   10-Mar-20  Merced    CA  UPDATE: Moving Toward Remote Learning\nMarch 1...         374
9   11-Mar-20  Merced    CA  UPDATE: Moving Toward Remote Learning - Studen...         457

### Take a look at UC Riverside 

In [8]:
# Adding a 'state' column and setting its default value to 'CA'
#df_ucr['state'] = 'CA'
#df_ucr.head()

### Take a look at UC San Diego 

In [9]:
# Adding a 'state' column and setting its default value to 'CA'
df_ucsd['state'] = 'CA'

# Reordering the columns into a more readable format
df_ucsd = df_ucsd[['date','school','state','word_count']]

# Printing dataframe so we can view all entries
print(df_ucsd.to_string()) # You will notice NaNs at the bottom of the data frame

         date school state word_count
0   22-Jan-20  Diego    CA        285
1   23-Jan-20  Diego    CA        507
2   27-Jan-20  Diego    CA        807
3   30-Jan-20  Diego    CA        280
4   30-Jan-20  Diego    CA        873
5   31-Jan-20  Diego    CA       1393
6    3-Feb-20  Diego    CA        799
7    5-Feb-20  Diego    CA       1485
8   14-Feb-20  Diego    CA        355
9   26-Feb-20  Diego    CA        410
10  26-Feb-20  Diego    CA        490
11  28-Feb-20  Diego    CA        694
12   4-Mar-20  Diego    CA        612
13   5-Mar-20  Diego    CA        566
14   8-Mar-20  Diego    CA        572
15   9-Mar-20  Diego    CA         59
16   9-Mar-20  Diego    CA        902
17  11-Mar-20  Diego    CA        264
18  12-Mar-20  Diego    CA        335
19  13-Mar-20  Diego    CA       1379
20  13-Mar-20  Diego    CA        348
21  13-Mar-20  Diego    CA        592
22  16-Mar-20  Diego    CA        252
23  16-Mar-20  Diego    CA        482
24  16-Mar-20  Diego    CA        843
25  17-Mar-2

In [10]:
# Dropping the empty rows at the bottom of df_ucsd
df_ucsd = df_ucsd.dropna()

# Now that the 4 rows with missing data on the bottom with the NaN values have been removed 
# We can convert word_count column back into an integer
convert_dict = {'word_count': int}
df_ucsd = df_ucsd.astype(convert_dict)

# Check out our updated df_ucsd
print(df_ucsd.to_string()) 

         date school state  word_count
0   22-Jan-20  Diego    CA         285
1   23-Jan-20  Diego    CA         507
2   27-Jan-20  Diego    CA         807
3   30-Jan-20  Diego    CA         280
4   30-Jan-20  Diego    CA         873
5   31-Jan-20  Diego    CA        1393
6    3-Feb-20  Diego    CA         799
7    5-Feb-20  Diego    CA        1485
8   14-Feb-20  Diego    CA         355
9   26-Feb-20  Diego    CA         410
10  26-Feb-20  Diego    CA         490
11  28-Feb-20  Diego    CA         694
12   4-Mar-20  Diego    CA         612
13   5-Mar-20  Diego    CA         566
14   8-Mar-20  Diego    CA         572
15   9-Mar-20  Diego    CA          59
16   9-Mar-20  Diego    CA         902
17  11-Mar-20  Diego    CA         264
18  12-Mar-20  Diego    CA         335
19  13-Mar-20  Diego    CA        1379
20  13-Mar-20  Diego    CA         348
21  13-Mar-20  Diego    CA         592
22  16-Mar-20  Diego    CA         252
23  16-Mar-20  Diego    CA         482
24  16-Mar-20  Diego    C

### Take a look at UC Santa Barbara 

In [11]:
# Adding a 'state' column and setting its default value to 'CA'
df_ucsb['state'] = 'CA'
df_ucsb = df_ucsb.drop(['link'], axis =1)

# Reordering the columns into a more readable format
df_ucsb = df_ucsb[['date','school','state','content', 'word_count']]

# Printing dataframe so we can view all entries
print(df_ucsb.to_string())

         date         school state                                            content  word_count
0   14-May-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nI...        1546
1   18-Apr-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nW...         498
2   13-Apr-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nW...         395
3   07-Apr-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nI...         484
4   02-Apr-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nI...          74
5   31-Mar-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nW...        1262
6   26-Mar-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nT...         603
7   19-Mar-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nT...         380
8   18-Mar-20  Santa Barbara    CA  Dear Members of Our Campus Community,\r\n\r\nI...         452
9   17-Mar-20  Santa

### Take a look at Santa Cruz

In [12]:
# Adding a 'state' column and setting its default value to 'CA'
df_ucsc['state'] = 'CA'

# Reordering the columns into a more readable format
df_ucsc = df_ucsc[['date','school','state','content', 'word_count']]

# Printing dataframe so we can view all entries
print(df_ucsc.to_string())

         date      school state                                            content  word_count
0   24-Jan-20  Santa Cruz    CA  The UC Santa Cruz Student Health Center offers...         414
1   30-Jan-20  Santa Cruz    CA  UC Santa Cruz health officials are closely mon...         382
2   31-Jan-20  Santa Cruz    CA  Due to the dynamic situation with the coronavi...         338
3    4-Feb-20  Santa Cruz    CA  The UC Office of the President has directed th...        1276
4    4-Feb-20  Santa Cruz    CA  To: UC Santa Cruz Community\nFrom: Public Affa...         989
5    5-Feb-20  Santa Cruz    CA  UCSF is hosting a town hall today on the novel...         273
6    7-Feb-20  Santa Cruz    CA  The UC Santa Cruz Student Health Center shared...         700
7    7-Feb-20  Santa Cruz    CA  Students: How to get a flu vaccine\nFebruary 0...         359
8   10-Feb-20  Santa Cruz    CA  Campus community members can learn more about ...         178
9   11-Feb-20  Santa Cruz    CA  Seven confirmed c

### Combining all of our UC data frames

In [13]:
# concatenating the dataframes together
df_ca = pd.concat([df_ucsc, df_ucm, df_ucd, df_ucb, df_ucsd, df_ucsb, df_ucla], sort= True)
df_ca = df_ca[['date','school','state','content', 'word_count']]

# looking at the entire dataframe
print(df_ca.to_string())

           date         school state                                            content  word_count
0     24-Jan-20     Santa Cruz    CA  The UC Santa Cruz Student Health Center offers...       414.0
1     30-Jan-20     Santa Cruz    CA  UC Santa Cruz health officials are closely mon...       382.0
2     31-Jan-20     Santa Cruz    CA  Due to the dynamic situation with the coronavi...       338.0
3      4-Feb-20     Santa Cruz    CA  The UC Office of the President has directed th...      1276.0
4      4-Feb-20     Santa Cruz    CA  To: UC Santa Cruz Community\nFrom: Public Affa...       989.0
5      5-Feb-20     Santa Cruz    CA  UCSF is hosting a town hall today on the novel...       273.0
6      7-Feb-20     Santa Cruz    CA  The UC Santa Cruz Student Health Center shared...       700.0
7      7-Feb-20     Santa Cruz    CA  Students: How to get a flu vaccine\nFebruary 0...       359.0
8     10-Feb-20     Santa Cruz    CA  Campus community members can learn more about ...       178.0


### Reading in Texas school csv files

In [14]:
# Read in Texas State University (UNICODEDECODE ERRROR)
#df_tsu = pd.read_csv(os.path.join('Datasets', 'Texas_State_University.csv'), 
#                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Read in University Austin Texas
df_uat = pd.read_csv(os.path.join('Datasets', 'University_Austin_Texas.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Read in Texas A&M University
df_utm = pd.read_csv(os.path.join('Datasets', 'U_T&M.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})


# Read in University North Texas
df_unt = pd.read_csv(os.path.join('Datasets', 'UNT.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Reading in University of Houston
df_uh = pd.read_csv(os.path.join('Datasets', 'University_Houston.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})



## Take a look at Texas State University

In [15]:
#df_tsu

## Take a look at University of Austin Texas

In [16]:
# Renaming text column to content
df_uat = df_uat.rename(columns = {'text':'content'})

# Adding a 'state' column and setting its default value to 'TX'
df_uat['state'] = 'TX'

# Reordering the columns into a more readable format
df_uat = df_uat[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_uat.to_string())

         date  school state                                            content
0   12-May-20  Austin    TX  Admissions has suspended campus visits, Admiss...
1   13-May-20  Austin    TX  COVID-19 Identified within UT Community - from...
2   15-May-20  Austin    TX  Through March 30, students are on spring break...
3   16-May-20  Austin    TX  Starting March 16, 2020, all campus buildings ...
4   17-May-20  Austin    TX  Starting March 16, 2020, all campus buildings ...
5   18-May-20  Austin    TX  New COVID-19 Cases in UT Community - from Pres...
6   19-May-20  Austin    TX  Working Through These Remote Days Ahead - from...
7   20-May-20  Austin    TX  Dear UT Community,\r\n\r\nI just wanted to sha...
8   23-May-20  Austin    TX  Reimbursement for services no longer available...
9   24-May-20  Austin    TX  City of Austin Stay Home  Work SafeOrder - fro...
10  25-May-20  Austin    TX  May 21-23 commencement and graduation ceremoni...
11  27-May-20  Austin    TX  Online Classes Grading 

## Take a look at Texas A&M University

In [17]:
# Renaming text column to content
df_utm = df_utm.rename(columns = {'text':'content'})

# Adding a 'state' column and setting its default value to 'TX'
df_utm['state'] = 'TX'

# Reordering the columns into a more readable format
df_utm = df_utm[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_utm.to_string())

         date   school state                                            content
0   28-Feb-20  T_A&M_U    TX  February 28, 2020, 5:45 p.m. CST Dear Texas A&...
1    2-Mar-20  T_A&M_U    TX  March 2, 2020, 7:55 p.m. CST Texas A&M Univers...
2    3-Mar-20  T_A&M_U    TX  March 3, 2020, 5:45 p.m. CST Texas A&M continu...
3    6-Mar-20  T_A&M_U    TX  March 6, 2020, 4:30 p.m. CST Students, faculty...
4    9-Mar-20  T_A&M_U    TX  March 9, 2020, 5:00 p.m. CDT Texas A&M Cancels...
5   10-Mar-20  T_A&M_U    TX  Updated: March 10, 2020, 6:20 p.m. CDT Texas A...
6   11-Mar-20  T_A&M_U    TX  March 11, 2020, 11:30 p.m. CDT Dear Texas A&M ...
7   12-Mar-20  T_A&M_U    TX  March 12, 2020, 5:00 p.m. CDT Classes Canceled...
8   13-Mar-20  T_A&M_U    TX  Updated: March 13, 2020, 5:45 p.m. CDT Dear Te...
9   14-Mar-20  T_A&M_U    TX  March 14, 2020, 4:55 p.m. CDT Student Worker G...
10  14-Mar-20  T_A&M_U    TX  March 14, 2020, 5:00 p.m. CDT Guidance Regardi...
11  15-Mar-20  T_A&M_U    TX  March 15, 

## Take a look at University of North Texas

In [18]:
# Adding a 'state' column and setting its default value to 'TX'
df_unt['state'] = 'TX'

# Dropping the 'link' column associated with each update
df_unt = df_unt.drop(['link'], axis =1) 

# Reordering the columns into a more readable format
df_unt = df_unt[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_unt.to_string())


           date                     school state                                            content
0   18-May-2020  University of North Texas    TX  Dear UNT community,\r\n\r\nDenton County Publi...
1   15-May-2020  University of North Texas    TX  Final COVID-19 Regular Update\r\n\r\nToday’s e...
2   13-May-2020  University of North Texas    TX  In an effort to keep our community as healthy ...
3   11-May-2020  University of North Texas    TX  Have you been wearing a cloth face cover? Acco...
4   11-May-2020  University of North Texas    TX  Dear UNT undergraduate students,\r\n\r\nWe hop...
5    8-May-2020  University of North Texas    TX  Join Rec Sports for 4 weeks as we "Choose to M...
6    7-May-2020  University of North Texas    TX  A UNT student reported a positive COVID-19 tes...
7    6-May-2020  University of North Texas    TX  President Smatresk hosted a virtual Town Hall ...
8    4-May-2020  University of North Texas    TX  President Smatresk will be hosting a virtual T...


## Take a look at University of Houston

In [19]:
# Adding a 'state' column and setting its default value to 'TX'
df_uh['state'] = 'TX'

# Dropping the empty rows at the bottom of df_uh
df_uh = df_uh.dropna()

# Renamine the columns to match other Texas data frames
df_uh.columns = ['date', 'content', 'school', 'state']

# Reordering the columns into a more readable format
df_uh = df_uh[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_uh.to_string())

      date   school state                                            content
0   27-Jan  Houston    TX  Dear Faculty, Students and Staff,\n\nThe Unive...
1   28-Jan  Houston    TX  Dear Faculty, Students and Staff,\n\nAt this t...
2    2-Mar  Houston    TX  Dear Students, Faculty and Staff,\n\nThe Unive...
3    4-Mar  Houston    TX  UHS Faculty, Staff and Students,\n\nWe continu...
4    6-Mar  Houston    TX  Dear Faculty:\n\nThere are now five confirmed ...
5    9-Mar  Houston    TX  Dear Students,\n\nAs we continue to see more a...
6    9-Mar  Houston    TX  Dear Faculty and Staff,\n\nAs we continue to s...
7   10-Mar  Houston    TX  Dear Department Chairs and Associate Deans for...
8   11-Mar  Houston    TX  Dear Faculty, Staff and Students –\n\nTo allow...
9   11-Mar  Houston    TX  Dear UH Student:\n\nAs communicated by Preside...
10  12-Mar  Houston    TX  Dear Staff:\n\nFollowing the recent announceme...
11  12-Mar  Houston    TX  Dear Faculty and Staff,\n\nSince my last commu...

## Combining all of our Texas dataframes

In [20]:
# concatenating the dataframes together
df_tx = pd.concat([df_uat, df_utm, df_unt, df_uh], sort= True)
df_tx = df_tx[['date','school','state','content']]

# looking at the entire dataframe
print(df_tx.to_string())

           date                     school state                                            content
0     12-May-20                     Austin    TX  Admissions has suspended campus visits, Admiss...
1     13-May-20                     Austin    TX  COVID-19 Identified within UT Community - from...
2     15-May-20                     Austin    TX  Through March 30, students are on spring break...
3     16-May-20                     Austin    TX  Starting March 16, 2020, all campus buildings ...
4     17-May-20                     Austin    TX  Starting March 16, 2020, all campus buildings ...
5     18-May-20                     Austin    TX  New COVID-19 Cases in UT Community - from Pres...
6     19-May-20                     Austin    TX  Working Through These Remote Days Ahead - from...
7     20-May-20                     Austin    TX  Dear UT Community,\r\n\r\nI just wanted to sha...
8     23-May-20                     Austin    TX  Reimbursement for services no longer available...


28        4-May                    Houston    TX  Dear Colleagues,\n\nI hope you and your famili...


## Reading in Florida csv files

In [21]:
# Reading in Florida State University (UNICODE ERROR)
#df_fsu = pd.read_csv(os.path.join('Datasets', 'Florida_State_Univeristy.csv'), 
#                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Reading in University of Central Florida
df_ucf = pd.read_csv(os.path.join('Datasets', 'UCF.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Reading in Universirty of Florida
df_uf = pd.read_csv(os.path.join('Datasets', 'University_Florida.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Reading in University South Florida
df_usf = pd.read_csv(os.path.join('Datasets', 'USoFlorida.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

# Reading in University of Miami
df_um = pd.read_csv(os.path.join('Datasets', 'University_Miami.csv'), 
                     dtype={'date': 'str', 'word_count':int, 'school':'str'})

## Take a look at Florida State University

In [22]:
#df_fsu

## Take a look at University of Central Florida

In [27]:
# Adding a 'state' column and setting its default value to 'TX'
df_ucf['state'] = 'FL'

# Dropping the 'link' column associated with each update
df_ucf = df_ucf.drop(['link'], axis =1) 

# Reordering the columns into a more readable format
df_ucf = df_ucf[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_ucf.to_string())

           date                         school state                                            content
0   21-May-2020  University of Central Florida    FL  As we are all adjusting to the different reali...
1   20-May-2020  University of Central Florida    FL  COVID-19 has impacted all of us in some way. T...
2   13-May-2020  University of Central Florida    FL  As businesses and other entities across the st...
3   13-May-2020  University of Central Florida    FL  We would like to thank you for your continued ...
4   11-May-2020  University of Central Florida    FL  To continue to support our Knights during this...
5   11-May-2020  University of Central Florida    FL  On this first day of our summer classes, we ho...
6   10-May-2020  University of Central Florida    FL  We would like to thank you for your continued ...
7    4-May-2020  University of Central Florida    FL  Thank you for your patience as we navigate the...
8   30-Apr-2020  University of Central Florida    FL  The messag

## Take a look at University of Florida

In [28]:
# Renaming text column to content
df_uf = df_uf.rename(columns = {'text':'content'})

# Adding a 'state' column and setting its default value to 'TX'
df_uf['state'] = 'FL'

# Reordering the columns into a more readable format
df_uf = df_uf[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_uf.to_string())

         date   school state                                            content
0   24-Jan-20  Florida    FL  JANUARY 24: GUIDANCE ON COVID-19\r\nUniversity...
1   31-Jan-20  Florida    FL  JANUARY 31: GUIDANCE ON COVID-19\r\nWith the W...
2   10-Feb-20  Florida    FL  FEBRUARY 10: GUIDANCE ON COVID-19\r\nAs the ou...
3   11-Feb-20  Florida    FL  FEBRUARY 11: GUIDANCE ON COVID-19\r\nTravelers...
4   28-Feb-20  Florida    FL  FEBRUARY 28: GUIDANCE ON COVID-19\r\nAs cases ...
5    2-Mar-20  Florida    FL  MARCH 2: GUIDANCE ON COVID-19\r\nWith the stat...
6    6-Mar-20  Florida    FL  MARCH 6: UF PREPARING FOR RETURN FROM SPRING B...
7    9-Mar-20  Florida    FL  MARCH 9 UPDATE: COVID-19 AND ONLINE CLASSES\r\...
8   11-Mar-20  Florida    FL  MARCH 11: A MESSAGE FROM PRESIDENT KENT FUCHS\...
9   13-Mar-20  Florida    FL  MARCH 13: MESSAGE REGARDING ALACHUA COUNTY PUB...
10  16-Mar-20  Florida    FL  MARCH 16: UPDATED POLICIES FOR TRAVEL, CAMPUS ...
11  17-Mar-20  Florida    FL  MARCH 17: 

## Take a look at University of South Florida

In [29]:
# Renaming text column to content
df_usf = df_usf.rename(columns = {'text':'content'})

# Adding a 'state' column and setting its default value to 'TX'
df_usf['state'] = 'FL'

# Reordering the columns into a more readable format
df_usf = df_usf[['date','school','state','content', 'word_count']]

# Printing dataframe so we can view all entries
print(df_usf.to_string())

         date school state                                            content  word_count
0   27-Jan-20    USF    FL  JANUARY 27, 2020COMMUNITY Dear USF students, f...         503
1   31-Jan-20    USF    FL  JANUARY 31, 2020COMMUNITY Dear USF community, ...         471
2   28-Feb-20    USF    FL  FEBRUARY 28, 2020COMMUNITY Dear USF community,...         901
3    2-Mar-20    USF    FL  Dear USF community, The University of South Fl...         544
4   11-Mar-20    USF    FL  MARCH 11, 2020COMMUNITY, FACULTY, STAFF, STUDE...         787
5   11-Mar-20    USF    FL  MARCH 11, 2020PARENTS AND FAMILY The Universit...         314
6   12-Mar-20    USF    FL  MARCH 12, 2020STUDENTS Dear USF Education Abro...         256
7   13-Mar-20    USF    FL  MARCH 13, 2020STUDENTS Dear USF students, The ...         367
8   13-Mar-20    USF    FL  MARCH 13, 2020FACULTY Dear Colleagues, I am wr...         243
9   15-Mar-20    USF    FL  MARCH 15, 2020COMMUNITY, FACULTY, STAFF, STUDE...         364
10  17-Mar

## Take a look at University of Miami

In [33]:
# Adding a 'state' column and setting its default value to 'TX'
df_um['state'] = 'FL'

# Dropping the empty rows at the bottom of df_um
df_um = df_um.dropna()

# Renamine the columns to match other Texas data frames
df_um.columns = ['date', 'content', 'school', 'state']

# Reordering the columns into a more readable format
df_um = df_um[['date','school','state','content']]

# Printing dataframe so we can view all entries
print(df_um.to_string())

         date school                                              state content
0   27-Jan-20     FL  Health Advisory: Novel Coronavirus (2019-nCoV)...   Miami
1   31-Jan-20     FL  To the University of Miami Community,\n\nWe ar...   Miami
2   26-Feb-20     FL  To the University of Miami Community,\n\nFollo...   Miami
3   28-Feb-20     FL  To the University of Miami Community,\n\nThe U...   Miami
4   05-Mar-20     FL  Dear Faculty:\n\nAs we prepare for spring brea...   Miami
5   06-Mar-20     FL  University of Miami President Julio Frenk disc...   Miami
6   11-Mar-20     FL  To the University of Miami Community,\n\nWe ar...   Miami
7   12-Mar-20     FL  To the University of Miami Community,\n\nThe U...   Miami
8   13-Mar-20     FL  Dear Faculty,\n\nThe COVID-19 pandemic is disr...   Miami
9   14-Mar-20     FL  UPDATE: HR POLICIES\n\nDear Gables and Marine ...   Miami
10  14-Mar-20     FL  University of Miami President Julio Frenk upda...   Miami
11  16-Mar-20     FL  Dear Faculty,\n\nW

## Combining all of our Florida  dataframes

In [34]:
# concatenating the dataframes together
df_fl = pd.concat([df_ucf, df_uf,df_usf, df_um], sort= True)
df_fl = df_fl[['date','school','state','content', 'word_count']]

# looking at the entire dataframe
print(df_tx.to_string())

           date                     school state                                            content
0     12-May-20                     Austin    TX  Admissions has suspended campus visits, Admiss...
1     13-May-20                     Austin    TX  COVID-19 Identified within UT Community - from...
2     15-May-20                     Austin    TX  Through March 30, students are on spring break...
3     16-May-20                     Austin    TX  Starting March 16, 2020, all campus buildings ...
4     17-May-20                     Austin    TX  Starting March 16, 2020, all campus buildings ...
5     18-May-20                     Austin    TX  New COVID-19 Cases in UT Community - from Pres...
6     19-May-20                     Austin    TX  Working Through These Remote Days Ahead - from...
7     20-May-20                     Austin    TX  Dear UT Community,\r\n\r\nI just wanted to sha...
8     23-May-20                     Austin    TX  Reimbursement for services no longer available...
