# Project 5: Optimizing Evacuation Routes using Real-Time Traffic Information

Kelly Slatery | US-DSI-10 | 02.21.2020

## Test Data Predictions

In [1]:
# Imports
import numpy as np
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
%matplotlib inline

from sklearn.model_selection import cross_val_score
from sklearn.metrics import confusion_matrix
import pickle

## Import Test Data

In [2]:
# Read the test tweets from disk into a DataFrame and show its dimensions
test_data_path = './data/test_data/final_test_data.csv'
df = pd.read_csv(test_data_path)
df.shape

(3087, 3)

In [3]:
# Preview the first five rows of the loaded test data
df.head(n=5)

Unnamed: 0,dates&time,user,tweet
0,2017-08-31 21:34:27+00:00,DallasPD,Reminder: Texas State Law prohibiting texting ...
1,2017-08-31 21:03:18+00:00,DallasPD,Brotherhood for the Fallen Charity Event
2,2017-08-31 17:16:43+00:00,DallasPD,FREE #TRINITY EVENT - Artisan Fair Market - Se...
3,2017-08-31 17:13:36+00:00,DallasPD,Our thoughts and prayers are with the Sacramen...
4,2017-08-31 17:10:47+00:00,DallasPD,How can Dallas residents help animals affected...


In [4]:
# The raw tweet text is the only model input; select that column as X
X = df.loc[:, 'tweet']
X.head()

0    Reminder: Texas State Law prohibiting texting ...
1             Brotherhood for the Fallen Charity Event
2    FREE #TRINITY EVENT - Artisan Fair Market - Se...
3    Our thoughts and prayers are with the Sacramen...
4    How can Dallas residents help animals affected...
Name: tweet, dtype: object

## Import Model

In [5]:
# Load the pickled model from disk and look at its first 5 predictions.
# NOTE: pickle.load can execute arbitrary code while unpickling, so only
# load model files that come from a trusted source.
with open('./assets/lr_cv.sav', 'rb') as model_file:
    # The context manager closes the file handle even if unpickling fails
    model = pickle.load(model_file)
print(model.predict(X)[:5])

[0 0 0 0 0]


In [6]:
# Run the model over every tweet and store the predicted label in a new 'class' column
predicted_labels = model.predict(X)
df['class'] = list(predicted_labels)
df.head()

Unnamed: 0,dates&time,user,tweet,class
0,2017-08-31 21:34:27+00:00,DallasPD,Reminder: Texas State Law prohibiting texting ...,0
1,2017-08-31 21:03:18+00:00,DallasPD,Brotherhood for the Fallen Charity Event,0
2,2017-08-31 17:16:43+00:00,DallasPD,FREE #TRINITY EVENT - Artisan Fair Market - Se...,0
3,2017-08-31 17:13:36+00:00,DallasPD,Our thoughts and prayers are with the Sacramen...,0
4,2017-08-31 17:10:47+00:00,DallasPD,How can Dallas residents help animals affected...,0


In [7]:
# Keep only the tweets predicted as class 1, report how many there are,
# and show the first few
useful_tweets = df[df['class'] == 1]
print(useful_tweets.shape)
useful_tweets.head()

(103, 4)


Unnamed: 0,dates&time,user,tweet,class
239,2017-09-01 04:36:40+00:00,EPPOLICE,"I-10 East at Airway, scheduled road work, all ...",1
240,2017-09-01 04:09:53+00:00,EPPOLICE,"I-10 East at Mesa, schedule road work, all lan...",1
242,2017-09-01 00:39:43+00:00,EPPOLICE,"I-10 East @US-54, Collision, Right Lane Closed...",1
247,2017-08-31 23:10:23+00:00,EPPOLICE,"I-10 East @Schuster, Collision, Right Shoulder...",1
248,2017-08-31 22:51:34+00:00,EPPOLICE,"I-10 West @Trowbridge, Collision, Right Lane C...",1


In [8]:
# Show the last few tweets predicted as class 1
is_class_one = df['class'] == 1
df[is_class_one].tail()

Unnamed: 0,dates&time,user,tweet,class
2914,2017-08-25 13:00:53+00:00,I35travel,Waxahachie | US 287 Business WB@I-35 E | Vario...,1
2948,2017-08-31 18:31:58+00:00,TxDOTLufkin,ALERT: SL 287 East remains closed in Lufkin. A...,1
3040,2017-08-30 02:10:33+00:00,my290Houston,US 290 EB closed from Fry to Barker Cypress is...,1
3053,2017-08-29 15:48:59+00:00,my290Houston,"No, if you do not need to travel, please stay ...",1
3069,2017-08-28 13:59:02+00:00,my290Houston,US 290 mainlanes & frontage are closed in both...,1


## Export Data with Predictions

In [9]:
# Write the tweets together with their predicted class to CSV, without the row index
df.to_csv(path_or_buf='./data/final_data_with_predictions.csv', index=False)