# In [None]:
# code required for running model post creation:

# import dependencies
import numpy as np
import pandas as pd

from sklearn.preprocessing import LabelEncoder
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.externals import joblib

from keras.models import load_model

# Load the pickled vectorizer and label encoder from the working directory.
# NOTE(review): joblib.load unpickles arbitrary objects -- only load artifacts
# that come from a trusted source.
# NOTE(review): the file imports joblib from sklearn.externals, which was
# removed in scikit-learn 0.23; on newer installs use `import joblib` instead.
vectorizer = joblib.load('vectorizer.pkl')
label_encoder = joblib.load('label_encoder.pkl')

# load the model
model = load_model("auth_model_trained.h5")

# test the data, assuming that the input data is in the same format as the
# original auth.txt.gz file without the SuccessFailure column.

# start by converting the data into a usable format
# create the header (the CSV itself has no header row)
header = ["Time", "SourceUserDomain", "DestUserDomain", "SourceComputer", "DestComputer", "AuthType", "LogonType", "AuthOrientation"]

# create a test data frame, replace the file path with that of the test data,
# change column names to headers, drop unnecessary columns
test_df = pd.read_csv('./Data/CSVs/tester.csv', header=None)
test_df.columns = header
# Only SourceUserDomain, LogonType and AuthOrientation are used below.
test_df = test_df.drop(["DestUserDomain", "SourceComputer", "DestComputer", "Time", "AuthType"], axis=1)

# transform the data into the proper testing format: one space-separated
# string per row, built from the three remaining columns
test = test_df["SourceUserDomain"] + ' ' + test_df["LogonType"] + ' ' + test_df["AuthOrientation"]

# run the test data through the vectorizer, model, and label encoder
test_vec = vectorizer.transform(test)

# Sequential.predict_classes() was removed in TensorFlow 2.6, so derive the
# class indices from predict() the same way that method did: argmax over a
# multi-unit output, or a 0.5 threshold on a single-unit output.
probabilities = model.predict(test_vec, verbose=0)
if probabilities.shape[-1] > 1:
    encoded_test = probabilities.argmax(axis=-1)
else:
    # Flatten (n, 1) -> (n,) so the label encoder receives a 1-D array.
    encoded_test = (probabilities > 0.5).astype("int32").ravel()

predict_label = label_encoder.inverse_transform(encoded_test)
# Only the prediction for the first input row is reported.
print("Logon Prediction: " + predict_label[0])