In [1]:
# Execute the shared run-script notebook before anything else in this notebook.
# NOTE(review): the cells below use get_conf, get_datasources, the pre_process_*
# helpers, create_master_table, one_hot_encode_columns, create_train_test_split,
# selected_features, calculate_model_accuracy and joblib without importing them,
# so they are presumably brought into scope by this script — confirm.
# The path is relative, so the result depends on the kernel's working directory.
%run ../src/model/run_script.ipynb

In [2]:
# Evaluate the previously trained model: rebuild the feature table from the raw
# data sources, recreate the train/test split, load the persisted model and
# predictions, and compute the accuracy metrics.

conf = get_conf()

# Fetch the data sources once and pick the three tables out of the result,
# instead of calling get_datasources() separately for every table.
datasources = get_datasources(conf)
trans = datasources["trans_info"]
item = datasources["item_info"]
stores = datasources["outlets_info"]

trans = pre_process_transaction_info(trans)
item = pre_process_item_info(item)
store = pre_process_stores_info(stores)
no_categories = conf['params']["no_categories"]
cutoff = conf['train_test_split']["cutoff"]

# Create Master table
master_table = create_master_table(trans, item, no_categories, store)

# Encode the categorical columns
data = one_hot_encode_columns(master_table)

# Splitting the data into training and test sets
X_train, X_test, y_train, y_test = create_train_test_split(data, cutoff)

# Load the saved model and the saved predictions.
# NOTE(review): joblib.load unpickles the file, which can execute arbitrary
# code — only load artifacts produced by a trusted training run.
# NOTE(review): both paths are relative to the kernel's working directory, and
# y_pred is read from disk rather than recomputed, so it is presumably the
# prediction for this exact X_test — confirm the artifacts match the current
# data and cutoff.
best_model_grid = joblib.load('best_model_grid.pkl')
y_pred = joblib.load('y_pred.pkl')

# Select feature names with non-zero importance.
# The result is bound to `selected_feature_names` rather than `selected_features`:
# reusing the helper's own name would replace the function with its return
# value, and re-running this cell would then fail because the name no longer
# refers to a callable.
selected_feature_names, selected_importances = selected_features(best_model_grid, X_train.columns)

# Calculating the model performance using accuracy metrics
rmsle, mae, r2, adj_r2, total_mape, avg_mape = calculate_model_accuracy(y_test, y_pred, selected_feature_names)

In [3]:
# Report the evaluation metrics computed in the previous cell, rounded to three
# decimals. The labels and values are paired up so each line is printed the
# same way ("<label>: <value>").
metric_report = [
    ("Root Mean Squared Logarithmic Error (RMSLE)", rmsle),
    ("Mean Absolute Error (MAE)", mae),
    ("R-squared (R2) Score", r2),
    ("Adjusted R-squared", adj_r2),
    ("Total Mean Absolute Percentage Error (MAPE)", total_mape),
    ("Average Mean Absolute Percentage Error (MAPE)", avg_mape),
]

print()  # blank line before the report, as in the original leading "\n"
for label, value in metric_report:
    print(f"{label}:", round(value, 3))


Root Mean Squared Logarithmic Error (RMSLE): 1.806
Mean Absolute Error (MAE): 84.705
R-squared (R2) Score: 0.926
Adjusted R-squared: 0.922
Total Mean Absolute Percentage Error (MAPE): 12.719
Average Mean Absolute Percentage Error (MAPE): 24.393
