# SAMueL-2 full production analysis

## Import packages

In [1]:
# Install a blanket "ignore" filter: from this point on every warning category
# is suppressed for the rest of the kernel session.
# NOTE(review): this also hides deprecation and numerical warnings emitted by
# the libraries used below — presumably done to keep cell output tidy; consider
# narrowing the filter to the specific category/module that is noisy.
import warnings
warnings.filterwarnings("ignore")

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from utils.data_process import DataProcess
from utils.descriptive_stats import DescriptiveStatistics
from utils.pathway import Pathway
from utils.reporting import GlobalReport
from utils.thrombolysis_choice_outcome import ThrombolysisChoiceOutcome


## Create data for models

See the 'data' folder for details of how the raw data is processed.

In [2]:
# Configure the data-processing step with a 2016-2021 year window and the
# `limit_to_ambo` option switched off.
# NOTE(review): whether the year bounds are inclusive is not visible here —
# confirm in utils/data_process.py.
data_processor = DataProcess(year_min=2016, year_max=2021, limit_to_ambo=False)

# Execute the processing. The same object is reused later in the notebook,
# where its `pathway_simulation_parameters` attribute is handed to Pathway.
data_processor.run()

All rows: 358925, ML rows:132426, Fraction: 0.37


## Model Run

In [3]:
# Descriptive statistics
# Build the descriptive-statistics helper with its default constructor
# arguments and execute it.
# NOTE(review): no data is passed in explicitly, so run() presumably picks up
# whatever data_processor.run() produced earlier — confirm in
# utils/descriptive_stats.py.
ds = DescriptiveStatistics()
ds.run()

In [4]:
# ML Models
# Build the thrombolysis choice/outcome model object with its default
# constructor arguments and execute it. The cell output beneath reports a
# ROC AUC, the actual and predicted thrombolysis rates, and a multiclass
# ROC AUC for the outcome model.
# NOTE(review): no data is passed in explicitly, so run() presumably loads the
# ML data prepared by data_processor.run() — confirm in
# utils/thrombolysis_choice_outcome.py.
choice_outcome_model = ThrombolysisChoiceOutcome()
choice_outcome_model.run()

ROC AUC: 0.938
Actual thrombolysis: 0.300
Predicted thrombolysis: 0.299
Outcome multiclass ROC AUC 0.852


In [5]:
# Pathway model: built from the simulation parameters exposed by the data
# processor and configured with trials=10, then executed.
# NOTE(review): no random seed is passed here — if Pathway is stochastic,
# check whether it fixes a seed internally so results are repeatable.
pathway = Pathway(
    data_processor.pathway_simulation_parameters,
    trials=10,
)
pathway.run()