# SAMueL-2 full production analysis

## Import packages

In [1]:
import warnings
warnings.filterwarnings("ignore")

import pandas as pd
from utils.data_process import DataProcess
from utils.descriptive_stats import DescriptiveStatistics
from utils.pathway import Pathway
from utils.reporting import GlobalReport
from utils.thrombolysis_choice_model import ThrombolysisChoiceModel


## Create data for models

See 'data' folder for processing of raw data.

In [2]:
# Switch for the data-preparation steps below. When it is False this cell
# does not bind `data_processor`.
process_new_data = True

if process_new_data:
    data_processor = DataProcess(
        year_min=2016,
        year_max=2019,
    )
    # Build the ML data first, then the parameters for the pathway simulation.
    data_processor.create_ml_data()
    data_processor.calculate_paramters_for_pathway_simulation()

All rows: 233501, ML rows:87918, Fraction: 0.38


## Descriptive statistics

In [3]:
# Build the descriptive-statistics helper with year_min=2019 and run it.
ds = DescriptiveStatistics(
    year_min=2019,
)
ds.run()

## Thrombolysis decision model

In [4]:
# Create the thrombolysis choice model with its default settings and run it.
# The pathway cell later reads `benchmark_thrombolysis` from this object.
thrombolysis_choice_model = ThrombolysisChoiceModel()
thrombolysis_choice_model.run()

Accuracy: 0.846
Balanced accuracy: 0.817
ROC AUC: 0.915
Actual thrombolysis: 0.303
Predicted thrombolysis: 0.301


## Pathway model

In [5]:
# Initialize pathway simulation with base case parameters.
#
# This cell reads `data_processor`, which the data-creation cell binds only
# when `process_new_data` is True. Check for it up front so that a fresh
# kernel run with the flag switched off fails with an actionable message
# instead of a bare "name 'data_processor' is not defined".
if "data_processor" not in globals():
    raise NameError(
        "data_processor is not defined: run the 'Create data for models' "
        "cell with process_new_data = True before the pathway model.")

# Inputs: the simulation parameters held by the data processor and the
# benchmark thrombolysis result held by the choice model; 10 trials.
pathway = Pathway(
    data_processor.pathway_simulation_parameters,
    thrombolysis_choice_model.benchmark_thrombolysis,
    trials=10)
pathway.run()

## Reporting

In [6]:
# Create the global report object and generate the report.
report = GlobalReport()
report.create_report()