# SAMueL-2 full production analysis

## Import packages

In [1]:
import warnings
warnings.filterwarnings("ignore")

import pandas as pd
from utils.data_process import DataProcess
from utils.descriptive_stats import DescriptiveStatistics
from utils.pathway import Pathway
from utils.reporting import GlobalReport
from utils.thrombolysis_choice_model import ThrombolysisChoiceModel
from utils.thrombolysis_outcome_model import OutcomeModel

## Create data for models

See 'data' folder for processing of raw data.

In [2]:
# Options handed to DataProcess: year bounds of 2019 and 2021, with the
# `limit_to_ambo` restriction switched off.
processing_options = {
    "year_min": 2019,
    "year_max": 2021,
    "limit_to_ambo": False,
}
data_processor = DataProcess(**processing_options)

# Execute the processing step; the saved output of this cell shows a
# summary of total rows versus rows kept for machine learning.
data_processor.run()

All rows: 185673, ML rows:66820, Fraction: 0.36


## Model Run

In [3]:
# Master switch: set to False to skip every modelling stage in this cell.
run_model = True

# Per-stage switches. These replace commenting individual `.run()` calls in
# and out by hand. The defaults reproduce the previous state of this cell:
# every model object is constructed, but only the outcome model is run and
# the pathway simulation is skipped entirely.
run_descriptive_stats = False
run_thrombolysis_choice = False
run_outcome = True
run_pathway = False

if run_model:
    # Descriptive statistics
    ds = DescriptiveStatistics()
    if run_descriptive_stats:
        ds.run()

    # Thrombolysis decision model
    thrombolysis_choice_model = ThrombolysisChoiceModel()
    if run_thrombolysis_choice:
        thrombolysis_choice_model.run()

    # Outcome model
    outcome_model = OutcomeModel()
    if run_outcome:
        outcome_model.run()

    # Pathway simulation
    if run_pathway:
        # NOTE(review): `benchmark_thrombolysis` is presumably only populated
        # once the thrombolysis choice model has been run - confirm before
        # enabling this stage without `run_thrombolysis_choice`.
        pathway = Pathway(
            data_processor.pathway_simulation_parameters,
            thrombolysis_choice_model.benchmark_thrombolysis,
            trials=100)
        pathway.run()

Outcome multiclass ROC AUC 0.781


## Reporting

In [4]:
# Build the report object and generate the report.
# NOTE(review): presumably this collates results saved by the earlier
# stages - confirm in utils/reporting which outputs it expects to exist.
report = GlobalReport()
report.create_report()

## To Do

* Restrict the analysis to stroke units that meet a minimum number of admissions and a minimum level of thrombolysis use (the analysis can currently crash when the data years are restricted).