# Load packages

In [1]:
import pandas as pd
from pathlib import Path
from tableone import TableOne

# Set up paths

In [4]:
# Directory layout, resolved relative to the notebook's working directory:
# inputs are read from <parent>/input, tables are written to <parent>/output/tableone.
code_dir = Path.cwd()
statistics_dir = code_dir.parent
source_dir = statistics_dir.joinpath("input")
output_dir = statistics_dir.joinpath("output/tableone")

# Create the output folder (including missing parents); a pre-existing folder is fine.
output_dir.mkdir(parents=True, exist_ok=True)

# Load data

In [5]:
# Read both input tables from the source folder, using the "sub_id" column as the row index.
statistics_df = pd.read_csv(
    source_dir / "statistics_df_randomized.csv",
    index_col="sub_id",
)
pwi_vs_trial_df = pd.read_csv(
    source_dir / "pwi_vs_trial_df.csv",
    index_col="sub_id",
)

### Variable dictionary for symptomatic intracranial hemorrhage (SICH)
- SAB1: SICH according to SITS-MOST
- SAB2: SICH according to ECASS-2
- SAB3: SICH according to ECASS-3
- SAB4: SICH according to NINDS

# Create Table 1

In [None]:
# Variables to summarise in Table 1, in the order they are passed to TableOne.
columns = [
    "AGE",
    "SEX",
    "NIHSSSCORE_V00",
    "Arterial_hypertension",
    "Hypercholesterolemia",
    "Diabetes_mellitus_type_II",
    "Atrial_fibrillation",
    "Ischemic_stroke",
    "stroke_volume_v00",
    "rapid_pwi_volume_v00",
    "treatment",
    "LVO_V0",
    "hemorrhage",
    "hemorrhage_type_hi1",
    "hemorrhage_type_hi2",
    "hemorrhage_type_ph1",
    "hemorrhage_type_ph2",
    "hemorrhage_type_other",
    "SAB1",
    "SAB2",
    "SAB3",
    "SAB4",
    "excellent_outcome",
    "NIHSSSCORE_V05",
]

# Continuous variables that are flagged to TableOne as non-normally distributed.
nonnormal = ["NIHSSSCORE_V00", "NIHSSSCORE_V05"]

# All continuous variables; every other entry of `columns` is treated as categorical.
continuous = {"AGE", "stroke_volume_v00", "rapid_pwi_volume_v00", *nonnormal}

# Derived from `columns` so that the two lists cannot drift apart; order follows `columns`.
categorical = [name for name in columns if name not in continuous]

# Build Table 1 from the full statistics data frame (no grouping, no p-values).
table1 = TableOne(
    statistics_df,
    columns=columns,
    categorical=categorical,
    nonnormal=nonnormal,
)

# Persist the table next to the other tableone outputs.
table1.to_csv(output_dir / "table_1.csv")

# Leave the table as the cell's last expression so the notebook renders it.
table1

# Comparison of perfusion sample with RCT sample

In [None]:
# Variables to compare between the two samples, in the order they are passed to TableOne.
columns = [
    "AGE",
    "SEX",
    "NIHSSSCORE_V00",
    "Arterial_hypertension",
    "Hypercholesterolemia",
    "Diabetes_mellitus_type_II",
    "Atrial_fibrillation",
    "Ischemic_stroke",
    "stroke_volume_v00",
    "treatment",
    "LVO_V0",
    "hemorrhage",
    "hemorrhage_type_hi1",
    "hemorrhage_type_hi2",
    "hemorrhage_type_ph1",
    "hemorrhage_type_ph2",
    "hemorrhage_type_other",
    "SAB1",
    "SAB2",
    "SAB3",
    "SAB4",
    "excellent_outcome",
    "NIHSSSCORE_V05",
]

# Continuous variables that are flagged to TableOne as non-normally distributed.
nonnormal = ["NIHSSSCORE_V00", "NIHSSSCORE_V05"]

# All continuous variables; every other entry of `columns` is treated as categorical.
continuous = {"AGE", "stroke_volume_v00", *nonnormal}

# Derived from `columns` so that the two lists cannot drift apart; order follows `columns`.
categorical = [name for name in columns if name not in continuous]

# Build Table S1: same summary, stratified by the 'pwi_sample' column with p-values requested.
table_s1 = TableOne(
    pwi_vs_trial_df,
    columns=columns,
    categorical=categorical,
    nonnormal=nonnormal,
    groupby="pwi_sample",
    pval=True,
)

# Persist the table next to the other tableone outputs.
table_s1.to_csv(output_dir / "table_s1.csv")

# Leave the table as the cell's last expression so the notebook renders it.
table_s1