# INCREMENT-SOT CAZ-AVI

Análisis estadístico de la cohorte **INCREMENT-SOT CAZ-AVI** para el estudio retrospectivo del tratamiento con CAZ-AVI frente al resto de terapias disponibles en diferentes centros.

## Control por Propensity-score

                                              ["Age", "Gender",
                                               "Biliary_stenosis", "CMV_disease",
                                               "Kidney_disease", "Post_transplant_dialysis",
                                               "Score_Charlson_AMN", "Acquisition",
                                               "SIRS_SevereORSchock", "Pitt_Score",
                                               "Source_infection_Urinary_tract",
                                               "Source_infection_Pneumonia",
                                               "SourceControl_before30days", "Surgical_debridement",
                                               "Carbapenemase", "Removal_Replacement_vascular_line",
                                               "Myocardial_Infarct", "Diabetes_Mellitus",
                                               "Chronic_Pulmonary_Disease"]



## Tablas

### Tabla 1

In [1]:
import pandas as pd
from pystats_utils.pipeline import BivariantTable

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Build the bivariate table with Cohort_Cazavi as class variable; the listed
# columns are passed as excludedVariables.
result = BivariantTable(
    dataframe=workDataframe,
    classVariable="Cohort_Cazavi",
    excludedVariables=["Pt", "ps_cvsm", "Caso_REC_3digitos"],
).run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_1_raw.xlsx")
result

Unnamed: 0,Variable,All,no,yes,P_value,Test,Variable_type,Normality,Homocedasticity
0,Center,,,,0.001,Pearson Chi Square Test,categorical,,
1,----> Center-FMUSP,8 (0.05),7 (0.11),1 (0.01),0.031,Pearson Chi Square Test,categorical,,
2,----> Center-Gemelli,19 (0.13),4 (0.06),15 (0.18),0.053,Pearson Chi Square Test,categorical,,
3,----> Center-HCKT,21 (0.14),16 (0.24),5 (0.06),0.003,Pearson Chi Square Test,categorical,,
4,----> Center-HPG23,8 (0.05),3 (0.05),5 (0.06),0.975,Pearson Chi Square Test,categorical,,
...,...,...,...,...,...,...,...,...,...
2,----> Source_infection_Vascular_access-yes,25 (0.17),16 (0.24),9 (0.11),0.051,Pearson Chi Square Test,categorical,,
0,Source_infection_other,,,,0.070,Pearson Chi Square Test,categorical,,
1,----> Source_infection_other-no,143 (0.96),66 (1.00),77 (0.93),0.070,Pearson Chi Square Test,categorical,,
2,----> Source_infection_other-yes,6 (0.04),0 (0.00),6 (0.07),0.070,Pearson Chi Square Test,categorical,,


### Tabla 2.A

In [2]:
import pandas as pd
from pystats_utils.test.multivariant import LogisticRegression

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Predictors handed to the model.
targetVariable = ["Gender", "ICS_SOT_score", "Cohort_Cazavi", "ps_cvsb"]

# Run LogisticRegression with Clinical_success_14d as class variable.
result = LogisticRegression(
    dataframe=workDataframe,
    classVariable="Clinical_success_14d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_2a_params_raw.xlsx")
result.summary.to_excel("tabla_2a_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aOR,CI 2.5%,CI 97.5%,P value,Coef,Raw CI 2.5%,Raw CI 97.5%,Standard Err.
0,Intercept,3.708645,0.967821,14.211352,0.055845,1.310667,-0.032708,2.654041,0.685408
1,ICS_SOT_score,0.81371,0.737184,0.89818,4.3e-05,-0.206151,-0.304918,-0.107385,0.050392
2,ps_cvsb,1.627478,0.21309,12.429867,0.638699,0.487032,-1.546039,2.520102,1.0373
3,Gender_male,2.624401,1.009805,6.820605,0.047705,0.964853,0.009758,1.919948,0.487302
4,Cohort_Cazavi_yes,2.649322,1.025685,6.843142,0.044184,0.974304,0.025361,1.923247,0.484164


In [3]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_2a_metrics_raw.xlsx).
result.summary

Unnamed: 0,Value,CI 2.5%,CI 97.5%
Area under curve ROC,0.789794,0.69936,0.880229
Best Cutoff,0.729561,0.677212,0.781911
Accuracy,0.742857,0.668748,0.816966
Error,0.257143,0.183034,0.331252
Precision,0.882353,0.813655,0.951051
Recall,0.742574,0.654246,0.830903
F1,0.806452,0.742667,0.870236
Sensitivity,0.742574,0.654246,0.830903
Specificity,0.74359,0.604629,0.88255
PPV,0.882353,0.813655,0.951051


### Tabla 2.B

In [4]:
import pandas as pd
from pystats_utils.test.multivariant import LogisticRegression

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows with ICS_SOT_score >= 8.
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["ICS_SOT_score"].ge(8)]

# Predictors handed to the model (ICS_SOT_score is not included here).
targetVariable = ["Gender", "Cohort_Cazavi", "ps_cvsb"]

# Run LogisticRegression with Clinical_success_14d as class variable.
result = LogisticRegression(
    dataframe=workDataframe,
    classVariable="Clinical_success_14d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_2b_params_raw.xlsx")
result.summary.to_excel("tabla_2b_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aOR,CI 2.5%,CI 97.5%,P value,Coef,Raw CI 2.5%,Raw CI 97.5%,Standard Err.
0,Intercept,0.135072,0.03124,0.584016,0.007364,-2.001947,-3.466068,-0.537826,0.747014
1,ps_cvsb,1.870961,0.163374,21.426295,0.614553,0.626452,-1.811714,3.064619,1.243985
2,Gender_male,4.595092,1.356525,15.565411,0.014293,1.524989,0.304926,2.745051,0.622492
3,Cohort_Cazavi_yes,4.133872,1.274053,13.413017,0.018114,1.419215,0.242203,2.596226,0.600527


In [5]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_2b_metrics_raw.xlsx).
result.summary

Unnamed: 0,Value,CI 2.5%,CI 97.5%
Area under curve ROC,0.7507,0.629551,0.871849
Best Cutoff,0.481933,0.367063,0.596804
Accuracy,0.723684,0.622453,0.824915
Error,0.276316,0.175085,0.377547
Precision,0.769231,0.632338,0.906124
Recall,0.714286,0.576917,0.851654
F1,0.740741,0.630939,0.850543
Sensitivity,0.714286,0.576917,0.851654
Specificity,0.735294,0.584181,0.886407
PPV,0.769231,0.632338,0.906124


### Tabla 3.A

In [6]:
import pandas as pd
from pystats_utils.test.multivariant import LogisticRegression

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Predictors handed to the model.
targetVariable = ["Gender", "ICS_SOT_score", "Cohort_Cazavi", "ps_cvsb"]

# Run LogisticRegression with Clinical_success_30d as class variable.
result = LogisticRegression(
    dataframe=workDataframe,
    classVariable="Clinical_success_30d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_3a_params_raw.xlsx")
result.summary.to_excel("tabla_3a_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aOR,CI 2.5%,CI 97.5%,P value,Coef,Raw CI 2.5%,Raw CI 97.5%,Standard Err.
0,Intercept,3.510539,0.873811,14.103605,0.076752,1.25577,-0.134891,2.64643,0.709534
1,ICS_SOT_score,0.803338,0.72388,0.891519,3.8e-05,-0.218979,-0.32313,-0.114829,0.053139
2,ps_cvsb,1.926675,0.232546,15.962764,0.543268,0.655796,-1.458667,2.770259,1.078827
3,Gender_male,3.078909,1.137658,8.332631,0.026838,1.124575,0.128972,2.120179,0.50797
4,Cohort_Cazavi_yes,3.140749,1.174849,8.396233,0.02254,1.144461,0.16114,2.127783,0.501704


In [7]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_3a_metrics_raw.xlsx).
result.summary

Unnamed: 0,Value,CI 2.5%,CI 97.5%
Area under curve ROC,0.811598,0.725026,0.89817
Best Cutoff,0.735433,0.670701,0.800164
Accuracy,0.771429,0.700297,0.842561
Error,0.228571,0.157439,0.299703
Precision,0.908046,0.846635,0.969457
Recall,0.76699,0.684705,0.849276
F1,0.831579,0.773098,0.89006
Sensitivity,0.76699,0.684705,0.849276
Specificity,0.783784,0.645576,0.921992
PPV,0.908046,0.846635,0.969457


### Tabla 3.B

In [8]:
import pandas as pd
from pystats_utils.test.multivariant import LogisticRegression

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows with ICS_SOT_score >= 8.
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["ICS_SOT_score"].ge(8)]

# Predictors handed to the model (ICS_SOT_score is not included here).
targetVariable = ["Gender", "Cohort_Cazavi", "ps_cvsb"]

# Run LogisticRegression with Clinical_success_30d as class variable.
result = LogisticRegression(
    dataframe=workDataframe,
    classVariable="Clinical_success_30d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_3b_params_raw.xlsx")
result.summary.to_excel("tabla_3b_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aOR,CI 2.5%,CI 97.5%,P value,Coef,Raw CI 2.5%,Raw CI 97.5%,Standard Err.
0,Intercept,0.107991,0.023753,0.490978,0.003969,-2.225705,-3.740053,-0.711357,0.772641
1,ps_cvsb,2.666262,0.221467,32.099379,0.439821,0.980678,-1.507481,3.468837,1.269492
2,Gender_male,4.99228,1.439457,17.314071,0.011275,1.607893,0.364266,2.85152,0.634515
3,Cohort_Cazavi_yes,4.466102,1.347233,14.805213,0.014389,1.496516,0.298053,2.694979,0.611472


In [9]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_3b_metrics_raw.xlsx).
result.summary

Unnamed: 0,Value,CI 2.5%,CI 97.5%
Area under curve ROC,0.775194,0.6584,0.891987
Best Cutoff,0.513837,0.418033,0.609642
Accuracy,0.723684,0.623035,0.824333
Error,0.276316,0.175667,0.376965
Precision,0.789474,0.65629,0.922657
Recall,0.697674,0.558633,0.836716
F1,0.740741,0.630866,0.850615
Sensitivity,0.697674,0.558633,0.836716
Specificity,0.757576,0.607464,0.907688
PPV,0.789474,0.65629,0.922657


### Tabla 4.A

In [10]:
import pandas as pd
from pystats_utils.test.multivariant import CoxPhRegression

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Predictors handed to the model.
targetVariable = ["Gender", "Age", "ICS_SOT_score", "Cohort_Cazavi", "ps_cvsb"]

# Run CoxPhRegression with Mortality_31d as event and Time2death_31d as time.
result = CoxPhRegression(
    dataframe=workDataframe,
    eventVariable="Mortality_31d",
    timeVariable="Time2death_31d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_4a_params_raw.xlsx")
result.summary.to_excel("tabla_4a_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aHR,CI 2.5%,CI 97.5%,P values,Raw Coef,Raw CI 2.5%,Raw CI 97.5%,Std Error
Age,Age,0.989691,0.954694,1.025972,0.572677,-0.010362,-0.046365,0.02564,0.018369
ICS_SOT_score,ICS_SOT_score,1.177578,1.080303,1.283612,0.000203,0.16346,0.077242,0.249678,0.04399
ps_cvsb,ps_cvsb,0.703427,0.096199,5.143624,0.728922,-0.351792,-2.341341,1.637758,1.015095
Gender_male,Gender_male,0.425206,0.192208,0.940649,0.034772,-0.855181,-1.649176,-0.061185,0.405107
Cohort_Cazavi_yes,Cohort_Cazavi_yes,0.597564,0.229997,1.552556,0.290534,-0.514894,-1.46969,0.439903,0.48715


In [11]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_4a_metrics_raw.xlsx).
result.summary

Unnamed: 0,Values
Concordance,0.762722
Partial AIC,255.874187
Partial log-likelihood,-122.937093
Log-likelihood ratio statistic,25.06479
Log-likelihood ratio df,5.0
Log-likelihood ratio p value,0.000135
Log-likelihood ratio -log2(p),12.85073


### Tabla 4.B

In [12]:
import pandas as pd
from pystats_utils.test.multivariant import CoxPhRegression

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows with ICS_SOT_score >= 8.
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["ICS_SOT_score"].ge(8)]

# Predictors handed to the model (ICS_SOT_score is not included here).
targetVariable = ["Gender", "Age", "Cohort_Cazavi", "ps_cvsb"]

# Run CoxPhRegression with Mortality_31d as event and Time2death_31d as time.
result = CoxPhRegression(
    dataframe=workDataframe,
    eventVariable="Mortality_31d",
    timeVariable="Time2death_31d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_4b_params_raw.xlsx")
result.summary.to_excel("tabla_4b_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aHR,CI 2.5%,CI 97.5%,P values,Raw Coef,Raw CI 2.5%,Raw CI 97.5%,Std Error
Age,Age,0.996318,0.955882,1.038464,0.861463,-0.003689,-0.045121,0.037743,0.021139
ps_cvsb,ps_cvsb,0.581527,0.07714,4.383875,0.598904,-0.542097,-2.562128,1.477933,1.030647
Gender_male,Gender_male,0.461501,0.203834,1.044886,0.063646,-0.773272,-1.590451,0.043908,0.416936
Cohort_Cazavi_yes,Cohort_Cazavi_yes,0.56612,0.216886,1.477698,0.245127,-0.568949,-1.528383,0.390485,0.489516


In [13]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_4b_metrics_raw.xlsx).
result.summary

Unnamed: 0,Values
Concordance,0.659218
Partial AIC,214.688686
Partial log-likelihood,-103.344343
Log-likelihood ratio statistic,8.798051
Log-likelihood ratio df,4.0
Log-likelihood ratio p value,0.06635
Log-likelihood ratio -log2(p),3.913754


## Tablas suplementarias

### Tabla S2

In [14]:
import pandas as pd
from pystats_utils.pipeline import UnivariantTable

# Load the database and keep only the rows whose Cohort_Global is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Global"].eq("yes")]

# Build the univariate table; the listed columns are passed as excludedVariables.
result = UnivariantTable(
    dataframe=workDataframe,
    excludedVariables=["Pt", "Caso_REC_3digitos"],
).run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S2_raw.xlsx")
result

Unnamed: 0,Variable,Information,Non empty
0,Center,,210
1,----> Center_FMUSP,14 (6.67),
2,----> Center_Gemelli,20 (9.52),
3,----> Center_HCKT,38 (18.10),
4,----> Center_HPG23,9 (4.29),
...,...,...,...
274,Source_infection_other,,210
275,----> Source_infection_other_no,204 (97.14),
276,----> Source_infection_other_yes,6 (2.86),
277,ps_cvsb,0.56 (0.37 - 0.76),140


### Tabla S4

In [15]:
import pandas as pd
from pystats_utils.pipeline import CutoffTable

# Load the database and keep only the rows whose Cohort_Global is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Global"].eq("yes")]

# Build the cutoff table for ICS_SOT_score with Mortality_31d as class variable.
result = CutoffTable(
    dataframe=workDataframe,
    classVariable="Mortality_31d",
    targetVariable="ICS_SOT_score",
).run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S4_raw.xlsx")
result

Unnamed: 0,Cutoff,Proportion,True positive,False positive,True negative,False negative,Sensitivity,Specificity,PPV,NPV,Accuracy
0,Var >= 0,100.0,49,161,0,0,1.00 (1.00 - 1.00),0.00 (0.00 - 0.00),0.23 (0.18 - 0.29),nan (0.00 - 1.00),0.23 (0.18 - 0.29)
1,Var >= 1,89.52,49,139,22,0,1.00 (1.00 - 1.00),0.14 (0.09 - 0.19),0.26 (0.20 - 0.32),1.00 (1.00 - 1.00),0.34 (0.28 - 0.40)
2,Var >= 2,89.52,49,139,22,0,1.00 (1.00 - 1.00),0.14 (0.08 - 0.19),0.26 (0.20 - 0.32),1.00 (1.00 - 1.00),0.34 (0.27 - 0.40)
3,Var >= 3,87.14,48,135,26,1,0.98 (0.94 - 1.00),0.16 (0.10 - 0.22),0.26 (0.20 - 0.33),0.96 (0.89 - 1.00),0.35 (0.28 - 0.42)
4,Var >= 4,79.05,47,119,42,2,0.96 (0.90 - 1.00),0.26 (0.19 - 0.33),0.28 (0.22 - 0.35),0.95 (0.89 - 1.00),0.42 (0.36 - 0.49)
5,Var >= 5,70.48,46,102,59,3,0.94 (0.87 - 1.00),0.37 (0.29 - 0.44),0.31 (0.23 - 0.39),0.95 (0.90 - 1.00),0.50 (0.43 - 0.57)
6,Var >= 6,69.05,46,99,62,3,0.94 (0.87 - 1.00),0.39 (0.31 - 0.46),0.32 (0.24 - 0.39),0.95 (0.90 - 1.00),0.51 (0.45 - 0.58)
7,Var >= 7,66.19,46,93,68,3,0.94 (0.87 - 1.00),0.42 (0.34 - 0.50),0.33 (0.25 - 0.41),0.96 (0.91 - 1.00),0.54 (0.47 - 0.61)
8,Var >= 8,59.05,46,78,83,3,0.94 (0.87 - 1.00),0.52 (0.44 - 0.59),0.37 (0.29 - 0.46),0.97 (0.93 - 1.00),0.61 (0.55 - 0.68)
9,Var >= 9,45.71,36,60,101,13,0.73 (0.61 - 0.86),0.63 (0.55 - 0.70),0.38 (0.28 - 0.47),0.89 (0.83 - 0.94),0.65 (0.59 - 0.72)


### Tabla S5.A

In [16]:
import pandas as pd

from pystats_utils.pipeline import ExtendedContingencyTable

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")

# .copy() makes workDataframe an independent frame, so adding the ICS_ge8
# column below does not write into a slice of `dataframe`
# (this avoids pandas' SettingWithCopyWarning).
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"].copy()

# Stratification flag: "yes" when ICS_SOT_score >= 8, "no" otherwise.
# A single explicit mapping replaces the chained .replace() calls on a
# boolean Series; the resulting labels are the same.
workDataframe["ICS_ge8"] = (workDataframe["ICS_SOT_score"] >= 8).map({True: "yes", False: "no"})

# Contingency table of Clinical_success_14d by Cohort_Cazavi, with ICS_ge8
# passed as the cohort variable.
result = ExtendedContingencyTable(dataframe = workDataframe,
                                  classVariable = "Cohort_Cazavi",
                                  targetVariable = "Clinical_success_14d",
                                  cohortVariable = "ICS_ge8").run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S5a_raw.xlsx")
result

Unnamed: 0,Cohort-ICS_ge8,All,Cohort_Cazavi no,Cohort_Cazavi yes,P value
0,All,107/149 (71.81),40/66 (60.61),67/83 (80.72),0.011
1,no,62/68 (91.18),26/30 (86.67),36/38 (94.74),0.463
2,yes,45/81 (55.56),14/36 (38.89),31/45 (68.89),0.013


### Tabla S5.B

In [17]:
import pandas as pd

from pystats_utils.pipeline import ExtendedContingencyTable

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")

# .copy() makes workDataframe an independent frame, so adding the ICS_ge8
# column below does not write into a slice of `dataframe`
# (this avoids pandas' SettingWithCopyWarning).
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"].copy()

# Stratification flag: "yes" when ICS_SOT_score >= 8, "no" otherwise.
# A single explicit mapping replaces the chained .replace() calls on a
# boolean Series; the resulting labels are the same.
workDataframe["ICS_ge8"] = (workDataframe["ICS_SOT_score"] >= 8).map({True: "yes", False: "no"})

# Contingency table of Clinical_success_30d by Cohort_Cazavi, with ICS_ge8
# passed as the cohort variable.
result = ExtendedContingencyTable(dataframe = workDataframe,
                                  classVariable = "Cohort_Cazavi",
                                  targetVariable = "Clinical_success_30d",
                                  cohortVariable = "ICS_ge8").run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S5b_raw.xlsx")
result

Unnamed: 0,Cohort-ICS_ge8,All,Cohort_Cazavi no,Cohort_Cazavi yes,P value
0,All,109/149 (73.15),40/66 (60.61),69/83 (83.13),0.004
1,no,63/68 (92.65),26/30 (86.67),37/38 (97.37),0.226
2,yes,46/81 (56.79),14/36 (38.89),32/45 (71.11),0.007


### Tabla S5.C

In [18]:
import pandas as pd

from pystats_utils.pipeline import ExtendedContingencyTable

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")

# .copy() makes workDataframe an independent frame, so adding the ICS_ge8
# column below does not write into a slice of `dataframe`
# (this avoids pandas' SettingWithCopyWarning).
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"].copy()

# Stratification flag: "yes" when ICS_SOT_score >= 8, "no" otherwise.
# A single explicit mapping replaces the chained .replace() calls on a
# boolean Series; the resulting labels are the same.
workDataframe["ICS_ge8"] = (workDataframe["ICS_SOT_score"] >= 8).map({True: "yes", False: "no"})

# Contingency table of Mortality_31d by Cohort_Cazavi, with ICS_ge8 passed as
# the cohort variable.
result = ExtendedContingencyTable(dataframe = workDataframe,
                                  classVariable = "Cohort_Cazavi",
                                  targetVariable = "Mortality_31d",
                                  cohortVariable = "ICS_ge8").run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S5c_raw.xlsx")
result

Unnamed: 0,Cohort-ICS_ge8,All,Cohort_Cazavi no,Cohort_Cazavi yes,P value
0,All,29/149 (19.46),18/66 (27.27),11/83 (13.25),0.053
1,no,2/68 (2.94),2/30 (6.67),0/38 (0.00),0.372
2,yes,27/81 (33.33),16/36 (44.44),11/45 (24.44),0.097


### Tabla S6

In [19]:
import pandas as pd
from pystats_utils.pipeline import LogisticExploration

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Run LogisticExploration with Clinical_success_14d as class variable; the
# listed columns are passed as excludedVariables.
result = LogisticExploration(
    dataframe=workDataframe,
    classVariable="Clinical_success_14d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S6_raw.xlsx")
result

Unnamed: 0,Variable,OR(95CI),P value
0,Center_Code_Brasil_1,0.29 (0.11 - 0.75),0.011
1,Center_Code_Brasil_2,0.37 (0.09 - 1.55),0.173
2,Center_Code_Italy_1,1.22 (0.48 - 3.13),0.678
3,Center_Code_Italy_2,376156.84 (0.00 - inf),0.979
4,Center_Code_Italy_3,1.30 (0.44 - 3.81),0.631
...,...,...,...
161,Source_infection_Vascular_access_yes,0.52 (0.21 - 1.28),0.154
162,Source_infection_other_no,0.50 (0.06 - 4.39),0.530
163,Source_infection_other_yes,2.01 (0.23 - 17.73),0.530
164,ps_cvsb,6.18 (1.28 - 29.81),0.023


### Tabla S7

In [20]:
import pandas as pd
from pystats_utils.pipeline import LogisticExploration

# Load the database and keep only the rows whose Cohort_Treatment is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Run LogisticExploration with Clinical_success_30d as class variable; the
# listed columns are passed as excludedVariables.
result = LogisticExploration(
    dataframe=workDataframe,
    classVariable="Clinical_success_30d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S7_raw.xlsx")
result

Unnamed: 0,Variable,OR(95CI),P value
0,Center_Code_Brasil_1,0.27 (0.10 - 0.69),0.006
1,Center_Code_Brasil_2,0.34 (0.08 - 1.44),0.144
2,Center_Code_Italy_1,1.12 (0.44 - 2.89),0.807
3,Center_Code_Italy_2,351420.90 (0.00 - inf),0.979
4,Center_Code_Italy_3,1.20 (0.41 - 3.53),0.735
...,...,...,...
160,Source_infection_Vascular_access_yes,0.48 (0.19 - 1.18),0.108
161,Source_infection_other_no,0.53 (0.06 - 4.71),0.572
162,Source_infection_other_yes,1.88 (0.21 - 16.56),0.572
163,ps_cvsb,8.62 (1.69 - 43.84),0.009


### Tabla S8

In [21]:
import pandas as pd
from pystats_utils.pipeline import CoxExploration

# NOTE(review): this cell reads database_ps.xlsx, whereas the other cells
# visible in this notebook read database.xlsx — confirm this is intentional.
dataframe = pd.read_excel("./test/database/database_ps.xlsx")

# Keep only the rows whose Cohort_Treatment is "yes".
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]

# Run CoxExploration with Mortality_31d as event and Time2death_31d as time;
# the listed columns are passed as excludedVariables.
result = CoxExploration(
    dataframe=workDataframe,
    eventVariable="Mortality_31d",
    timeVariable="Time2death_31d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S8_raw.xlsx")
result

Unnamed: 0,Variable,HR(95CI),P value
0,Center_Code_Brasil_1,3.88 (1.80 - 8.35,0.001
1,Center_Code_Brasil_2,3.82 (1.33 - 11.01,0.013
2,Center_Code_Italy_1,0.29 (0.07 - 1.23,0.093
3,Center_Code_Italy_2,0.00 (0.00 - inf,0.996
4,Center_Code_Italy_3,0.69 (0.21 - 2.28,0.542
...,...,...,...
172,Source_infection_Vascular_access_yes,2.67 (1.22 - 5.87,0.014
173,Source_infection_other_no,8635894.90 (0.00 - inf,0.995
174,Source_infection_other_yes,0.00 (0.00 - inf,0.995
175,ps_cvsb,0.23 (0.05 - 1.10,0.066


### Tabla S9.A

In [22]:
import pandas as pd

from pystats_utils.pipeline import ExtendedContingencyTable

# Load the database and keep only the rows whose Cohort_Cazavi is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")

# .copy() makes workDataframe an independent frame, so adding the ICS_ge8
# column below does not write into a slice of `dataframe`
# (this avoids pandas' SettingWithCopyWarning).
workDataframe = dataframe[dataframe["Cohort_Cazavi"] == "yes"].copy()

# Stratification flag: "yes" when ICS_SOT_score >= 8, "no" otherwise.
# A single explicit mapping replaces the chained .replace() calls on a
# boolean Series; the resulting labels are the same.
workDataframe["ICS_ge8"] = (workDataframe["ICS_SOT_score"] >= 8).map({True: "yes", False: "no"})

# Contingency table of Clinical_success_14d by Cohort_Combi, with ICS_ge8
# passed as the cohort variable.
result = ExtendedContingencyTable(dataframe = workDataframe,
                                  classVariable = "Cohort_Combi",
                                  targetVariable = "Clinical_success_14d",
                                  cohortVariable = "ICS_ge8").run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S9a_raw.xlsx")
result


Unnamed: 0,Cohort-ICS_ge8,All,Cohort_Combi no,Cohort_Combi yes,P value
0,All,67/83 (80.72),53/67 (79.10),14/16 (87.50),0.68
1,no,36/38 (94.74),30/31 (96.77),6/7 (85.71),0.805
2,yes,31/45 (68.89),23/36 (63.89),8/9 (88.89),0.295


### Tabla S9.B

In [23]:
import pandas as pd

from pystats_utils.pipeline import ExtendedContingencyTable

# Load the database and keep only the rows whose Cohort_Cazavi is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")

# .copy() makes workDataframe an independent frame, so adding the ICS_ge8
# column below does not write into a slice of `dataframe`
# (this avoids pandas' SettingWithCopyWarning).
workDataframe = dataframe[dataframe["Cohort_Cazavi"] == "yes"].copy()

# Stratification flag: "yes" when ICS_SOT_score >= 8, "no" otherwise.
# A single explicit mapping replaces the chained .replace() calls on a
# boolean Series; the resulting labels are the same.
workDataframe["ICS_ge8"] = (workDataframe["ICS_SOT_score"] >= 8).map({True: "yes", False: "no"})

# Contingency table of Clinical_success_30d by Cohort_Combi, with ICS_ge8
# passed as the cohort variable.
result = ExtendedContingencyTable(dataframe = workDataframe,
                                  classVariable = "Cohort_Combi",
                                  targetVariable = "Clinical_success_30d",
                                  cohortVariable = "ICS_ge8").run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S9b_raw.xlsx")
result

Unnamed: 0,Cohort-ICS_ge8,All,Cohort_Combi no,Cohort_Combi yes,P value
0,All,69/83 (83.13),54/67 (80.60),15/16 (93.75),0.373
1,no,37/38 (97.37),30/31 (96.77),7/7 (100.00),1.0
2,yes,32/45 (71.11),24/36 (66.67),8/9 (88.89),0.366


### Tabla S9.C

In [24]:
import pandas as pd

from pystats_utils.pipeline import ExtendedContingencyTable

# Load the database and keep only the rows whose Cohort_Cazavi is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")

# .copy() makes workDataframe an independent frame, so adding the ICS_ge8
# column below does not write into a slice of `dataframe`
# (this avoids pandas' SettingWithCopyWarning).
workDataframe = dataframe[dataframe["Cohort_Cazavi"] == "yes"].copy()

# Stratification flag: "yes" when ICS_SOT_score >= 8, "no" otherwise.
# A single explicit mapping replaces the chained .replace() calls on a
# boolean Series; the resulting labels are the same.
workDataframe["ICS_ge8"] = (workDataframe["ICS_SOT_score"] >= 8).map({True: "yes", False: "no"})

# Contingency table of Mortality_31d by Cohort_Combi, with ICS_ge8 passed as
# the cohort variable.
result = ExtendedContingencyTable(dataframe = workDataframe,
                                  classVariable = "Cohort_Combi",
                                  targetVariable = "Mortality_31d",
                                  cohortVariable = "ICS_ge8").run()

# Export the raw table, then show it as the cell output.
result.to_excel("tabla_S9c_raw.xlsx")
result

Unnamed: 0,Cohort-ICS_ge8,All,Cohort_Combi no,Cohort_Combi yes,P value
0,All,11/83 (13.25),10/67 (14.93),1/16 (6.25),0.611
1,no,0/38 (0.00),0/31 (0.00),0/7 (0.00),1.0
2,yes,11/45 (24.44),10/36 (27.78),1/9 (11.11),0.544


### Tabla S10.A

In [25]:
import pandas as pd
from pystats_utils.test.multivariant import LogisticRegression

# Load the database and keep only the rows whose Cohort_Cazavi is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Cazavi"].eq("yes")]

# Predictors handed to the model.
targetVariable = ["Gender", "ICS_SOT_score", "Cohort_Combi", "ps_cvsm"]

# Run LogisticRegression with Clinical_success_14d as class variable.
result = LogisticRegression(
    dataframe=workDataframe,
    classVariable="Clinical_success_14d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_S10a_params_raw.xlsx")
result.summary.to_excel("tabla_S10a_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aOR,CI 2.5%,CI 97.5%,P value,Coef,Raw CI 2.5%,Raw CI 97.5%,Standard Err.
0,Intercept,15.568647,2.781923,87.127786,0.001782,2.745259,1.023142,4.467376,0.878647
1,ICS_SOT_score,0.793415,0.666745,0.94415,0.009119,-0.231409,-0.405348,-0.05747,0.088746
2,ps_cvsm,0.573863,0.014377,22.905275,0.767806,-0.555365,-4.242096,3.131367,1.88102
3,Gender_male,3.075491,0.724568,13.054189,0.127718,1.123464,-0.32218,2.569109,0.737587
4,Cohort_Combi_yes,1.77386,0.252089,12.482015,0.564782,0.573158,-1.377972,2.524289,0.995493


In [26]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_S10a_metrics_raw.xlsx).
result.summary

Unnamed: 0,Value,CI 2.5%,CI 97.5%
Area under curve ROC,0.753846,0.597799,0.909894
Best Cutoff,0.781876,0.703484,0.860268
Accuracy,0.708861,0.607419,0.810303
Error,0.291139,0.189697,0.392581
Precision,0.92,0.842543,0.997457
Recall,0.707692,0.594334,0.821051
F1,0.8,0.717474,0.882526
Sensitivity,0.707692,0.594334,0.821051
Specificity,0.714286,0.474516,0.954055
PPV,0.92,0.842543,0.997457


### Tabla S10.B

In [27]:
import pandas as pd
from pystats_utils.test.multivariant import LogisticRegression

# Load the database and keep only the rows whose Cohort_Cazavi is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Cazavi"].eq("yes")]

# Predictors handed to the model.
targetVariable = ["Gender", "ICS_SOT_score", "Cohort_Combi", "ps_cvsm"]

# Run LogisticRegression with Clinical_success_30d as class variable.
result = LogisticRegression(
    dataframe=workDataframe,
    classVariable="Clinical_success_30d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_S10b_params_raw.xlsx")
result.summary.to_excel("tabla_S10b_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aOR,CI 2.5%,CI 97.5%,P value,Coef,Raw CI 2.5%,Raw CI 97.5%,Standard Err.
0,Intercept,24.8998,3.409957,181.820512,0.001528,3.21486,1.2267,5.20302,1.014386
1,ICS_SOT_score,0.749022,0.608459,0.922056,0.006426,-0.288987,-0.496825,-0.081149,0.106042
2,ps_cvsm,0.247696,0.003918,15.658846,0.509488,-1.395553,-5.542141,2.751036,2.115645
3,Gender_male,5.27715,1.04059,26.76205,0.044644,1.663386,0.039788,3.286985,0.828382
4,Cohort_Combi_yes,4.523048,0.377051,54.257877,0.233837,1.509186,-0.975376,3.993748,1.267657


In [28]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_S10b_metrics_raw.xlsx).
result.summary

Unnamed: 0,Value,CI 2.5%,CI 97.5%
Area under curve ROC,0.799751,0.655509,0.943994
Best Cutoff,0.874328,0.786362,0.962295
Accuracy,0.658228,0.556262,0.760194
Error,0.341772,0.239806,0.443738
Precision,0.934783,0.863294,1.0
Recall,0.641791,0.528623,0.754959
F1,0.761062,0.674897,0.847227
Sensitivity,0.641791,0.528623,0.754959
Specificity,0.75,0.48722,1.0
PPV,0.934783,0.863294,1.0


### Tabla S10.C

In [29]:
import pandas as pd
from pystats_utils.test.multivariant import CoxPhRegression

# Load the database and keep only the rows whose Cohort_Cazavi is "yes".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Cazavi"].eq("yes")]

# Predictors handed to the model.
targetVariable = ["Gender", "Age", "ICS_SOT_score", "Cohort_Combi", "ps_cvsm"]

# Run CoxPhRegression with Mortality_31d as event and Time2death_31d as time.
result = CoxPhRegression(
    dataframe=workDataframe,
    eventVariable="Mortality_31d",
    timeVariable="Time2death_31d",
    targetVariable=targetVariable,
).run()

# Export parameters and metrics, then show the parameter table.
result.params.to_excel("tabla_S10c_params_raw.xlsx")
result.summary.to_excel("tabla_S10c_metrics_raw.xlsx")
result.params

Unnamed: 0,Predictor,aHR,CI 2.5%,CI 97.5%,P values,Raw Coef,Raw CI 2.5%,Raw CI 97.5%,Std Error
Age,Age,1.001658,0.943332,1.06359,0.956843,0.001656,-0.058337,0.06165,0.030609
ICS_SOT_score,ICS_SOT_score,1.355165,1.10116,1.667763,0.004106,0.303923,0.096364,0.511483,0.1059
ps_cvsm,ps_cvsm,3.950079,0.053944,289.247031,0.530595,1.373736,-2.91981,5.667281,2.190625
Gender_male,Gender_male,0.120098,0.024505,0.588587,0.00896,-2.11945,-3.708869,-0.53003,0.810943
Cohort_Combi_yes,Cohort_Combi_yes,0.31687,0.033062,3.036932,0.318939,-1.149265,-3.409378,1.110848,1.15314


In [30]:
# Show the summary table of `result`. This relies on `result` left by the
# preceding cell (the same table that cell writes to tabla_S10c_metrics_raw.xlsx).
result.summary

Unnamed: 0,Values
Concordance,0.818057
Partial AIC,80.975273
Partial log-likelihood,-35.487636
Log-likelihood ratio statistic,15.225826
Log-likelihood ratio df,5.0
Log-likelihood ratio p value,0.00944
Log-likelihood ratio -log2(p),6.727033


## Tablas sin numerar

### Tabla KPC Éxito clínico 14 días

In [31]:
import pandas as pd
from pystats_utils.pipeline import LogisticExploration

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows whose Carbapenemase is "KPC".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["Carbapenemase"].eq("KPC")]

# Run LogisticExploration with Clinical_success_14d as class variable; the
# listed columns are passed as excludedVariables.
result = LogisticExploration(
    dataframe=workDataframe,
    classVariable="Clinical_success_14d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export only; this cell does not display the table.
result.to_excel("tabla_kpc_cs14d_raw.xlsx")

### Tabla KPC Éxito clínico 30 días

In [32]:
import pandas as pd
from pystats_utils.pipeline import LogisticExploration

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows whose Carbapenemase is "KPC".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["Carbapenemase"].eq("KPC")]

# Run LogisticExploration with Clinical_success_30d as class variable; the
# listed columns are passed as excludedVariables.
result = LogisticExploration(
    dataframe=workDataframe,
    classVariable="Clinical_success_30d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export only; this cell does not display the table.
result.to_excel("tabla_kpc_cs30d_raw.xlsx")

### Tabla KPC Mortalidad 30 días

In [33]:
import pandas as pd
from pystats_utils.pipeline import CoxExploration

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows whose Carbapenemase is "KPC".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["Carbapenemase"].eq("KPC")]

# Run CoxExploration with Mortality_31d as event and Time2death_31d as time;
# the listed columns are passed as excludedVariables.
result = CoxExploration(
    dataframe=workDataframe,
    eventVariable="Mortality_31d",
    timeVariable="Time2death_31d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export only; this cell does not display the table.
result.to_excel("tabla_kpc_m30d_raw.xlsx")

### Tabla OXA-48 Éxito clínico 14 días

In [34]:
import pandas as pd
from pystats_utils.pipeline import LogisticExploration

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows whose Carbapenemase is "OXA-48".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["Carbapenemase"].eq("OXA-48")]

# Run LogisticExploration with Clinical_success_14d as class variable; the
# listed columns are passed as excludedVariables.
result = LogisticExploration(
    dataframe=workDataframe,
    classVariable="Clinical_success_14d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export only; this cell does not display the table.
result.to_excel("tabla_oxa_cs14d_raw.xlsx")

### Tabla OXA-48 Éxito clínico 30 días

In [35]:
import pandas as pd
from pystats_utils.pipeline import LogisticExploration

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows whose Carbapenemase is "OXA-48".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["Carbapenemase"].eq("OXA-48")]

# Run LogisticExploration with Clinical_success_30d as class variable; the
# listed columns are passed as excludedVariables.
result = LogisticExploration(
    dataframe=workDataframe,
    classVariable="Clinical_success_30d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export only; this cell does not display the table.
result.to_excel("tabla_oxa_cs30d_raw.xlsx")

### Tabla OXA-48 Mortalidad 30 días

In [36]:
import pandas as pd
from pystats_utils.pipeline import CoxExploration

# Load the database, keep rows whose Cohort_Treatment is "yes", then restrict
# to rows whose Carbapenemase is "OXA-48".
dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe.loc[dataframe["Cohort_Treatment"].eq("yes")]
workDataframe = workDataframe.loc[workDataframe["Carbapenemase"].eq("OXA-48")]

# Run CoxExploration with Mortality_31d as event and Time2death_31d as time;
# the listed columns are passed as excludedVariables.
result = CoxExploration(
    dataframe=workDataframe,
    eventVariable="Mortality_31d",
    timeVariable="Time2death_31d",
    excludedVariables=["Pt", "Caso_REC_3digitos", "Center"],
).run()

# Export only; this cell does not display the table.
result.to_excel("tabla_oxa_m30d_raw.xlsx")