# INCREMENT-SOT CAZ-AVI

Análisis estadístico para la cohort **INCREMENT-SOT CAZ-AVI** para el estudio retrospectivo del tratamiento con CAZ-AVI frente al resto de terapias disponibles en diferentes centros.

## Control por Propensity-score

### Tratamiento BAT vs Tratamiento CAZ-AVI

In [3]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.test.multivariant import LogisticRegression

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Cohort_Cazavi",
                            targetVariables = ["Age", "Gender",
                                               "Biliary_stenosis", "CMV_disease",
                                               "Kidney_disease", "Post_transplant_dialysis",
                                               "Score_Charlson_AMN", "Acquisition",
                                               "SIRS_SevereORSchock", "Pitt_Score",
                                               "Source_infection_Urinary_tract",
                                               "Source_infection_Pneumonia",
                                               "SourceControl_before30days", "Surgical_debridement",
                                               "Carbapenemase", "Removal_Replacement_vascular_line",
                                               "Myocardial_Infarct", "Diabetes_Mellitus",
                                               "Chronic_Pulmonary_Disease"]).run()

result.prediction.name = "ps_cvsb"
dataframe = dataframe.join(result.prediction)
dataframe.to_excel("./test/database/database_ps.xlsx")

Optimization terminated successfully.
         Current function value: 0.550326
         Iterations 6


### Tratamiento CAZ-AVI mono vs Tratamiento CAZ-AVI combi

In [4]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Cazavi"] == "yes"]

from pystats_utils.test.multivariant import LogisticRegression

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Cohort_Combi",
                            targetVariables = ["Age", "Gender",
                                               "Biliary_stenosis", "CMV_disease",
                                               "Kidney_disease", "Post_transplant_dialysis",
                                               "Score_Charlson_AMN", "Acquisition",
                                               "SIRS_SevereORSchock", "Pitt_Score",
                                               "Source_infection_Urinary_tract",
                                               "Source_infection_Pneumonia",
                                               "SourceControl_before30days", "Surgical_debridement",
                                               "Carbapenemase", "Removal_Replacement_vascular_line",
                                               "Myocardial_Infarct", "Diabetes_Mellitus",
                                               "Chronic_Pulmonary_Disease"]).run()

result.prediction.name = "ps_cvsm"
dataframe = dataframe.join(result.prediction)
dataframe.to_excel("./test/database/database_ps.xlsx")

         Current function value: 0.357314
         Iterations: 35


  result = func(self.values, **kwargs)


## Tablas

### Tabla 1

In [9]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.pipeline import BivariantTable

result = BivariantTable(dataframe = workDataframe,
                        classVariable = "Cohort_Cazavi",
                        excludedVariables = ["Pt", "ps_cvsm", "Caso_REC_3digitos"]).run()

result.to_excel("tabla_1_raw.xlsx")

### Tabla 2.A

In [10]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.test.multivariant import LogisticRegression

targetVariables = ["Gender",
                   "ICS_SOT_score",
                   "Cohort_Cazavi",
                   "ps_cvsb"]

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Clinical_success_14d",
                            targetVariables = targetVariables).run()

result.params.to_excel("tabla_2a_params_raw.xlsx")
result.summary.to_excel("tabla_2a_metrics_raw.xlsx")

Optimization terminated successfully.
         Current function value: 0.441070
         Iterations 6


### Tabla 2.B

In [5]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]
workDataframe = workDataframe[dataframe["ICS_SOT_score"] >= 8]

from pystats_utils.test.multivariant import LogisticRegression

targetVariables = ["Gender",
                   "Cohort_Cazavi",
                   "ps_cvsb"]

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Clinical_success_14d",
                            targetVariables = targetVariables).run()

result.params.to_excel("tabla_2b_params_raw.xlsx")
result.summary.to_excel("tabla_2b_metrics_raw.xlsx")

  workDataframe = workDataframe[dataframe["ICS_SOT_score"] >= 8]


### Tabla 3.A

In [12]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.test.multivariant import LogisticRegression

targetVariables = ["Gender",
                   "ICS_SOT_score",
                   "Cohort_Cazavi",
                   "ps_cvsb"]

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Clinical_success_30d",
                            targetVariables = targetVariables).run()

result.params.to_excel("tabla_3a_params_raw.xlsx")
result.summary.to_excel("tabla_3a_metrics_raw.xlsx")

Optimization terminated successfully.
         Current function value: 0.443584
         Iterations 6


### Tabla 3.B

In [6]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]
workDataframe = workDataframe[dataframe["ICS_SOT_score"] >= 8]

from pystats_utils.test.multivariant import LogisticRegression

targetVariables = ["Gender",
                   "Cohort_Cazavi",
                   "ps_cvsb"]

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Clinical_success_30d",
                            targetVariables = targetVariables).run()

result.params.to_excel("tabla_3b_params_raw.xlsx")
result.summary.to_excel("tabla_3b_metrics_raw.xlsx")

  workDataframe = workDataframe[dataframe["ICS_SOT_score"] >= 8]


### Tabla 4.A

In [3]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.test.multivariant import CoxPhRegression

targetVariables = ["Gender",
                   "ICS_SOT_score",
                   "Cohort_Cazavi",
                   "ps_cvsb"]

result = CoxPhRegression(dataframe = workDataframe,
                         eventVariable = "Mortality_31d",
                         timeVariable = "Time2death_31d",
                         targetVariables = targetVariables).run()

result.params.to_excel("tabla_4a_raw.xlsx")


0,1
model,lifelines.CoxPHFitter
duration col,'Time2death_31d'
event col,'Mortality_31d'
baseline estimation,breslow
number of observations,140
number of events observed,28
partial log-likelihood,-123.09
time fit was run,2022-11-04 02:10:46 UTC

Unnamed: 0,coef,exp(coef),se(coef),coef lower 95%,coef upper 95%,exp(coef) lower 95%,exp(coef) upper 95%,cmp to,z,p,-log2(p)
ICS_SOT_score,0.16,1.18,0.04,0.08,0.25,1.08,1.28,0.0,3.68,<0.005,12.06
ps_cvsb,-0.41,0.66,1.0,-2.38,1.55,0.09,4.73,0.0,-0.41,0.68,0.55
Gender_male,-0.85,0.43,0.41,-1.65,-0.06,0.19,0.94,0.0,-2.1,0.04,4.82
Cohort_Cazavi_yes,-0.48,0.62,0.48,-1.42,0.46,0.24,1.58,0.0,-1.0,0.32,1.66

0,1
Concordance,0.77
Partial AIC,254.19
log-likelihood ratio test,24.75 on 4 df
-log2(p) of ll-ratio test,14.11


TypeError: 'DataFrame' object is not callable

### Tabla 4.B

In [2]:
result.params

Unnamed: 0,aHR,CI 2.5%,CI 97.5%,P values,Raw Coef,Raw CI 2.5%,Raw CI 97.5%,Std Error
ps_cvsb,0.654769,0.102804,4.170301,0.653944,-0.423473,-2.274935,1.427988,0.944641
Gender_male,0.55858,0.260286,1.198726,0.134985,-0.582357,-1.345974,0.181259,0.389607
Cohort_Cazavi_yes,0.47193,0.191929,1.160417,0.10187,-0.750924,-1.650628,0.14878,0.459041


## Tablas suplementarias

### Tabla S1

0    1
1    2
2    3
dtype: int64

### Tabla S6

In [2]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.pipeline import LogisticExploration

result = LogisticExploration(dataframe = workDataframe,
                             classVariable = "Clinical_success_14d",
                             excludedVariables = ["Pt", "Caso_REC_3digitos",
                                                  "Center"]).run()

result.to_excel("tabla_S6_raw.xlsx")

  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  result = func(self.values, **kwargs)
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  result = func(self.values, **kwargs)
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  result = func(self.values, **kwargs)
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _

### Tabla S7

In [3]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Treatment"] == "yes"]

from pystats_utils.pipeline import LogisticExploration

result = LogisticExploration(dataframe = workDataframe,
                             classVariable = "Clinical_success_30d",
                             excludedVariables = ["Pt", "Caso_REC_3digitos",
                                                  "Center"]).run()

result.to_excel("tabla_S7_raw.xlsx")

  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  result = func(self.values, **kwargs)
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  result = func(self.values, **kwargs)
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, len(result))
  _warn_prf(average, modifier, msg_start, 

### Tabla S10.A

In [7]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Cazavi"] == "yes"]


from pystats_utils.test.multivariant import LogisticRegression

targetVariables = ["Gender",
                   "ICS_SOT_score",
                   "Cohort_Combi",
                   "ps_cvsb"]

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Clinical_success_30d",
                            targetVariables = targetVariables).run()

result.params.to_excel("tabla_S10a_params_raw.xlsx")
result.summary.to_excel("tabla_S10a_metrics_raw.xlsx")

### Tabla S10.B

In [8]:
import pandas as pd

dataframe = pd.read_excel("./test/database/database_ps.xlsx")
workDataframe = dataframe[dataframe["Cohort_Cazavi"] == "yes"]
workDataframe = workDataframe[workDataframe["ICS_SOT_score"] >= 8]

from pystats_utils.test.multivariant import LogisticRegression

targetVariables = ["Gender",
                   "Cohort_Combi",
                   "ps_cvsb"]

result = LogisticRegression(dataframe = workDataframe,
                            classVariable = "Clinical_success_30d",
                            targetVariables = targetVariables).run()

result.params.to_excel("tabla_S10b_params_raw.xlsx")
result.summary.to_excel("tabla_S10b_metrics_raw.xlsx")