# Etapa 3: Análisis de supervivencia

In [None]:
# Mount Google Drive at /content/drive (requires the Google Colab runtime).
from google.colab import drive
drive.mount('/content/drive')

# Switch the working directory to the TFM project folder on the mounted
# drive; the relative paths used later in the notebook depend on this.
%cd /content/drive/MyDrive/TFM

In [None]:
# Install lifelines into the runtime; the notebook imports
# KaplanMeierFitter from this package.
!pip install lifelines

In [None]:
# Importamos módulos necesarios.
import pandas as pd
import numpy as np

import matplotlib.pyplot as plt
import seaborn as sns
from lifelines import KaplanMeierFitter

from utils import read_data

# DataFrame display configuration: opt in to pandas' future
# "no silent downcasting" behaviour and remove the limits on how many
# columns and rows are rendered.
pd.options.future.no_silent_downcasting = True
pd.options.display.max_columns = None
pd.options.display.max_rows = None

# Apply seaborn's default theme to the plots.
sns.set_theme()

# Directory holding the source files.
input_path = 'data/processed/'

In [None]:
# Load every table from input_path. The file stems are listed in the same
# order as the variables they are unpacked into, so each variable receives
# the contents of the CSV that shares its name.
(
    demographic,
    diagnosis_prior,
    diagnosis_primary,
    diagnosis_other,
    diagnosis_type,
    treatment_ebrt,
    treatment_chemo,
    treatment_type,
    mutation_gene,
) = (
    read_data(f'{input_path}{stem}.csv')
    for stem in (
        'demographic',
        'diagnosis_prior',
        'diagnosis_primary',
        'diagnosis_other',
        'diagnosis_type',
        'treatment_ebrt',
        'treatment_chemo',
        'treatment_type',
        'mutation_gene',
    )
)

In [None]:
# Fit a Kaplan-Meier estimator on the whole cohort: durations come from the
# 'Overall Survival' column and the event indicator from 'Vital Status'.
# NOTE(review): assumes 'Vital Status' is 1/True when the death was observed
# and 0/False when the record is censored -- confirm against preprocessing.
kmf = KaplanMeierFitter()
kmf.fit(demographic['Overall Survival'], event_observed=demographic['Vital Status'])

# median_survival_time_ is the MEDIAN (time at which the estimated survival
# probability reaches 0.5), not the mean, so the message is labelled as such.
# lifelines reports an infinite median when the curve never drops to 0.5;
# print an explicit "not reached" message instead of "inf días".
median_survival = kmf.median_survival_time_
if np.isfinite(median_survival):
    print(f'Mediana del tiempo de supervivencia: {median_survival:.0f} días\n')
else:
    print('Mediana del tiempo de supervivencia: no alcanzada\n')

# Draw the survival curve with its confidence band and censoring marks on a
# new 10x6 figure (kmf.plot draws on the current axes).
plt.figure(figsize=(10, 6))

kmf.plot(label="Curva de Supervivencia", ci_show=True, color='blue', show_censors=True)

plt.title('Curva de Supervivencia de Kaplan-Meier')
plt.xlabel('Días')
plt.ylabel('Probabilidad de Supervivencia')
plt.show()