# Simplified survival analysis workflow for RENKU

#### 1. Setup

In [None]:
# General setup
%run lib/workflow
import os
wf = Workflow()

input_dataset_name = "counts"
results_dataset_name = "results"
input_dir = os.path.join("data", input_dataset_name)
if not os.path.exists(input_dir):
    os.makedirs(input_dir)
results_dir =  os.path.join("data/", results_dataset_name)

#### 2. Download counts data

Drag and drop the count data file into the project's `data/counts` directory using the JupyterLab web interface, or copy it there by any other method.

#### 3. Create a RENKU dataset for the counts data

In [None]:
# Create a RENKU dataset for the counts data
count_data_file = input("File :")
!sed -i "/\/data\/\*/d;/\/figs\/\*/d;/\*\.nb\.html/d" .gitignore
input_dataset_metadata = wf.dataset_create(dataset_name = input_dataset_name)
wf.dataset_add(dataset_name = input_dataset_name,
              file = count_data_file)

#### 4. Analyze the counts data

In [None]:
# Use the docker image packrat directory
!renku-r ln-packrat-lib -p . -s /home/rstudio/packrat -v -f
# Analyze the counts data using the lib/build_survival_curves.R script
wf.build_survival_curves(input_fp = count_data_file,
                        output = results_dir)

#### 5. Create a RENKU dataset for the analysis results

In [None]:
# Create a RENKU dataset for the analysis results
!sed -i "/\/data\/\*/d;/\/figs\/\*/d;/\*\.nb\.html/d" .gitignore
results_dataset_metadata = wf.dataset_create(dataset_name = results_dataset_name)
wf.dataset_add(dataset_name = results_dataset_name,
               file = results_dir)

#### 6. Save your work in RENKU!

In [None]:
%%bash -s "{input('Git commit message: ')}"
# The text typed at the prompt above is passed to this script as $1.
# Delete every .gitignore line that contains /data/*, /figs/* or *.nb.html.
sed -i "/\/data\/\*/d;/\/figs\/\*/d;/\*\.nb\.html/d" .gitignore
# Stage every change in the working tree, commit it with the given message,
# then push to the remote.
git add --all
git commit --message "$1"
git push