# Preamble

This notebook contains generic imports and functions related to data analysis.
It can be included in another notebook by calling `%run '_preamble.ipynb'`.

In [1]:
# This is handled in '~/.ipython/profile_default/ipython_config.py'
# %load_ext autoreload
# %autoreload 2
%load_ext rpy2.ipython

# Standard library
import sys
import os, os.path
from datetime import datetime, timedelta

# Report the interpreter version as "major.minor.micro".
print('Python version: ' + '.'.join(map(str, sys.version_info[:3])))

# data science stuff
import numpy as np
print('NumPy version:', np.__version__)

import pandas as pd
# Use fully-qualified option names. pandas resolves option names by pattern
# matching, so the bare 'precision' only works while it matches exactly one
# option; it raises OptionError once 'styler.format.precision' exists as well
# (pandas >= 1.4).
pd.set_option('display.precision', 2)
pd.set_option('display.max_columns', 999)

print(f'Pandas version: {pd.__version__}')

# Visualisation
import altair as alt
from altair.expr import datum, if_
from altair import expr
# Activate the renderer registered under the name 'default'.
alt.renderers.enable('default')
# Alternative renderer, kept for reference (currently disabled):
# alt.renderers.enable('altair_saver', fmts=['vega-lite', 'png'])
# Presumably lifts Altair's limit on the number of rows a chart's dataset may
# contain -- TODO confirm against the Altair data-transformer documentation.
alt.data_transformers.disable_max_rows()

import matplotlib.pyplot as plt
%matplotlib inline
from IPython.display import HTML, Markdown

# Jupyter Notebook Tools
import data_science_tools as tools
from data_science_tools.boxes import info, warn, error
from data_science_tools.pandas import head, tail

# NCR/cancer-specific stuff
# import ncr

# Survival analysis!
from lifelines import CoxPHFitter, KaplanMeierFitter
from lifelines.utils import ConvergenceError
from sklearn.linear_model import LogisticRegression

# Statistics
from scipy import stats


# Ignore warnings
import warnings
# Installs a blanket "ignore" filter: from here on, warnings of every category
# (deprecation notices included) are silenced for the rest of the session.
warnings.simplefilter("ignore")
# NOTE(review): this repeats the 'display.max_columns' value already applied
# via pd.set_option earlier in this cell and is unrelated to warnings.
pd.options.display.max_columns = 999


Python version: 3.8.13
NumPy version: 1.20.3
Pandas version: 1.3.2


In [2]:
# Timestamp the run (weekday, dd-mm-yyyy, hh:mm) and leave one blank line after it.
print(f"This script was last run on {datetime.now():%A, %d-%m-%Y, %H:%M}", end="\n\n")

This script was last run on Monday, 14-06-2021, 09:07



In [3]:
# Module-level flag, initialised to False. Presumably set to True elsewhere
# once logging has been configured -- TODO confirm against the notebooks that
# %run this preamble.
logging_setup = False

In [4]:
# Show the directory the notebook is running from
print('Current working directory: "{}"\n'.format(os.getcwd()))

# Show the command for attaching a console to this kernel
__kernel_id = tools.jupyter.get_kernel_id()
print(
    'connect to this kernel with:',
    f'  jupyter console --existing {__kernel_id}',
    sep='\n',
    end='\n\n',
)

Current working directory: "/Users/melle/OneDrive/OneDrive - IKNL/04 - Projecten/Observational data for CER (internship)/src/giordano-melle"

connect to this kernel with:
  jupyter console --existing 50e9ec6c-5b09-4a7e-ade3-ad92c0b535d4



In [9]:
# Shared chart dimensions used as plotting defaults
# (presumably pixels -- confirm against the chart code).
plot_height, plot_width = 350, 400

# Presumably a running number for tables; starts at 1.
table_nr = 1