# Supplemental Tables

This Jupyter notebook reproduces a number of Supplemental Tables that are not included in any of the other notebooks. 

In [19]:
# (Re)load IPython's autoreload extension and use mode 2, which re-imports
# all modules before each cell is executed, so that edits to local source
# files are picked up without restarting the kernel.
%reload_ext autoreload
%autoreload 2

# Render matplotlib figures inline in the notebook output.
%matplotlib inline

# Put the project's source directory on the import path.
# NOTE(review): nothing from '../src' is imported in the cells visible here —
# confirm whether this is still required.
import sys
sys.path.append('../src')

from io import StringIO

import numpy as np
import pandas as pd

## Supplementary Table S2 - ILC insertions

Overview of all insertions identified by IM-Fusion in the ILC dataset.

In [36]:
# Maps column names found in the insertions file to the names used in the
# supplemental tables. Applied before the cosmetic renaming below, and shared
# by every insertion table written from this notebook.
insertion_column_map = {
    'transposon_anchor': 'feature_anchor',
    'id': 'insertion_id',  # previously misspelled as 'Iinsertion_id'
    'seqname': 'chromosome',
    'orientation': 'gene_orientation'
}

insertions_sb = (
    pd.read_csv('../data/processed/sb/star/insertions.txt', sep='\t')
      # Must reference the dict defined above; a bare `column_map` is not
      # defined anywhere and fails on a fresh kernel.
      .rename(columns=insertion_column_map)
      # Turn snake_case names into readable headers,
      # e.g. 'feature_anchor' -> 'Feature anchor'.
      .rename(columns=lambda c: c.replace('_', ' ').capitalize()))

# Write Supplementary Table S2 without the DataFrame index.
insertions_sb.to_excel('../reports/supplemental/tables/table_s2_insertions_sb.xlsx', index=False)

## Supplementary Table S3 - ILC CTGs

Overview of the commonly targeted genes (CTGs) identified by IM-Fusion in the ILC dataset.

In [2]:
# Load the CTG results for the ILC (SB) dataset.
ctgs = pd.read_csv('../data/processed/sb/star/ctgs.txt', sep='\t')

# Human-readable labels for the numeric differential-expression direction.
direction_labels = {-1: 'down', 1: 'up'}

# Presentation names for the columns kept in the overview table.
ctg_column_labels = {
    'gene_name': 'Gene',
    'p_value': 'CTG p-value',
    'q_value': 'CTG q-value',
    'n_samples': 'Num. samples',
    'de_pvalue': 'DE p-value',
    'de_direction': 'DE direction',
}

ctg_overview = (
    ctgs
    # Replace -1 / 1 with 'down' / 'up'.
    .assign(de_direction=ctgs['de_direction'].map(direction_labels))
    # Drop the columns that are not shown in the overview.
    .drop(columns=['de_test', 'gene_id'])
    .rename(columns=ctg_column_labels)
)

ctg_overview.head()

Unnamed: 0,Gene,CTG p-value,CTG q-value,Num. samples,DE p-value,DE direction
0,Ppp1r12a,2.136308e-99,7.370264e-97,41,4.9282890000000006e-17,down
1,Trps1,3.81343e-95,1.315633e-92,44,5.408386e-16,down
2,Fgfr2,5.90285e-70,2.036483e-67,52,0.1051432,up
3,Myh9,9.094464e-70,3.13759e-67,27,1.927143e-08,down
4,Trp53bp2,2.548673e-27,8.792922e-25,12,4.034261e-07,up


## Supplementary Table S5 - B-ALL insertions

Overview of all insertions identified by IM-Fusion in the B-ALL dataset.

In [39]:
insertions_sanger = (
    pd.read_csv('../data/processed/sanger/star/insertions.txt', sep='\t')
      # Reuse the column mapping defined in the Table S2 cell; a bare
      # `column_map` is not defined anywhere and fails on a fresh kernel.
      .rename(columns=insertion_column_map)
      # Turn snake_case names into readable headers,
      # e.g. 'gene_orientation' -> 'Gene orientation'.
      .rename(columns=lambda c: c.replace('_', ' ').capitalize()))

# Write Supplementary Table S5 without the DataFrame index.
insertions_sanger.to_excel('../reports/supplemental/tables/table_s5_insertions_sanger.xlsx', index=False)