In [1]:
import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
import seaborn as sns

In [2]:
import cooler
import bioframe

import cooltools

from packaging import version
# Fail fast when the installed cooltools is older than 0.5.2, the minimum
# version named in the error message below.
if version.parse(cooltools.__version__) < version.parse('0.5.2'):
    # Adjacent string literals are joined at parse time; the space after the
    # comma keeps the two clauses from running together ("higher,please").
    raise AssertionError(
        "tutorials rely on cooltools version 0.5.2 or higher, "
        "please check your cooltools version and update to the latest"
    )

In [4]:
# Reference-genome tables for hg38: chromosome sizes and centromere
# positions are fetched through bioframe and then combined into
# chromosome arms, which later cells pass as `view_df`.
assembly = 'hg38'
hg38_chromsizes = bioframe.fetch_chromsizes(assembly)
hg38_cens = bioframe.fetch_centromeres(assembly)
hg38_arms = bioframe.make_chromarms(hg38_chromsizes, hg38_cens)

In [4]:
# Resolution selected from every .mcool file: it is interpolated into the
# `::resolutions/<resolution>` part of each cooler URI in the cells below.
# The output TSV names label it as "10kb".
resolution = 10_000

In [3]:
# Absolute locations of the .mcool files for the first batch of samples
# (LuCaP35CR, LuCaP93, LuCaP145.2, LuCaP147 and NCI-H660). Each path is
# later combined with `::resolutions/{resolution}` to open one resolution.
# NOTE(review): these are hard-coded absolute paths under /projects/b1126 -
# presumably specific to one filesystem; adjust when running elsewhere.
lucap_35cr_path = "/projects/b1126/Viriya/hic/lucap/m1398/LuCaP35CR-Arima-allReps-filtered.mcool"
lucap_93_path = "/projects/b1126/Viriya/hic/lucap/m1399/LuCaP93-Arima-allReps-filtered.mcool"
lucap_145_path = "/projects/b1126/Viriya/hic/lucap/m1400/LuCaP145.2-Arima-allReps-filtered.mcool"
lucap_147_path = "/projects/b1126/Viriya/hic/lucap/m1401/LuCaP147-Arima-allReps-filtered.mcool"
nci_path = "/projects/b1126/Viriya/hic/lucap/m1402/NCI-H660-Arima-allReps-filtered.mcool"

In [5]:
# Open every first-batch .mcool at the shared `resolution`. The coolers are
# created in the same order as the names on the left-hand side.
lucap35, lucap93, lucap145, lucap147, nci = (
    cooler.Cooler(f'{mcool_path}::resolutions/{resolution}')
    for mcool_path in (
        lucap_35cr_path,
        lucap_93_path,
        lucap_145_path,
        lucap_147_path,
        nci_path,
    )
)

In [7]:
# Run cooltools.expected_cis on each first-batch cooler. All samples share
# the same settings: the hg38 chromosome-arm view, two worker processes and
# a chunk size of one million.
expected_cis_kwargs = dict(view_df=hg38_arms, nproc=2, chunksize=1_000_000)

expected_lucap35 = cooltools.expected_cis(lucap35, **expected_cis_kwargs)
expected_lucap93 = cooltools.expected_cis(lucap93, **expected_cis_kwargs)
expected_lucap145 = cooltools.expected_cis(lucap145, **expected_cis_kwargs)
expected_lucap147 = cooltools.expected_cis(lucap147, **expected_cis_kwargs)
expected_nci = cooltools.expected_cis(nci, **expected_cis_kwargs)

In [9]:
# Write each first-batch expected table to a tab-separated file in the
# current working directory, with a header row and without the index.
for tsv_name, expected_table in (
    ('expected_10kb_lucap35CR.tsv', expected_lucap35),
    ('expected_10kb_lucap93.tsv', expected_lucap93),
    ('expected_10kb_lucap145.tsv', expected_lucap145),
    ('expected_10kb_lucap147.tsv', expected_lucap147),
    ('expected_10kb_nci.tsv', expected_nci),
):
    expected_table.to_csv(tsv_name, sep='\t', index=False, header=True)

In [8]:
# Absolute locations of the .mcool files for the second batch of samples
# (LuCaP70CR, LuCaP77CR and LuCaP145.1). Each path is later combined with
# `::resolutions/{resolution}` to open one resolution.
# NOTE(review): hard-coded absolute paths under /projects/b1126 - presumably
# specific to one filesystem; adjust when running elsewhere.
lucap70cr_path = "/projects/b1126/Viriya/hic/lucap/m1494/LuCaP70CR-Arima-allReps-filtered.mcool"
lucap77cr_path = "/projects/b1126/Viriya/hic/lucap/m1528/LuCaP77CR-Arima-allReps-filtered.mcool"
lucap1451_path = "/projects/b1126/Viriya/hic/lucap/m1530/LuCaP145.1-Arima-allReps-filtered.mcool"

In [15]:
# Open every second-batch .mcool at the shared `resolution`. The coolers are
# created in the same order as the names on the left-hand side.
lucap77cr, lucap70cr, lucap1451 = (
    cooler.Cooler(f'{mcool_path}::resolutions/{resolution}')
    for mcool_path in (lucap77cr_path, lucap70cr_path, lucap1451_path)
)

In [16]:
# Run cooltools.expected_cis on each second-batch cooler. All samples share
# the same settings: the hg38 chromosome-arm view, two worker processes and
# a chunk size of one million.
expected_cis_kwargs = dict(view_df=hg38_arms, nproc=2, chunksize=1_000_000)

expected_lucap70cr = cooltools.expected_cis(lucap70cr, **expected_cis_kwargs)
expected_lucap77cr = cooltools.expected_cis(lucap77cr, **expected_cis_kwargs)
expected_lucap1451 = cooltools.expected_cis(lucap1451, **expected_cis_kwargs)

In [17]:
# Write each second-batch expected table to a tab-separated file in the
# current working directory, with a header row and without the index.
expected_lucap70cr.to_csv('expected_10kb_lucap70CR.tsv', sep='\t', index=False, header=True)
# The sample is LuCaP77CR, so the file name carries the full "CR" suffix like
# the other CR samples; it was previously written as "...lucap77R.tsv".
# NOTE(review): anything that reads the old "expected_10kb_lucap77R.tsv"
# name must be pointed at the corrected file.
expected_lucap77cr.to_csv('expected_10kb_lucap77CR.tsv', sep='\t', index=False, header=True)
expected_lucap1451.to_csv('expected_10kb_lucap1451.tsv', sep='\t', index=False, header=True)

In [15]:
# Absolute locations of the .mcool files for the third batch of samples
# (LuCaP86.2CR, LuCaP105CR, LuCaP147CR, LuCaP167CR and LuCaP173.1). Each
# path is later combined with `::resolutions/{resolution}` to open one
# resolution.
# NOTE(review): hard-coded absolute paths under /projects/b1126 - presumably
# specific to one filesystem; adjust when running elsewhere.
lucap862cr_path = "/projects/b1126/Viriya/hic/lucap/m1566/LuCaP86.2CR-Arima-allReps-filtered.mcool"
lucap105cr_path = "/projects/b1126/Viriya/hic/lucap/m1567/LuCaP105CR-Arima-allReps-filtered.mcool"
lucap147cr_path = "/projects/b1126/Viriya/hic/lucap/m1568/LuCaP147CR-Arima-allReps-filtered.mcool"
lucap167cr_path = "/projects/b1126/Viriya/hic/lucap/m1569/LuCaP167CR-Arima-allReps-filtered.mcool"
lucap1731_path = "/projects/b1126/Viriya/hic/lucap/m1570/LuCaP173.1-Arima-allReps-filtered.mcool"

In [24]:
# Open every third-batch .mcool at the shared `resolution`. The coolers are
# created in the same order as the names on the left-hand side.
lucap862cr, lucap105cr, lucap147cr, lucap167cr, lucap1731 = (
    cooler.Cooler(f'{mcool_path}::resolutions/{resolution}')
    for mcool_path in (
        lucap862cr_path,
        lucap105cr_path,
        lucap147cr_path,
        lucap167cr_path,
        lucap1731_path,
    )
)

In [25]:
# Run cooltools.expected_cis on each third-batch cooler. All samples share
# the same settings: the hg38 chromosome-arm view, two worker processes and
# a chunk size of one million.
expected_cis_kwargs = dict(view_df=hg38_arms, nproc=2, chunksize=1_000_000)

expected_lucap862cr = cooltools.expected_cis(lucap862cr, **expected_cis_kwargs)
expected_lucap105cr = cooltools.expected_cis(lucap105cr, **expected_cis_kwargs)
expected_lucap147cr = cooltools.expected_cis(lucap147cr, **expected_cis_kwargs)
expected_lucap167cr = cooltools.expected_cis(lucap167cr, **expected_cis_kwargs)
expected_lucap1731 = cooltools.expected_cis(lucap1731, **expected_cis_kwargs)

In [26]:
# Write each third-batch expected table to a tab-separated file in the
# current working directory, with a header row and without the index.
for tsv_name, expected_table in (
    ('expected_10kb_lucap86.2CR.tsv', expected_lucap862cr),
    ('expected_10kb_lucap105CR.tsv', expected_lucap105cr),
    ('expected_10kb_lucap147CR.tsv', expected_lucap147cr),
    ('expected_10kb_lucap167CR.tsv', expected_lucap167cr),
    ('expected_10kb_lucap173.1.tsv', expected_lucap1731),
):
    expected_table.to_csv(tsv_name, sep='\t', index=False, header=True)