In [1]:
import giraffe
import numpy as np
import pandas as pd

# BRCA
## Loading the data

In [14]:
def gene_to_name(gene):
    """Return the first 15 characters of a gene identifier."""
    # NOTE(review): presumably this strips a version suffix from the IDs — confirm.
    return gene[:15]


# Case and control expression tables; the first CSV column becomes the row index.
expression_case = pd.read_csv("BRCA_case.csv", index_col=0)
expression_control = pd.read_csv("BRCA_nat.csv", index_col=0)

# Relabel the rows with the truncated identifiers.
expression_case.index = [gene_to_name(label) for label in expression_case.index]
expression_control.index = [gene_to_name(label) for label in expression_control.index]

# Order the rows by label so later cells see both tables in the same order.
expression_case = expression_case.sort_index()
expression_control = expression_control.sort_index()

In [18]:
# Motif prior; its row labels are matched against the expression row labels below.
motif = pd.read_csv("cancer_breast_otter_motif.csv", index_col=0).sort_index()

# Keep only genes present in the motif prior AND in both expression tables.
# Filtering the motif against the case table alone would leave the control
# table with a different set of rows whenever case and control genes differ.
genes_in_all = (
    motif.index.isin(expression_case.index)
    & motif.index.isin(expression_control.index)
)
motif = motif.loc[genes_in_all, :]
expression_case = expression_case.loc[expression_case.index.isin(motif.index), :]
expression_control = expression_control.loc[expression_control.index.isin(motif.index), :]

# The tables are later passed on via .to_numpy(), which drops the labels, so
# the row labels (and their order) must agree exactly at this point.
assert expression_case.index.equals(motif.index), \
    "case expression rows do not match motif rows (duplicate or missing gene labels?)"
assert expression_control.index.equals(motif.index), \
    "control expression rows do not match motif rows (duplicate or missing gene labels?)"

# NOTE(review): ppi is not reordered here; its row/column order is assumed to
# match motif.columns — confirm against the input files.
ppi = pd.read_csv("cancer_breast_otter_ppi.csv", index_col=0)

## Inferring GIRAFFE GRNs

In [26]:
# Run GIRAFFE on the case expression table together with the motif and PPI
# tables; all three are handed over as plain NumPy arrays (labels are dropped).
R_case = giraffe.Giraffe(
    expression_case.to_numpy(),
    motif.to_numpy(),
    ppi.to_numpy(),
).get_regulation()

In [29]:
# Run GIRAFFE on the control expression table with the same motif and PPI
# tables; all three are handed over as plain NumPy arrays (labels are dropped).
R_control = giraffe.Giraffe(
    expression_control.to_numpy(),
    motif.to_numpy(),
    ppi.to_numpy(),
).get_regulation()

In [38]:
# Re-attach the motif table's row and column labels to the case network and
# write it out as a tab-separated file.
(
    pd.DataFrame(R_case, index=motif.index, columns=motif.columns)
    .to_csv("data/brca/network_case.tsv", sep="\t")
)

In [39]:
# Re-attach the motif table's row and column labels to the control network and
# write it out as a tab-separated file.
(
    pd.DataFrame(R_control, index=motif.index, columns=motif.columns)
    .to_csv("data/brca/network_control.tsv", sep="\t")
)

# CESC
## Loading the data

In [2]:
def gene_to_name(gene):
    """Return the first 15 characters of a gene identifier."""
    # NOTE(review): presumably this strips a version suffix from the IDs — confirm.
    return gene[:15]


# Case and control expression tables; the first CSV column becomes the row index.
expression_case = pd.read_csv("CESC_case.csv", index_col=0)
expression_control = pd.read_csv("CESC_nat.csv", index_col=0)

# Relabel the rows with the truncated identifiers.
expression_case.index = [gene_to_name(label) for label in expression_case.index]
expression_control.index = [gene_to_name(label) for label in expression_control.index]

# Order the rows by label so later cells see both tables in the same order.
expression_case = expression_case.sort_index()
expression_control = expression_control.sort_index()

In [3]:
# Motif prior; its row labels are matched against the expression row labels below.
motif = pd.read_csv("cancer_cervix_otter_motif.csv", index_col=0).sort_index()

# Keep only genes present in the motif prior AND in both expression tables.
# Filtering the motif against the case table alone would leave the control
# table with a different set of rows whenever case and control genes differ.
genes_in_all = (
    motif.index.isin(expression_case.index)
    & motif.index.isin(expression_control.index)
)
motif = motif.loc[genes_in_all, :]
expression_case = expression_case.loc[expression_case.index.isin(motif.index), :]
expression_control = expression_control.loc[expression_control.index.isin(motif.index), :]

# The tables are later passed on via .to_numpy(), which drops the labels, so
# the row labels (and their order) must agree exactly at this point.
assert expression_case.index.equals(motif.index), \
    "case expression rows do not match motif rows (duplicate or missing gene labels?)"
assert expression_control.index.equals(motif.index), \
    "control expression rows do not match motif rows (duplicate or missing gene labels?)"

# NOTE(review): ppi is not reordered here; its row/column order is assumed to
# match motif.columns — confirm against the input files.
ppi = pd.read_csv("cancer_cervix_otter_ppi.csv", index_col=0)

## Inferring GIRAFFE GRNs 

In [4]:
# Run GIRAFFE on the case expression table together with the motif and PPI
# tables; all three are handed over as plain NumPy arrays (labels are dropped).
R_case = giraffe.Giraffe(
    expression_case.to_numpy(),
    motif.to_numpy(),
    ppi.to_numpy(),
).get_regulation()

In [6]:
# Run GIRAFFE on the control expression table with the same motif and PPI
# tables; all three are handed over as plain NumPy arrays (labels are dropped).
R_control = giraffe.Giraffe(
    expression_control.to_numpy(),
    motif.to_numpy(),
    ppi.to_numpy(),
).get_regulation()

In [5]:
# Re-attach the motif table's row and column labels to the case network and
# write it out as a tab-separated file.
(
    pd.DataFrame(R_case, index=motif.index, columns=motif.columns)
    .to_csv("data/cesc/network_case.tsv", sep="\t")
)

In [7]:
# Re-attach the motif table's row and column labels to the control network and
# write it out as a tab-separated file.
(
    pd.DataFrame(R_control, index=motif.index, columns=motif.columns)
    .to_csv("data/cesc/network_control.tsv", sep="\t")
)

In [10]:
# Bare last expression: the notebook displays the control network array
# (NumPy abbreviates the printed values with "...").
R_control

array([[-1.41590017e-05, -5.42589878e-05, -2.13047952e-06, ...,
        -1.15869830e-06, -6.58308352e-07, -1.10720403e-05],
       [ 1.40295315e-05,  5.35938598e-05,  4.70353780e-06, ...,
         3.68506630e-06,  2.90170965e-06,  1.14952563e-05],
       [-4.69008728e-06, -2.08475158e-05, -1.51473614e-07, ...,
         2.37834783e-07,  2.68224227e-07, -4.41910242e-06],
       ...,
       [-1.68665019e-06, -1.52168077e-05,  2.63134297e-07, ...,
         2.95587341e-07,  6.61290699e-07,  1.19812995e-07],
       [-1.62465331e-05, -6.49121503e-05, -2.94241158e-06, ...,
        -1.96299834e-06, -1.10652149e-06, -1.08949371e-05],
       [-1.84157088e-05, -6.99226875e-05, -3.28591864e-06, ...,
        -2.11574365e-06, -1.37013478e-06, -1.32230189e-05]], dtype=float32)

# LIHC
## Loading the data

In [3]:
def gene_to_name(gene):
    """Return the first 15 characters of a gene identifier."""
    # NOTE(review): presumably this strips a version suffix from the IDs — confirm.
    return gene[:15]


# Case and control expression tables; the first CSV column becomes the row index.
expression_case = pd.read_csv("LIHC_case.csv", index_col=0)
expression_control = pd.read_csv("LIHC_nat.csv", index_col=0)

# Relabel the rows with the truncated identifiers.
expression_case.index = [gene_to_name(label) for label in expression_case.index]
expression_control.index = [gene_to_name(label) for label in expression_control.index]

# Order the rows by label so later cells see both tables in the same order.
expression_case = expression_case.sort_index()
expression_control = expression_control.sort_index()

In [5]:
# Motif prior; its row labels are matched against the expression row labels below.
motif = pd.read_csv("cancer_liver_otter_motif.csv", index_col=0).sort_index()

# Keep only genes present in the motif prior AND in both expression tables.
# Filtering the motif against the case table alone would leave the control
# table with a different set of rows whenever case and control genes differ.
genes_in_all = (
    motif.index.isin(expression_case.index)
    & motif.index.isin(expression_control.index)
)
motif = motif.loc[genes_in_all, :]
expression_case = expression_case.loc[expression_case.index.isin(motif.index), :]
expression_control = expression_control.loc[expression_control.index.isin(motif.index), :]

# The tables are later passed on via .to_numpy(), which drops the labels, so
# the row labels (and their order) must agree exactly at this point.
assert expression_case.index.equals(motif.index), \
    "case expression rows do not match motif rows (duplicate or missing gene labels?)"
assert expression_control.index.equals(motif.index), \
    "control expression rows do not match motif rows (duplicate or missing gene labels?)"

# NOTE(review): ppi is not reordered here; its row/column order is assumed to
# match motif.columns — confirm against the input files.
ppi = pd.read_csv("cancer_liver_otter_ppi.csv", index_col=0)

## Inferring GIRAFFE GRNs

In [6]:
# Run GIRAFFE on the case expression table together with the motif and PPI
# tables; all three are handed over as plain NumPy arrays (labels are dropped).
R_case = giraffe.Giraffe(
    expression_case.to_numpy(),
    motif.to_numpy(),
    ppi.to_numpy(),
).get_regulation()

In [8]:
# Run GIRAFFE on the control expression table with the same motif and PPI
# tables; all three are handed over as plain NumPy arrays (labels are dropped).
R_control = giraffe.Giraffe(
    expression_control.to_numpy(),
    motif.to_numpy(),
    ppi.to_numpy(),
).get_regulation()

In [7]:
# Re-attach the motif table's row and column labels to the case network and
# write it out as a tab-separated file.
(
    pd.DataFrame(R_case, index=motif.index, columns=motif.columns)
    .to_csv("data/lihc/network_case.tsv", sep="\t")
)

In [39]:
# Re-attach the motif table's row and column labels to the control network and
# write it out as a tab-separated file.
(
    pd.DataFrame(R_control, index=motif.index, columns=motif.columns)
    .to_csv("data/lihc/network_control.tsv", sep="\t")
)