In [1]:
# *** A simple demo to process the compiled dataset step by step
# this file is general to every fold of data in the cross validation
# after this file, the data for different folds is generated by using data_processing_updated_2.ipynb ***

In [None]:
import pandas as pd
import numpy as np
import pickle
import copy
import requests
# prepare cell line data

pd.options.display.max_columns = None
# the folder to store our compiled dataset
prefix = 'D:/B/PROJECT B2_2/dataset/Muthene_dataset/' 
midfix = 'common files/'

# downloaded from: https://depmap.org/portal/download/
# CCLE: Cancer Cell Line Encyclopedia
CCLE_expression = pd.read_csv(prefix + midfix + 'CCLE_expression.csv')
CCLE_expression = CCLE_expression.rename(columns={'Unnamed: 0': 'depmap_id'})

response = requests.get('https://api.drugcomb.org/cell_lines')
drugcomb_cellline_allinfo = response.json()
drugcomb_cellline_allinfo_dict = {}
for i in drugcomb_cellline_allinfo:
    drugcomb_cellline_allinfo_dict[i['name']] = i

# number of cell line contained in drugcomb
print(len(drugcomb_cellline_allinfo_dict))

2320


In [3]:
# the other original files from different sources

# drug related domain knowledge
in_file = open(prefix + midfix + 'drugcomb_alldruginfo_dict.pickle', 'rb')
drugcomb_alldruginfo_dict = pickle.load(in_file)
in_file.close()

# synergy score data
drugcomb = pd.read_csv(prefix + midfix + 'drugcomb_synergy_score.csv')

# side effect data
twosides = pd.read_csv(prefix + midfix + 'twosides_side_effect.csv')

# drug-target interaction
drug_target = pd.read_csv(prefix + midfix + 'drug_target_interaction.csv')

# target-target interaction
target_target = pd.read_csv(prefix + midfix + 'target_target_interaction.csv')

drugcomb = drugcomb.rename(columns={'drug_row': 'drug1', 'drug_col': 'drug2'})
twosides = twosides[['drug1', 'drug2', 'Polypharmacy Side Effect',
                     'Side Effect Name', 'drug1_lower', 'drug2_lower', 'unified_name']]

# check the number of problematic samples based on different synergy score criteria
# zip：None
drugcomb['synergy_zip'] = drugcomb['synergy_zip'].astype('float')
print(drugcomb['synergy_zip'].max(), drugcomb['synergy_zip'].min(),
      drugcomb['synergy_zip'].mean(), drugcomb['synergy_zip'].median())

# hsa: None
drugcomb['synergy_hsa'] = drugcomb['synergy_hsa'].astype('float')
print(drugcomb['synergy_hsa'].max(), drugcomb['synergy_hsa'].min(),
      drugcomb['synergy_hsa'].mean(), drugcomb['synergy_hsa'].median())

# bliss: None
drugcomb['synergy_bliss'] = drugcomb['synergy_bliss'].astype('float')
print(drugcomb['synergy_bliss'].max(), drugcomb['synergy_bliss'].min(
), drugcomb['synergy_bliss'].mean(), drugcomb['synergy_bliss'].median())

# remove the 4 problematic data based on loewe
temp = drugcomb[drugcomb['synergy_loewe'] != '\\N']
temp_drugset = set.union(set(temp['drug1']), set(temp['drug2']))

drugcomb = drugcomb.drop(
    index=(drugcomb.loc[(drugcomb['synergy_loewe'] == '\\N')].index))
drugcomb['synergy_loewe'] = drugcomb['synergy_loewe'].astype('float')

print(drugcomb['synergy_loewe'].max(), drugcomb['synergy_loewe'].min(
), drugcomb['synergy_loewe'].mean(), drugcomb['synergy_loewe'].median())
# the loewe synergy score is lower than others

print('total drug number:', len(temp_drugset))

128.433573916656 -86.1689137467893 -1.1658416418422066 -0.46167060284044703
87.93870313788229 -90.13426667491999 -1.228943063125428 -1.0785883625221
207.19724904478198 -95.0502059205476 -1.3513368723624046 -0.543827700211486
82.9982087530354 -101.379902323728 -8.991664263881768 -4.3698299642188
total drug number: 213


In [4]:
drugcomb.head()

Unnamed: 0,block_id,drug1,drug2,cell_line_name,study_name,tissue_name,conc_row_unit,conc_col_unit,ic50_row,ic50_col,ri_row,ri_col,css_row,css_col,css_ri,S_sum,S_mean,S_max,synergy_zip,synergy_loewe,synergy_hsa,synergy_bliss,drug_row_clinical_phase,drug_col_clinical_phase,drug_row_target_name,drug_col_target_name,drug1_lower,drug2_lower,unified_name
0,462981,prochlorperazine,tamoxifen,TC-32,NCATS_DIPG,bone,uM,uM,0.011618,20.0,-11.816,-7.484,48.08,2.795,25.4375,44.7375,35.0875,32.9215,12.411371,1.358891,0.880952,14.291624,4,4,Prelamin-A/C; Cytochrome P450 2D6; Cytochrome ...,Anti-estrogen binding site (AEBS); Estrogen re...,prochlorperazine,tamoxifen,prochlorperazine_tamoxifen
1,463078,prochlorperazine,mefloquine,TC-32,NCATS_DIPG,bone,uM,uM,0.003762,3.707453,0.815,2.41,2.855,-0.602,1.1265,-2.0985,-0.486,-1.2835,-1.954036,-1.954405,-4.311522,-1.398677,4,4,Prelamin-A/C; Cytochrome P450 2D6; Cytochrome ...,\N,prochlorperazine,mefloquine,prochlorperazine_mefloquine
2,463260,prochlorperazine,Gefitinib,TC-32,NCATS_DIPG,bone,uM,uM,0.1,20.0,-4.949,3.439,20.059,3.567,11.813,13.323,12.568,8.374,0.085606,-1.472113,-2.211179,4.015759,4,4,Prelamin-A/C; Cytochrome P450 2D6; Cytochrome ...,Epidermal growth factor receptor erbB1; Recept...,prochlorperazine,gefitinib,prochlorperazine_gefitinib
3,463534,Dasatinib,prochlorperazine,TC-32,NCATS_DIPG,bone,uM,uM,0.023071,0.046578,13.931,-7.661,10.154,3.041,6.5975,0.3275,3.4625,-7.3335,2.964407,-3.712887,-2.208605,4.015463,4,4,Tyrosine-protein kinase LCK; Tyrosine-protein ...,Prelamin-A/C; Cytochrome P450 2D6; Cytochrome ...,dasatinib,prochlorperazine,dasatinib_prochlorperazine
4,132914,Imatinib,bleomycin,SF-268,ALMANAC,brain,uM,uM,1.997124,0.21727,-1.206,14.845,16.977,16.503,16.74,3.101,9.9205,1.895,-5.967873,-10.254135,1.665557,3.507983,4,4,Tyrosine-protein kinase ABL; Platelet-derived ...,\N,imatinib,bleomycin,imatinib_bleomycin


In [5]:
twosides.head()

Unnamed: 0,drug1,drug2,Polypharmacy Side Effect,Side Effect Name,drug1_lower,drug2_lower,unified_name
0,imipramine,methotrexate,C0043096,loss of weight,imipramine,methotrexate,methotrexate_imipramine
1,imipramine,methotrexate,C0032285,neumonia,imipramine,methotrexate,methotrexate_imipramine
2,imipramine,methotrexate,C0009676,confusion,imipramine,methotrexate,methotrexate_imipramine
3,imipramine,methotrexate,C0398353,Hypoventilation,imipramine,methotrexate,methotrexate_imipramine
4,imipramine,methotrexate,C0000737,abdominal pain,imipramine,methotrexate,methotrexate_imipramine


In [6]:
# give an order to involved drugs (absolute ids)
drugset = list(set.union(set(drugcomb['drug1_lower']), set(drugcomb['drug2_lower'])))
drugset.sort()
drug2absid_dict = {drug: i for i, drug in enumerate(drugset)} # based on drugcomb

# give an order to involved targets (absolute ids)
drug_target = drug_target.rename(columns={'target': 'gene symbol'})
drug_target = drug_target[['drug', 'drug_lower', 'gene symbol']]
temp = set(drug_target['gene symbol'])

target_target = target_target[['gene1 symbol', 'gene2 symbol']]
target_target.iloc[103608]['gene1 symbol'] = 'WTIP'  # modify outdated sample
targetset = list(set.union(set(target_target['gene1 symbol']), set(target_target['gene2 symbol'])))
targetset.sort()

# unify the all the target name to lowercase
temp_2 = set([target.lower() for target in temp])
targetset_2 = set([target.lower() for target in targetset])
print(temp-set(targetset))

print(temp_2-targetset_2)

print(len(temp), len(temp_2), len(targetset), len(targetset_2))

temp_3 = pd.DataFrame([target.lower() for target in targetset])
print(temp_3.iloc[temp_3.duplicated()[temp_3.duplicated() == True].index])

target_target[(target_target['gene1 symbol'].str.lower() == 'wtip') | (
    target_target['gene2 symbol'].str.lower() == 'wtip')]

# incorporate targets in target-target interaction into the target set
targetset = list(set.union(set(targetset), temp))
targetset.sort()
target2absid_dict = {target: i for i, target in enumerate(targetset)} # based on target_target and drug_target

print(len(set(drugcomb['unified_name'])), len(set(twosides['unified_name'])))

# make the number of drug pairs in drugcomb and twosides is the same
twosides_pairset = set(twosides['unified_name'])
drugcomb_pairset = set(drugcomb['unified_name'])
inter_pairset = list(set.intersection(twosides_pairset, drugcomb_pairset))
# fix the order of drug pairs
inter_pairset.sort()

drugcomb_reduced = []  # reduce the extra drug pairs in drugcomb
for row in np.array(drugcomb):
    if(row[-1] in inter_pairset):
        drugcomb_reduced.append(row)

drugcomb = pd.DataFrame(drugcomb_reduced, columns=drugcomb.columns)
print(len(set(drugcomb['unified_name'])), len(set(twosides['unified_name'])))

# currently both datasets have 2764 drug pairs and this number will be further shortened due to the limited acquisition of cell line information

{'CA13', 'ALPPL2', 'ACCN1', 'ABP1', 'ACCN2', 'GPR19'}
{'ca13', 'abp1', 'gpr19', 'accn1', 'alppl2', 'accn2'}
825 825 12796 12796
Empty DataFrame
Columns: [0]
Index: []
2837 2764
2764 2764


In [7]:
# start to determine the number of cell line according to existing cell line information
# 'ACH-'' is the id of depmap, which is a cell line dataset

In [8]:
drugcomb_cellline_allinfo_dict['DU-145']

{'name': 'DU-145',
 'synonyms': 'DU-145; DU-145; Du-145; DU 145; DU_145',
 'cellosaurus_accession': 'CVCL_0105',
 'disease_id': 'C4863',
 'id': 16,
 'tissue_id': 9,
 'depmap_id': 'ACH-000979',
 'cell_model_passport_id': 'SIDM00120',
 'cosmic_id': 905935,
 'ccle_name': 'DU145_PROSTATE',
 'expression_data': 'CellModelPassport'}

In [9]:
cellline_set = list(set(drugcomb['cell_line_name']))
cellline_set.sort()
cellline2absid_dict = {cellline: i for i, cellline in enumerate(cellline_set)}  # complete cell line set, based on drugcomb

counter = 0
# contain basic information of all involved cell lines
drugcomb_cellline_info_table = []
vacant_cellline = []  # cell lines that are not in drugcomb dataset
# cell lines that are in drugcomb dataset originated from depmap
existing_cellline_depmap = []
# cell lines that are in drugcomb dataset originated from CMP
existing_cellline_CMP = []
existing_cellline = []
for cellline in cellline_set:
    if drugcomb_cellline_allinfo_dict[cellline]['expression_data'] == 'NA':
        vacant_cellline.append(cellline)
        counter += 1
    elif drugcomb_cellline_allinfo_dict[cellline]['expression_data'] == 'BROAD_DepMap':
        existing_cellline_depmap.append(cellline)
    elif drugcomb_cellline_allinfo_dict[cellline]['expression_data'] == 'CellModelPassport':
        existing_cellline_CMP.append(cellline)
    else:
        existing_cellline.append(cellline)  # other cases

    drugcomb_cellline_info_table.append(
        drugcomb_cellline_allinfo_dict[cellline])

print(vacant_cellline)  # KBM-7 cannot be found
print('vacant cellline number:', counter)

drugcomb_cellline_info_table = pd.DataFrame(drugcomb_cellline_info_table)

# test for depmap based cell line data, all of them can be the found in CCLE_expression file
expression_in_BROAD_DepMap = drugcomb_cellline_info_table[
    drugcomb_cellline_info_table['expression_data'] == 'BROAD_DepMap']

temp1 = set(CCLE_expression['depmap_id'])
temp2 = set(expression_in_BROAD_DepMap['depmap_id'])
print(temp2-temp1)

drugcomb_cellline_info_table.head() 
# include all information retrieved from drugcomb 
# but not all of cell lines can find expression data neither in CMP nor depmap

['3D7', '501-mel', 'CBRC002', 'CBRC007', 'CBRC008', 'CBRC013', 'CBRC014', 'CBRC016', 'CBRC017', 'CBRC026', 'CBRC029', 'CBRC034', 'CBRC042', 'CBRC043', 'CBRC050', 'CBRC056', 'CBRC058', 'COLO320DM', 'DD2', 'DIPG25', 'EFM192B', 'HB3', 'HL-60(TB)', 'KBM-7', 'LNCAP', 'MCF7F10016', 'MCF7F1003', 'MCF7T52', 'MDA-MB-435', 'MDAMB134V1', 'NCI-H322M', 'NCI/ADR-RES', 'SNB-19', 'TC-32', 'UWB1289+BRCA1', 'WM1716', 'WM1745', 'WM3526', 'WM3619', 'WT2-iPS']
vacant cellline number: 40
set()


Unnamed: 0,name,synonyms,cellosaurus_accession,disease_id,id,tissue_id,depmap_id,cell_model_passport_id,cosmic_id,ccle_name,expression_data
0,3D7,3D7,,C34797,2288,3,,,,,
1,451Lu,451Lu; 451LU; 451-LU; WM 451-Lu; WM-451Lu; WM-...,CVCL_6357,C3510,129,10,ACH-001002,SIDM01240,1287706.0,451LU_SKIN,CellModelPassport
2,501-mel,501-mel; 501-MEL; 501 mel; 501 Mel; 501Mel; 50...,CVCL_4633,C3224,2258,10,,,,,
3,786-0,786-0; 786O; 786-0; 786.O; 786-O RCC; RCC 786-...,CVCL_1051,C9385,1,5,ACH-000649,SIDM00125,905947.0,786O_KIDNEY,BROAD_DepMap
4,A101D,A101D; A-101D,CVCL_1057,C3224,150,10,ACH-000008,SIDM00801,910921.0,A101D_SKIN,BROAD_DepMap


In [11]:
# existing_cellline_depmap: cell line that can find expression data in CCLE dataset
# consider CCLE dataset at first becuase it has more data
drugcomb_depmap = drugcomb[drugcomb['cell_line_name'].isin(existing_cellline_depmap)]

# remaining cell lines
print('remaining cell lines after using CCLE:', len(set(drugcomb_depmap['cell_line_name'])))
# remaining drugs
print('remaining drugs after using CCLE:', len(set(drugcomb_depmap['drug1_lower']).union(set(drugcomb_depmap['drug2_lower']))))

# store the number of drug-drug pairs that current each cell line corresponds to
cellline_num_list = []
for cellline in set(drugcomb_depmap['cell_line_name']):
    num = drugcomb_depmap[drugcomb_depmap['cell_line_name'] == cellline].shape[0]
    cellline_num_list.append([cellline, num])

cellline_num_list = pd.DataFrame(cellline_num_list)
cellline_num_list = cellline_num_list.sort_values([1], ascending=(False)).reset_index(drop=True)

# [0]: total drug-drug-cell line samples according to remaining cell lines
# [1]: total drug-drug-cell line samples according to further selected cell lines of remaining cell lines
# every top-40 cell line corresponding to at least 200 drug-drug pairs, top-60: 37
selected_cellline_num = 60
print('before further selecting cell lines:', drugcomb_depmap.shape[0], 'after:', cellline_num_list[:selected_cellline_num][1].sum())

# based on selected_cellline_num
cellline_set_reduced = list(cellline_num_list[:selected_cellline_num][0])
cellline_set_reduced.sort()
cellline2relid_dict = {cellline: i for i, cellline in enumerate(cellline_set_reduced)}

# further reduce the cell line number in depmap based dataset
drugcomb_depmap_reduced = drugcomb_depmap[drugcomb_depmap['cell_line_name'].isin(cellline2relid_dict.keys())].reset_index(drop=True)
drugset_reduced = list(set(drugcomb_depmap_reduced['drug1_lower']).union(set(drugcomb_depmap_reduced['drug2_lower'])))
drugset_reduced.sort()
drug2relid_dict = {drug: i for i, drug in enumerate(drugset_reduced)}  # based on selected_cellline_num

# current drug, target, cellline set have the complete number of samples
print('absolute entity number:', len(drug2absid_dict), len(target2absid_dict), len(cellline2absid_dict))
# currently only determine the relative drug and cell line ids (not including target ids)
print('relative entity number:', len(drug2relid_dict), len(cellline2relid_dict))

print('the least number of drugs corresponding to one cell line:', cellline_num_list.iloc[selected_cellline_num-1][1])

# under selected CCLE cell lines:
# interestingly, top40 cell lines only include 48 drugs, top40-60 cell lines include at least 37 drugs
# which means that, drugs corresponding to different cell lines could be totally different
# adding top40-top60 could increase the difficulty of model prediction

# *** the following experiments are based on drugcomb_cellline_depmap_reduced dataset and drug2relid_dict ***

remaining cell lines after using CCLE: 93
remaining drugs after using CCLE: 106
before further selecting cell lines: 11907 after: 11166
absolute entity number: 213 12802 147
relative entity number: 106 60
the least number of drugs corresponding to one cell line: 37


In [13]:
print(drugcomb_depmap_reduced.shape) # samples after selecting fixed number of cell lines
drugcomb_depmap_reduced.head()

(11166, 29)


Unnamed: 0,block_id,drug1,drug2,cell_line_name,study_name,tissue_name,conc_row_unit,conc_col_unit,ic50_row,ic50_col,ri_row,ri_col,css_row,css_col,css_ri,S_sum,S_mean,S_max,synergy_zip,synergy_loewe,synergy_hsa,synergy_bliss,drug_row_clinical_phase,drug_col_clinical_phase,drug_row_target_name,drug_col_target_name,drug1_lower,drug2_lower,unified_name
0,132914,Imatinib,bleomycin,SF-268,ALMANAC,brain,uM,uM,1.997124,0.21727,-1.206,14.845,16.977,16.503,16.74,3.101,9.9205,1.895,-5.967873,-10.254135,1.665557,3.507983,4,4,Tyrosine-protein kinase ABL; Platelet-derived ...,\N,imatinib,bleomycin,imatinib_bleomycin
1,135848,paclitaxel,allopurinol,SF-268,ALMANAC,brain,uM,uM,0.026675,4.675736,29.318,0.146,17.788,4.071,10.9295,-18.5345,-3.8025,-18.3885,-5.326121,-22.472343,-9.719076,-9.262139,4,4,Tubulin; Integrin alpha-V/beta-3; Prelamin-A/C...,Xanthine dehydrogenase; Ras-related protein Ra...,paclitaxel,allopurinol,paclitaxel_allopurinol
2,135980,Fulvestrant,docetaxel,SF-268,ALMANAC,brain,uM,uM,4.0,0.030177,-14.037,4.741,3.049,17.096,10.0725,19.3685,14.7205,5.3315,2.377254,-6.237605,-4.144442,9.601456,4,4,Estrogen receptor alpha; Estrogen receptor bet...,\N,fulvestrant,docetaxel,fulvestrant_docetaxel
3,137713,letrozole,cyclophosphamide,SF-268,ALMANAC,brain,uM,uM,0.044412,33.509424,-1.077,-0.379,2.678,1.556,2.117,3.573,2.845,2.496,0.316095,1.835797,2.4167,4.009233,4,4,Cytochrome P450 19A1,\N,letrozole,cyclophosphamide,letrozole_cyclophosphamide
4,138370,Imatinib,hydroxyurea,SF-268,ALMANAC,brain,uM,uM,0.542648,1.398216,1.269,0.129,-1.341,-0.498,-0.9195,-2.3175,-1.6185,-2.1885,0.036013,-0.616815,-3.276514,-1.881524,4,4,Tyrosine-protein kinase ABL; Platelet-derived ...,Ribonucleoside-diphosphate reductase RR1,imatinib,hydroxyurea,imatinib_hydroxyurea


In [14]:
# retrieve the expression data for selected top cell lines like Transynergy method

# 1. determine the number of targets interact with drugs in drugset
drug_target_depmap_reduced = drug_target[drug_target['drug_lower'].isin(list(drug2relid_dict.keys()))].reset_index(drop=True)

print('len(drug2relid_dict.keys():', len(drug2relid_dict.keys()))
# the genes on which its expression data is calculated for certain cell line
gene4cellline = set(drug_target_depmap_reduced['gene symbol'])

CCLE_gene_name = CCLE_expression.columns
CCLE_gene = set([gene[:gene.find('(')-1] for gene in CCLE_gene_name[1:]])
# CCLE column name to gene name
CCLE_gene_mapping = {gene[:gene.find('(')-1]: gene for gene in CCLE_gene_name[1:]}

for i in gene4cellline - CCLE_gene:
    gene4cellline.remove(i)
# doublecheck, should be an empty set, ensure all expression data based on genes can be found in CCLE
print(gene4cellline - CCLE_gene)

print(CCLE_expression.iloc[0])

# obtain expression data on selected genes
CCLE_expression_depmap_reduced = pd.DataFrame(CCLE_expression, columns=[
                                              'depmap_id']+[CCLE_gene_mapping[genename] for genename in gene4cellline])

cellline_name2depmap = {}  # based on cellline2relid_dict
for name in cellline2relid_dict.keys():
    # name: cell line name
    value = np.array(drugcomb_cellline_info_table[drugcomb_cellline_info_table['name'] == name]['depmap_id'])[0]
    # value: depmap id
    cellline_name2depmap[name] = value

temp_list1 = []
temp_list2 = []
temp_set = set()
for name in cellline2relid_dict:  # based on the order of cellline2relid_dict
    temp = CCLE_expression_depmap_reduced[CCLE_expression_depmap_reduced['depmap_id'] == cellline_name2depmap[name]]
    temp_list1.append(temp)  # expression data for one cell line
    temp_list2.append(name)  # name for one cell line
    if temp.shape[0] == 0:  # data that cannot be found
        temp_set.add(cellline_name2depmap[name])
        print(cellline_name2depmap[name])
        print(name)

assert len(temp_list1) == len(temp_list2), 'len(temp_list1) != len(temp_list2)'
# overwrite previous CCLE_expression_depmap_reduced
CCLE_expression_depmap_reduced = pd.concat(temp_list1)
CCLE_expression_depmap_reduced.insert(0, 'cellline_name', temp_list2, allow_duplicates=False)

print('CCLE_expression_depmap_reduced.shape:', CCLE_expression_depmap_reduced.shape)
CCLE_expression_depmap_reduced.head()

len(drug2relid_dict.keys(): 106
set()
depmap_id                  ACH-001113
TSPAN6 (7105)                  4.9905
TNMD (64102)                        0
DPM1 (8813)                    7.2737
SCYL3 (57147)                 2.76553
                              ...    
POLR2J3 (548644)              5.78188
H2BE1 (114483833)                   0
AL445238.1 (647264)                 0
GET1-SH3BGR (106865373)      0.799087
AC113348.1 (102724657)              0
Name: 0, Length: 19178, dtype: object
CCLE_expression_depmap_reduced.shape: (60, 679)


Unnamed: 0,cellline_name,depmap_id,CHRNA4 (1137),CHRNA2 (1135),FABP7 (2173),TGFBR1 (7046),SCN10A (6336),MMP14 (4323),PSMD1 (5707),CA12 (771),TBXAS1 (6916),PTGER4 (5734),CHRNA6 (8973),HIPK3 (10114),SLC47A1 (55244),DCK (1633),KIT (3815),DHRS1 (115817),DHRS7C (201140),SCN8A (6334),OGG1 (4968),HPGD (3248),CHRNE (1145),ZAP70 (7535),GPR27 (2850),FLT1 (2321),KCNA1 (3736),DHODH (1723),KCNQ1 (3784),GNRHR (2798),FGR (2268),PDE11A (50940),GPR12 (2835),SCN11A (11280),TSSK2 (23617),CA2 (760),MAP3K11 (4296),HTR6 (3362),GPR84 (53831),GPR151 (134391),RDH10 (157506),RDH8 (50700),TAAR6 (319100),CHRNA1 (1134),SSTR2 (6752),AR (367),MAP4K4 (9448),GAK (2580),FDPS (2224),SCAP (22937),FABP4 (2167),FLT3 (2322),NOS2 (4843),SYK (6850),OPRM1 (4988),GPR142 (350383),SBK1 (388228),HRH2 (3274),UTS2R (2837),LYN (4067),PBK (55872),GPR6 (2830),EPHA3 (2042),PLD1 (5337),FGFR4 (2264),LTB4R (1241),AURKA (6790),RBP5 (83758),CACNA1G (8913),JAK3 (3718),PASK (23178),CYP2C9 (1559),SLC6A20 (54716),ERBB2 (2064),NQO2 (4835),NMUR2 (56923),THRB (7068),GPR85 (54329),SLC22A2 (6582),MC4R (4160),CYP2B6 (1555),RIPK1 (8737),CA13 (377677),ANXA1 (301),MAP3K21 (84451),NR3C2 (4306),NPFFR2 (10886),HMGCR (3156),MC2R (4158),MAP3K9 (4293),GPR61 (83873),RDH12 (145226),TAAR1 (134864),NR3C1 (2908),HSD11B1 (3290),LPAR3 (23566),STYK1 (55359),PDE10A (10846),EPX (8288),SIK3 (23387),GPR37L1 (9283),HDAC2 (3066),AOX1 (316),PDE1A (5136),NR2C2 (7182),IRAK4 (51135),GPR21 (2844),HTR3C (170572),MLNR (2862),GALR2 (8811),POLA2 (23649),TLR7 (51284),RGR (5995),MKNK1 (8569),FGFRL1 (53834),CDH5 (1003),NMUR1 (10316),CA5B (11238),NR2E1 (7101),CA3 (761),CCNC (892),LIMK2 (3985),CHRFAM7A (89832),FABP6 (2172),TRIB3 (57761),NTRK2 (4915),CHRNG (1146),CA7 (766),NR1I2 (8856),HTR2C (3358),FYN (2534),CA4 (762),EPHB1 (2047),TLR8 (51311),CDK19 (23097),ADRA1B (147),MELK (9833),FABP3 (2170),KCNMA1 (3778),SLC5A7 (60482),HSD17B14 (51171),TIE1 (7075),TUBB2A (7280),NIM1K (167359),SLC6A7 (6534),TUBD1 (51174),PDPK1 (5170),PHKG1 (5260),LPAR1 (1902),PDE4C (5143),MAP2K5 (5607),DHRSX (207063),HIPK4 (147746),NR1H2 (7376),TUBA1C (84790),RRM1 (6240),PIN1 (5300),CA9 (768),MAPK15 (225689),CCR1 (1230),AGTR2 (186),FABP1 (2168),DECR1 (1666),RIPK3 (11035),ANPEP (290),NPY1R (4886),PSMB5 (5693),GPR52 (9293),GPR148 (344561),ATIC (471),FGFR3 (2261),POLA1 (5422),TBXA2R (6915),CA6 (765),SERPINA7 (6906),ADORA1 (134),MUSK (4593),EPHB4 (2050),GC (2638),HTR2B (3357),MAPK11 (5600),SLC6A3 (6531),RARG (5916),RXFP3 (51289),DECR2 (26063),CYP3A4 (1576),HTR3E (285242),ADRA1A (148),CSNK1E (1454),GPR19 (2842),MATK (4145),NTSR2 (23620),SLC6A4 (6532),MAP3K20 (51776),STK10 (6793),SIK2 (23235),RARA (5914),NPC1L1 (29881),TRIB2 (28951),PDE2A (5138),KCNH2 (3757),SSTR3 (6753),OPRD1 (4985),FABP2 (2169),DRD1 (1812),FABP9 (646480),MCHR1 (2847),LRRK2 (120892),RDH14 (57665),ACVR2A (92),ADRB2 (154),SLC12A3 (6559),PLK4 (10733),CCR5 (1234),TNF (7124),BTK (695),APLNR (187),DRD5 (1816),HTR1A (3350),ADRA1D (146),PTGER2 (5732),EPHA2 (1969),CHRNB1 (1140),CMPK1 (51727),CCR2 (729230),IDO1 (3620),EPHA5 (2044),EGFR (1956),GPR83 (10888),DHRS4L2 (317749),CTNNB1 (1499),NR6A1 (2649),DHRS2 (10202),CHRND (1144),IRAK1 (3654),AURKB (9212),RDH11 (51109),TRHR (7201),PDE5A (8654),EPHA8 (2046),GPR37 (2861),UPP2 (151531),MERTK (10461),PGR (5241),DHRS3 (9249),NEK11 (79858),PXDNL (137902),CRABP1 (1381),BRS3 (680),PTK6 (5753),RBP7 (116362),MMP8 (4317),NFKB1 (4790),TUBB2B (347733),TXK (7294),ESRRB (2103),PDE4B (5142),HPRT1 (3251),BRAF (673),EPHA4 (2043),PIM1 (5292),LPO (4025),TUBA3C (7278),STAT5B (6777),HUNK (30811),SLCO2B1 (11309),HCK (3055),PMP2 (5375),SRMS (6725),GPR3 (2827),SLC6A16 (28968),THRA (7067),CSK (1445),TESK1 (7016),PDSS1 (23590),TSSK6 (83983),STK35 (140901),FGFR2 (2263),PTGS1 (5742),PDSS2 (57107),PKDCC (91461),PDGFRL (5157),RRH (10692),ABL2 (27),QRFPR (84109),SCN2A (6326),TPO (7173),MC3R (4159),CBR1 (873),TYMS (7298),TEC (7006),NPY4R (5540),CSNK1A1 (1452),BDH2 (56898),AGTR1 (185),CYP2C19 (1557),TNNI3K (51086),GPR22 (2845),SLC6A19 (340024),PDE6B (5158),ADORA3 (140),CXCR4 (7852),MYT1 (4661),TUBA1B (10376),PTGR1 (22949),TEK (7010),NPY5R (4889),TNK2 (10188),BMX (660),STK11 (6794),ALOX5 (240),NPPB (4879),CHRM2 (1129),PHOSPHO1 (162466),CCKAR (886),PTPRZ1 (5803),NR0B1 (190),HTR7 (3363),CDKL3 (51265),HIF1A (3091),IRAK2 (3656),IGF1R (3480),TUBB4B (10383),ERBB4 (2066),MAP3K3 (4215),GPR63 (81491),CACNA1H (8912),PXDN (7837),AURKC (6795),HRH1 (3269),OPN1MW (2652),ROR1 (4919),NPC1 (4864),GSK3B (2932),SV2A (9900),RBP2 (5948),SIK1 (150094),RPS6KB1 (6198),TF (7018),DRD2 (1813),STMN4 (81551),HCRTR2 (3062),HTR1F (3355),WEE2 (494551),SLC6A11 (6538),SLC6A13 (6540),SLC12A1 (6557),NPY2R (4887),SLC6A9 (6536),EPHA10 (284656),VCAM1 (7412),GPR176 (11245),EPHB3 (2049),CDKL2 (8999),GPR135 (64582),ITGB2 (3689),FABP5 (2171),ADRA2C (152),DRD4 (1815),SLC22A7 (10864),PRLHR (2834),TOP2B (7155),MLKL (197259),BLM (641),PPARD (5467),TAAR5 (9038),CYP51A1 (1595),PTGFR (5737),ESR1 (2099),MAP3K19 (80122),MAP4K3 (8491),PIM2 (11040),CHRM3 (1131),GPR88 (54112),SRC (6714),TAAR8 (83551),HTR1B (3351),AVPR2 (554),TRPM2 (7226),MAOB (4129),CNR2 (1269),GPR39 (2863),NTRK1 (4914),NR1H3 (10062),PDE7B (27115),EPHA6 (285220),AXL (558),CALM1 (801),CHRM1 (1128),FABP12 (646486),HSD17B1 (3292),TUBB6 (84617),MELTF (4241),SLC6A12 (6539),GART (2618),HTR5A (3361),BMPR1B (658),KCNN4 (3783),PTPRG (5793),STK36 (27148),XDH (7498),RUSC1 (23623),IRAK3 (11213),OPRK1 (4986),NALCN (259232),KCNE1 (3753),YES1 (7525),ADORA2B (136),CLK4 (57396),TRPA1 (8989),CA8 (767),CBR4 (84869),ABCC2 (1244),NR1I3 (9970),OPN1SW (611),C2orf81 (388963),MCHR2 (84539),SLCO1B3 (28234),OPRL1 (4987),VDR (7421),CDK8 (1024),JUP (3728),PTGER3 (5733),NLK (51701),EBP (10682),GGPS1 (9453),ACVRL1 (94),SSTR5 (6755),NTSR1 (4923),PRTFDC1 (56952),ITGAL (3683),EPHB6 (2051),RIPK4 (54101),LPAR2 (9170),CRABP2 (1382),HSD17B13 (345275),TRIB1 (10221),CLK1 (1195),TUBB4A (10382),UPRT (139596),CHRNA3 (1136),LCK (3932),PPARG (5468),CYP2D6 (1565),ARAF (369),NR0B2 (8431),PSMB1 (5689),TNNC2 (7125),CACNA1S (779),PTGIR (5739),TUBB3 (10381),MPO (4353),BDKRB1 (623),TUBA3E (112714),GSTP1 (2950),BCL2 (596),ERN2 (10595),JAK2 (3717),ERBB3 (2065),RAF1 (5894),CHRNB4 (1143),TYRO3 (7301),EPHB2 (2048),SLC6A8 (6535),DDR2 (4921),HTR1D (3352),CACNB2 (783),TNFSF11 (8600),GSK3A (2931),TSSK4 (283629),MINK1 (50488),TUBG2 (27175),NR2F6 (2063),MC1R (4157),SLC6A2 (6530),MET (4233),MAP3K4 (4216),SLC6A1 (6529),TNK1 (8711),TESK2 (10420),FLT4 (2324),CDK7 (1022),FDXR (2232),DHRS7B (25979),INSRR (3645),CHRM4 (1132),DRD3 (1814),RXFP4 (339403),ACKR3 (57007),PDGFRB (5159),CHRNA9 (55584),DDR1 (780),PGD (5226),MC5R (4161),PDGFRA (5156),UPP1 (7378),HSD17B11 (51170),CIT (11113),RIPK2 (8767),TOP1 (7150),LMNA (4000),TOP2A (7153),ABCC8 (6833),MAPK14 (1432),FFAR4 (338557),PKMYT1 (9088),PTGER1 (5731),GPR150 (285601),CYP11B2 (1585),SLC47A2 (146802),TUBA4A (7277),GPR139 (124274),CHRM5 (1133),SLC6A18 (348932),GJA1 (2697),PSMB2 (5690),ADRB3 (155),RARB (5915),PLD2 (5338),MKNK2 (2872),ELN (2006),CCR3 (1232),RECQL (5965),OPN3 (23596),HTR3A (3359),TUBA8 (51807),INSR (3643),CA5A (763),DHFR2 (200895),HIPK2 (28996),CACNA1A (773),FRK (2444),GRPR (2925),CHRNB3 (1142),SCN5A (6331),GPR119 (139760),TYK2 (7297),HRH3 (11255),GPR26 (2849),CYP1A2 (1544),ESR2 (2100),SLC6A6 (6533),AVPR1A (552),TUBE1 (51175),SCN3A (6328),MAP3K2 (10746),HSDL2 (84263),HTR2A (3356),CHRNA7 (1139),ACE (1636),GPR62 (118442),OPN5 (221391),NPFFR1 (64106),CACNA1D (776),TUBB1 (81027),RHO (6010),VEGFA (7422),COQ8A (56997),RBP1 (5947),PECR (55825),GPR65 (8477),SSTR4 (6754),ESRRA (2101),MMP20 (9313),NPBWR2 (2832),ACVR1B (91),RXRB (6257),PDE6A (5145),GHSR (2693),MOS (4342),SLCO1B1 (10599),CCR9 (10803),ADORA2A (135),ITK (3702),RET (5979),GPR45 (11250),CACNA1C (775),IDO2 (169355),EPHA1 (2041),TSSK1B (83942),TAAR2 (9287),MAP3K10 (4294),PIM3 (415116),HRH4 (59340),TUBB8 (347688),ACVR2B (93),PDE6C (5146),KDR (3791),ACVR1 (90),SRD5A1 (6715),RXRA (6256),CCR4 (1233),CXCR6 (10663),GPR78 (27201),SLC6A17 (388662),ACKR2 (1238),PTGDR (5729),OXTR (5021),NMBR (4829),NR2F1 (7025),GPR101 (83550),CATSPER1 (117144),DHRS12 (79758),SDR16C5 (195814),DHFR (1719),TUBG1 (7283),TAOK3 (51347),ALK (238),CACNA1F (778),CHRNA5 (1138),SSTR1 (6751),CTDSP1 (58190),GALR1 (2587),ADRB1 (153),ERN1 (2081),CCKBR (887),TUBB (203068),CA10 (56934),DHRS13 (147015),HCRTR1 (3061),CA1 (759),LTK (4058),NTRK3 (4916),KISS1R (84634),OPN4 (94233),NR1H4 (9971),PRKAB1 (5564),MAP2K1 (5604),PTGS2 (5743),ADRA2A (150),CYP19A1 (1588),TACR1 (6869),SRD5A2 (6716),MMP2 (4313),TSSK3 (81629),PIP4K2C (79837),GPR173 (54328),CDC42BPB (9578),CYP17A1 (1586),MAP4K5 (11183),PROKR1 (10887),ABL1 (25),SLC6A14 (11254),CA11 (770),ADRA2B (151),PSMD2 (5708),ENPP1 (5167),CBR3 (874),PDE7A (5150),KCNA3 (3738),ALOX15 (246),HTR3B (9177),HTR3D (200909),MAPK12 (6300),PPARA (5465),PROKR2 (128674),TUBA3D (113457),HTR1E (3354),MAPK8 (5599),CACNA1B (774),SLC6A5 (9152),LTB4R2 (56413),CHRNB2 (1141),CHRNA10 (57053),TAOK1 (57551),GALR3 (8484),JAK1 (3716),TUBA1A (7846),ABCB1 (5243),UCKL1 (54963),RXRG (6258),SLC6A15 (55117),NR2C1 (7181),TNNC1 (7134),BLK (640),NR2F2 (7026),ESRRG (2104),CSF1R (1436),OPN1LW (5956)
694,786-0,ACH-000649,0.0,0.014355,0.0,4.330558,0.0,7.324901,7.238787,6.603923,3.975447,2.809414,0.0,3.084064,0.028569,5.013016,0.056584,3.69488,0.0,0.042644,3.841973,1.02148,0.0,0.084064,0.042644,0.014355,0.0,3.488001,0.0,0.124328,0.0,0.941106,0.0,0.0,0.263034,5.264912,4.819668,0.0,0.0,0.0,2.594549,0.0,0.0,0.0,0.084064,0.028569,6.596488,6.001127,7.904183,4.684819,0.0,0.0,0.0,3.499527,0.0,0.0,0.084064,0.0,0.0,5.69655,5.807097,0.0,0.014355,3.904966,3.975447,1.238787,7.538538,0.782409,0.0,0.31034,3.374344,0.0,0.0,3.705978,5.824004,0.0,2.046142,1.521051,0.286881,0.0,0.0,4.009885,2.247928,9.462952,4.146492,0.070389,0.070389,5.464015,0.0,2.140779,0.695994,0.0,0.0,4.734981,0.378512,0.042644,3.481557,4.3875,0.0,2.722466,0.124328,7.206917,2.763412,0.176323,4.137504,3.974529,0.0,0.028569,0.0,0.028569,4.658211,0.0,0.014355,4.812498,6.27221,0.028569,0.0,1.536053,0.0,0.014355,6.178117,4.191405,0.0,2.370164,6.449561,0.0,0.014355,0.0,0.0,0.0,2.24184,0.0,0.333424,0.0,3.460743,1.604071,6.32301,0.137504,6.514122,0.0,0.084064,0.263034,6.261907,0.042644,0.0,3.049631,4.263786,0.485427,4.064366,0.0,2.916477,4.404631,0.014355,4.830864,11.218805,6.683135,6.886062,0.0,0.0,0.0,0.0,0.0,6.228434,0.0,3.70044,0.298658,6.97728,0.0,0.0,7.520108,1.974529,4.123501,0.201634,0.0,0.0,4.721919,0.014355,0.321928,0.111031,0.238787,2.411426,0.0,3.0,0.0,3.956986,0.097611,0.0,0.0,6.584812,1.718088,0.124328,0.0,0.0,5.140779,3.866908,2.321928,3.513491,0.028569,0.176323,0.31034,3.485427,0.042644,0.0,0.0,0.0,0.0,0.0,1.367371,4.861955,1.956057,0.028569,0.056584,5.255123,0.0,3.971773,0.070389,0.0,0.0,0.0,0.042644,1.448901,6.450881,1.9855,7.356232,0.0,0.028569,0.15056,5.373996,0.014355,2.937344,7.334407,1.432959,0.659925,0.0,8.191257,7.147001,5.509696,0.042644,0.555816,0.0,0.0,0.028569,0.454176,0.0,1.124328,1.646163,1.618239,0.0,0.0,0.356144,0.263034,0.028569,5.417515,2.395063,0.124328,0.028569,0.189034,6.60585,3.102658,2.035624,4.243364,0.0,0.0,3.331992,0.0,0.594549,0.056584,0.0,0.0,0.757023,0.0,1.536053,5.372256,4.130931,4.555816,0.669027,2.891419,2.722466,0.485427,3.100978,2.31034,0.650765,0.056584,4.137504,1.823749,0.028569,0.0,0.0,6.38111,8.10376,1.803227,0.992768,7.328047,2.634593,0.014355,0.0,0.0,0.124328,0.014355,0.056584,0.042644,0.189034,0.014355,11.895462,5.704319,0.028569,0.084064,2.863938,0.0,5.51885,0.014355,0.226509,0.0,0.367371,0.028569,0.028569,0.321928,1.042644,0.815575,3.710393,2.797013,2.752749,9.716511,0.0,3.812498,1.176323,0.014355,3.122673,0.344828,2.771886,0.0,4.210233,6.201634,4.135863,0.411426,0.0,0.807355,3.879706,0.176323,0.056584,0.0,0.0,0.0,0.0,0.014355,0.070389,0.0,0.0,2.179511,0.0,5.124742,5.460087,0.014355,0.15056,1.144046,1.344828,8.597978,0.0,0.111031,0.014355,0.0,6.161283,4.055716,3.31904,3.50716,0.0,5.730096,1.799087,0.042644,0.0,4.041769,3.576522,0.0,0.0,4.586765,0.0,0.0,0.0,1.201634,0.356144,0.014355,3.125982,0.084064,2.735522,0.0,0.863938,6.938168,8.64958,0.0,0.0,0.286881,7.623004,3.716991,0.250962,6.826803,0.0,1.673556,0.516015,3.82985,3.454176,0.111031,5.720005,0.028569,0.0,0.807355,0.028569,6.100978,2.0,3.650765,1.516015,0.226509,3.185867,1.298658,0.124328,0.0,0.516015,0.0,0.111031,0.111031,1.531069,3.917432,1.117695,0.014355,2.895303,7.793961,4.70044,0.028569,0.0,0.014355,2.788686,0.0,0.014355,5.340562,1.709291,2.689299,0.014355,3.01614,5.910493,0.042644,3.240314,0.454176,0.454176,3.023255,0.163499,4.857981,0.042644,8.541445,0.070389,0.0,0.028569,7.448488,0.0,1.871844,0.070389,8.906921,1.356144,0.070389,2.049631,0.321928,5.678917,0.0,4.093391,3.674687,5.955359,0.333424,0.214125,0.432959,0.0,5.127221,0.918386,3.920293,2.794936,4.216455,1.632268,0.0,7.508587,4.296457,0.0,0.545968,0.659925,0.111031,4.619413,3.237258,4.475085,0.0,0.028569,0.0,0.0,4.908333,0.545968,0.014355,3.347666,7.526695,0.0,0.0,4.789729,4.778209,4.769243,5.821455,6.096346,8.191306,7.426936,0.042644,5.013016,0.0,6.162895,0.028569,0.014355,0.0,0.056584,8.064689,0.0,0.028569,0.0,4.492494,7.468665,0.0,0.124328,3.367371,5.612058,0.111031,0.0,6.821328,3.905928,0.0,1.405992,0.028569,0.0,1.799087,5.11395,0.263034,0.757023,0.163499,0.0,0.014355,0.0,5.526382,0.014355,0.0,0.0,0.014355,5.074249,0.0,2.974529,0.226509,3.845992,5.626147,0.0,0.0,0.111031,0.014355,0.0,0.0,0.298658,0.545968,0.0,6.998872,2.865919,0.286881,3.943921,0.0,0.0,4.018812,0.0,0.0,3.185867,4.05745,0.176323,0.056584,0.0,0.014355,0.0,1.195348,0.0,0.042644,1.356144,0.163499,0.0,0.333424,0.014355,0.0,2.883621,5.228049,0.0,0.028569,1.111031,0.014355,0.042644,4.438958,5.132166,4.566815,0.0,0.111031,0.0,0.014355,0.028569,0.0,1.104337,0.0,0.411426,0.0,1.646163,0.526069,0.014355,5.44228,6.572283,4.01614,0.0,0.0,3.887525,0.014355,5.115616,0.0,0.0,1.748461,0.028569,10.282857,0.0,1.565597,0.0,0.687061,0.014355,0.815575,0.0,0.014355,0.0,4.42156,6.148934,0.214125,0.0,0.0,0.014355,0.0,4.713696,1.111031,4.650765,0.963474,5.075533,0.0,4.280956,0.0,5.687621,0.0,0.15056,0.0,9.403289,3.215679,3.844988,3.545968,0.0,0.014355,0.0,0.0,3.983678,2.931683,0.0,0.189034,0.0,5.950702,0.0,0.0,0.879706,0.070389,0.748461,3.528571,0.0,7.008429,4.465322,4.398487,4.641546,0.0,0.137504,4.793896,0.070389,0.028569,3.880686,0.097611,0.815575,0.0
1316,A2058,ACH-000788,0.0,0.0,4.313971,3.539779,0.0,7.786531,6.597829,0.097611,4.460743,0.584963,0.070389,3.41007,2.543496,4.514753,0.275007,4.08151,0.0,1.056584,4.036503,1.70044,0.084064,0.042644,0.014355,3.489286,0.0,3.70044,0.014355,0.163499,0.028569,0.575312,0.0,0.0,0.0,0.111031,5.928133,0.070389,0.056584,0.014355,4.684819,0.014355,0.0,0.014355,0.250962,0.014355,6.261719,6.258896,8.043793,5.1534,0.0,0.042644,0.028569,0.042644,0.0,0.0,0.163499,0.0,0.0,4.586164,6.735116,0.0,4.469235,4.450221,4.110196,3.063503,6.710944,1.049631,0.111031,0.084064,3.966246,0.0,0.042644,4.754888,5.855242,0.0,1.589763,0.464668,0.0,0.042644,0.0,4.621173,0.713696,8.449479,0.163499,0.214125,0.0,4.988685,0.0,0.298658,0.411426,0.014355,0.0,4.017031,1.910733,3.090853,0.378512,5.878725,0.0,2.9855,0.014355,7.179312,0.214125,0.042644,4.305241,2.817623,0.056584,0.0,0.250962,0.070389,4.960234,0.014355,0.014355,4.346957,6.808256,0.201634,0.097611,0.863938,2.392317,0.014355,5.40973,3.38405,0.992768,1.207893,5.410748,0.226509,0.028569,0.0,0.0,0.0,6.346602,0.0,0.124328,0.0,3.360364,0.111031,5.607626,0.669027,0.823749,0.0,0.526069,1.144046,7.042425,1.063503,0.0,3.046142,3.904002,0.731183,2.100978,0.070389,3.451541,3.997292,0.056584,5.422906,10.2182,6.700856,5.673556,2.157044,0.238787,0.097611,0.0,0.15056,6.45253,0.014355,6.905928,0.0,7.953614,0.084064,0.0,7.476139,2.941106,4.149747,0.925999,0.0,0.0,1.378512,0.0,5.114367,0.0,0.773996,3.399171,0.0,4.44427,0.0,5.14323,0.014355,0.0,0.0,7.183784,0.992768,0.014355,0.0,0.042644,3.58376,4.084064,3.72465,4.97728,0.0,5.776367,0.632268,0.176323,0.028569,1.748461,0.111031,0.0,0.0,0.0,2.403268,4.375039,2.353323,0.432959,0.0,4.502076,0.014355,0.097611,0.163499,0.028569,0.0,0.0,0.014355,0.070389,5.128458,2.367371,6.074034,0.028569,0.0,0.201634,0.163499,0.042644,3.431623,8.254556,1.292782,2.137504,0.014355,6.912051,6.8098,6.215873,0.226509,1.555816,0.0,2.207893,0.0,0.765535,0.0,5.50462,0.941106,0.028569,0.464668,0.0,0.250962,0.124328,5.566511,5.396776,6.158862,2.750607,0.042644,5.449891,6.453847,2.819668,4.228819,2.513491,0.0,0.495695,4.593354,0.084064,0.070389,0.0,0.321928,0.042644,3.061776,0.056584,3.926948,5.986183,3.629939,4.560104,1.189034,2.790772,0.411426,0.389567,3.560715,5.443938,3.094236,0.084064,4.829342,2.523562,0.238787,0.014355,0.0,6.907251,8.318678,0.704872,0.0,6.759156,4.805808,0.042644,0.0,0.0,0.042644,0.014355,1.361768,0.0,0.15056,0.367371,11.191923,6.119771,0.097611,0.0,4.203984,0.31034,4.103498,0.014355,0.0,0.0,0.0,0.0,4.254745,3.370164,2.641546,1.207893,7.631323,1.819668,3.998196,8.902888,0.505891,4.168321,0.014355,0.344828,6.614563,0.422233,1.367371,0.0,2.983678,4.931683,4.646163,4.910733,0.15056,0.565597,4.506526,3.635754,0.389567,0.0,0.0,0.0,0.0,0.0,0.275007,0.0,0.014355,1.879706,0.0,0.097611,3.295723,3.084064,0.163499,1.480265,0.443607,7.678283,0.0,0.163499,0.0,0.0,5.8089,3.075533,3.196922,4.110196,0.0,5.738768,0.298658,0.070389,0.014355,3.412782,3.454176,2.773996,0.014355,4.301588,0.0,0.0,0.137504,0.485427,0.028569,0.0,0.903038,0.970854,2.83996,3.38405,0.536053,6.597084,7.908513,0.0,0.0,1.459432,7.137401,6.663914,0.056584,7.022812,0.0,1.176323,6.746716,3.730096,4.130931,0.226509,5.493775,0.028569,0.0,2.957915,0.669027,5.106851,3.095924,3.283922,0.782409,0.028569,3.229588,1.378512,0.516015,0.400538,0.847997,0.0,0.014355,0.641546,2.970854,3.978196,1.454176,0.097611,3.938286,5.833649,4.752749,0.495695,0.0,0.176323,0.111031,0.137504,0.014355,4.734439,2.017922,3.177918,0.111031,3.755956,5.444601,0.956057,3.134221,0.275007,0.0,1.83996,1.422233,5.216843,0.0,8.350541,0.0,0.0,0.014355,6.863319,0.545968,0.201634,0.070389,9.414432,1.803227,0.0,1.782409,7.294529,5.736605,0.0,5.255501,0.097611,5.634012,5.191405,0.695994,0.757023,0.028569,5.593354,1.584963,5.130519,4.550901,4.346957,3.590961,0.014355,4.463361,4.207112,0.0,2.275007,1.182692,0.111031,5.071677,3.153805,4.409391,0.014355,0.389567,0.0,0.226509,0.042644,0.650765,0.432959,6.294621,8.095344,0.0,0.464668,6.534809,5.203984,4.531069,4.613532,5.963936,8.739679,7.334318,0.0,5.05398,0.014355,5.361417,0.0,0.014355,0.0,0.111031,1.735522,0.0,0.028569,0.0,0.111031,6.14323,0.0,0.250962,3.799087,4.361768,0.014355,0.0,5.623223,4.524189,0.0,0.575312,0.124328,0.0,1.914565,5.185074,0.163499,0.356144,0.201634,0.0,0.014355,0.0,5.427271,0.0,0.0,0.0,0.298658,4.62527,0.042644,4.067811,0.014355,3.044394,4.64789,0.0,0.443607,0.378512,0.298658,0.0,0.0,1.028569,0.275007,0.0,5.747656,3.587365,0.641546,3.943921,0.111031,0.0,5.048759,0.0,0.0,3.072106,5.128046,0.226509,0.042644,0.0,0.0,0.014355,0.823749,0.014355,0.056584,0.176323,0.014355,0.0,0.739848,0.014355,0.0,3.372952,4.662205,0.0,0.137504,1.599318,0.111031,1.189034,4.42156,3.961623,3.533563,0.0,0.137504,0.0,0.15056,0.014355,0.0,0.400538,0.15056,1.786596,0.0,1.871844,2.715893,0.014355,5.387156,7.051481,4.55888,0.137504,0.0,4.074677,0.0,4.82273,0.0,0.226509,2.060047,0.0,10.696359,0.0,4.324811,0.0,0.070389,0.070389,0.0,0.097611,0.0,0.014355,4.319762,5.555203,2.280956,0.214125,0.0,0.084064,0.0,6.414812,1.443607,4.269781,0.028569,5.103078,0.0,4.570463,0.632268,4.873321,0.0,2.646163,0.014355,8.270622,2.007196,5.078524,3.496974,0.0,0.014355,0.070389,0.0,4.619413,2.531069,0.0,0.238787,0.0,4.24184,0.028569,0.0,2.443607,0.15056,1.137504,3.201634,0.028569,4.185867,5.175525,0.042644,4.926948,3.01614,4.233428,4.025915,0.097611,0.0,4.897724,0.632268,0.056584,0.0
998,A2780,ACH-000657,1.286881,0.097611,0.028569,3.61471,0.0,1.531069,7.395063,2.889474,0.176323,0.111031,0.0,3.308885,3.193772,4.402586,0.084064,2.639232,0.0,0.163499,5.004501,0.163499,0.097611,0.124328,0.042644,0.0,0.014355,3.763412,0.097611,0.014355,0.042644,0.464668,0.0,0.028569,0.0,4.22265,4.487358,0.695994,1.989139,0.014355,6.496175,0.0,0.0,0.014355,0.250962,0.070389,5.253611,5.405312,8.34163,5.499527,0.286881,0.0,0.823749,0.056584,0.0,0.0,2.62293,0.014355,0.238787,4.01078,5.759422,0.0,4.818135,0.163499,4.705425,2.397803,6.570766,0.333424,2.31904,1.31034,4.196922,0.0,0.214125,5.331992,5.350144,0.028569,0.137504,1.400538,0.014355,0.014355,0.014355,3.681449,0.226509,2.641546,0.028569,0.0,0.31034,5.652486,0.0,1.778209,0.137504,0.084064,0.028569,0.097611,0.0,1.819668,0.344828,0.084064,0.028569,3.922198,0.014355,6.560868,0.201634,2.364572,4.281698,0.731183,0.028569,0.028569,0.042644,0.226509,4.965323,0.0,0.070389,3.807355,3.992768,0.014355,0.070389,0.495695,1.286881,0.201634,5.502076,3.527321,0.028569,0.042644,4.754353,0.014355,0.028569,0.070389,0.0,0.028569,2.295723,0.124328,0.014355,0.0,2.107688,0.0,5.44062,2.709291,1.664483,0.014355,4.397803,0.124328,3.527321,0.176323,0.0,3.629939,3.929791,0.485427,0.028569,2.611172,3.023255,3.578939,0.214125,4.904002,8.866042,6.377991,6.453518,1.941106,1.575312,6.443441,0.0,0.356144,5.002703,0.097611,0.226509,0.475085,8.486473,0.028569,0.0,7.454505,2.655352,3.974529,1.739848,0.0,0.0,1.292782,0.0,5.140779,0.111031,1.952334,3.726831,0.084064,5.830103,0.0,4.28244,0.0,0.028569,0.0,7.011339,1.599318,3.903038,0.042644,0.176323,3.339137,3.609991,3.32625,4.060047,0.070389,0.070389,0.176323,3.017922,0.0,0.014355,0.0,0.0,2.372952,0.163499,0.863938,4.32553,1.555816,0.0,0.028569,4.709291,0.807355,0.056584,0.056584,0.201634,0.0,0.464668,0.0,0.333424,4.791814,2.950468,5.122673,0.0,1.664483,0.948601,1.454176,0.014355,3.357552,7.298017,4.65019,2.589763,0.014355,6.226123,7.210525,5.951168,0.014355,0.757023,1.85599,0.070389,0.0,3.294253,0.0,2.419539,0.847997,0.0,5.413459,0.0,0.214125,0.0,2.160275,4.447579,1.941106,0.250962,0.056584,0.238787,6.071891,3.288359,0.214125,5.362821,0.124328,0.0,4.178715,0.111031,0.014355,0.056584,0.111031,0.042644,2.763412,2.094236,3.664483,5.781097,4.042644,3.817623,2.140779,3.745237,0.189034,0.014355,2.748461,4.05398,4.165108,0.084064,3.160275,1.735522,1.970854,0.0,0.0,1.117695,7.928548,1.117695,0.0,6.474598,3.802193,0.176323,0.0,0.056584,0.014355,0.0,0.084064,0.0,1.867896,0.378512,10.731828,6.225159,0.028569,0.042644,3.896272,0.0,5.159064,0.163499,0.056584,0.0,0.526069,0.0,0.028569,0.014355,0.042644,1.422233,6.006522,1.137504,1.226509,8.718053,0.739848,3.443607,1.815575,0.137504,0.176323,0.495695,0.014355,0.0,0.014355,4.090853,4.120186,5.126808,0.056584,2.070389,4.670161,0.298658,0.014355,0.0,0.028569,1.130931,0.0,0.0,0.201634,0.042644,0.070389,4.436961,0.422233,0.516015,0.454176,2.521051,0.097611,1.608809,0.111031,7.411002,2.336283,0.432959,0.0,0.0,6.156842,0.333424,3.41684,3.673556,0.0,5.152183,0.0,0.028569,0.0,3.275007,3.539779,0.111031,0.014355,4.128458,0.0,0.0,0.084064,0.070389,0.070389,0.014355,0.014355,0.201634,4.417515,0.0,0.526069,3.85997,8.252902,0.0,0.0,3.448901,7.862637,3.464668,0.641546,7.089583,0.0,0.084064,0.516015,3.970854,4.39163,0.0,6.004277,0.070389,0.028569,0.042644,0.286881,5.487679,3.152183,3.539779,0.056584,0.042644,2.782409,0.356144,0.918386,0.214125,1.786596,0.0,0.042644,1.144046,0.650765,4.078097,5.0387,0.084064,2.263034,6.575917,4.508429,0.056584,0.0,0.163499,1.411426,0.189034,1.049631,0.028569,2.257011,8.314289,0.124328,1.910733,4.522307,3.360364,2.809414,2.536053,0.0,0.028569,1.007196,5.206331,0.0,7.308157,0.356144,0.014355,0.176323,3.097611,0.097611,0.014355,0.056584,9.310976,1.565597,0.028569,1.438293,1.827819,5.971314,0.014355,3.765535,0.782409,4.950468,6.429281,0.070389,0.831877,0.014355,5.897724,1.851999,5.12143,3.697107,6.032542,2.847997,0.0,0.333424,3.019702,0.028569,0.344828,1.411426,3.465974,5.111866,4.370164,3.80426,0.042644,0.505891,0.0,0.028569,0.056584,3.129283,0.594549,3.496974,7.517748,0.536053,5.32301,3.385431,6.135248,3.762349,4.330558,6.509062,5.638364,7.046469,0.555816,4.505256,0.014355,5.334139,0.124328,0.0,0.0,0.028569,0.933573,0.0,0.028569,0.014355,8.533485,6.694184,0.014355,0.963474,3.925999,6.345538,0.014355,0.632268,5.082362,1.541019,0.0,0.378512,2.974529,0.0,2.140779,1.02148,0.389567,0.014355,0.0,0.0,0.432959,0.0,6.079378,0.495695,0.0,0.0,0.070389,2.742006,0.028569,3.443607,2.946731,2.726831,4.333424,0.014355,0.097611,0.275007,0.014355,0.014355,0.0,0.042644,0.275007,0.0,5.964861,4.257011,2.550901,4.604071,0.014355,0.0,5.025029,0.070389,0.0,2.715893,4.727376,0.028569,0.0,0.0,0.014355,0.028569,0.765535,0.0,0.765535,0.028569,1.298658,0.070389,0.505891,0.0,0.0,2.659925,4.402586,0.042644,0.669027,2.765535,0.124328,0.014355,3.658783,3.354734,4.382667,0.014355,0.286881,0.084064,0.042644,0.189034,0.0,0.286881,0.028569,7.550901,0.0,0.028569,2.378512,0.014355,5.922674,7.019702,1.944858,0.028569,0.014355,3.465974,0.0,6.007644,0.0,0.584963,1.695994,0.31034,9.847057,0.0,4.104337,0.014355,0.056584,0.321928,0.070389,0.933573,0.0,0.0,3.750607,5.303781,0.344828,0.014355,0.014355,0.014355,0.014355,0.422233,0.85599,3.915521,0.097611,5.941106,0.0,4.672425,0.0,5.047015,0.214125,5.992995,0.028569,8.769706,0.056584,1.555816,3.863938,0.014355,0.263034,0.0,0.0,5.999324,1.963474,0.0,0.226509,0.014355,4.313971,1.871844,0.0,2.301588,0.238787,0.485427,3.836934,0.124328,3.030336,5.47476,0.097611,4.739308,0.0,0.713696,4.882154,5.135453,0.056584,2.198494,3.196922,0.014355,0.0
1185,A375,ACH-000219,0.0,0.0,3.385431,2.82171,0.0,5.535431,6.361066,0.201634,3.518535,0.650765,0.189034,2.989139,2.217231,4.093391,0.014355,3.794936,0.0,0.948601,4.250204,0.62293,0.097611,0.0,0.042644,3.463361,0.014355,3.830864,0.028569,0.028569,0.028569,0.163499,0.0,0.014355,0.0,0.400538,5.425258,0.238787,0.042644,0.0,2.845992,0.070389,0.0,0.014355,0.176323,0.704872,5.810443,6.07596,7.496335,5.192589,0.163499,0.028569,0.137504,0.084064,0.0,0.0,0.15056,0.014355,0.0,2.799087,6.114783,0.0,4.31034,2.978196,3.411426,2.794936,6.839456,1.117695,0.042644,0.298658,2.807355,0.0,0.0,4.488001,4.244887,0.0,2.100978,0.678072,0.0,0.214125,0.042644,3.44228,1.195348,10.283088,1.636915,0.163499,0.604071,5.710944,0.0,1.831877,0.201634,0.238787,0.0,3.83289,0.0,3.297191,1.195348,4.963936,0.028569,3.215679,0.014355,6.887891,1.0,0.014355,4.369466,2.695994,0.028569,0.0,0.0,0.028569,4.683135,0.0,0.516015,4.628774,6.177121,0.028569,0.014355,3.973611,0.111031,0.201634,5.725196,3.386811,0.918386,3.385431,4.893362,0.111031,0.014355,0.028569,0.042644,0.0,5.279471,0.0,2.094236,0.0,2.560715,0.910733,5.468583,0.201634,3.78136,0.0,0.263034,0.555816,4.962086,1.014355,0.0,3.192194,4.004501,0.526069,0.815575,0.286881,3.382667,2.538538,0.028569,5.793896,9.904605,6.242603,6.501121,2.414136,0.176323,0.0,0.014355,0.641546,5.105594,0.124328,5.798828,0.367371,7.792074,0.0,0.0,7.203397,2.094236,4.110196,1.007196,0.0,0.0,3.50716,0.0,4.9855,0.0,0.15056,2.370164,0.0,5.215679,0.15056,3.834913,0.028569,0.0,0.0,6.632995,2.229588,0.0,0.0,0.070389,2.776104,5.169925,2.636915,4.393004,0.111031,6.263034,0.505891,0.070389,0.0,2.996389,0.014355,0.0,0.0,0.028569,2.361768,4.33985,1.910733,1.090853,0.070389,4.215679,0.0,0.0,0.014355,0.042644,0.0,0.0,0.124328,0.111031,5.915043,3.415488,6.292966,0.014355,0.0,0.056584,1.49057,0.028569,3.508429,7.587515,0.925999,3.198494,0.0,7.981168,7.01022,5.597531,0.028569,1.238787,0.0,1.883621,0.0,0.31034,0.070389,5.913608,0.713696,0.070389,0.0,0.0,0.111031,0.344828,2.117695,4.998196,3.114367,3.061776,0.189034,1.847997,5.968321,3.397803,2.130931,2.568032,0.0,0.124328,3.682573,0.014355,0.0,0.014355,0.042644,0.0,3.200065,0.15056,3.533563,5.981168,3.587365,4.203201,1.752749,3.193772,0.565597,1.144046,2.865919,3.001802,1.157044,0.238787,4.439623,2.885574,0.695994,0.0,0.0,6.30305,7.480911,0.641546,0.0,7.070389,4.217231,0.238787,0.0,0.0,0.014355,0.0,1.438293,0.0,0.084064,0.333424,11.044053,4.732812,0.042644,0.0,4.139961,0.15056,4.420887,0.028569,0.070389,0.163499,0.565597,0.0,2.38405,0.475085,3.635754,0.400538,6.693626,1.495695,4.503985,9.1484,0.389567,3.914565,0.555816,0.0,3.851999,0.389567,1.713696,0.0,1.427606,4.410748,5.695159,4.59156,0.124328,0.014355,4.347666,2.925999,1.459432,0.0,0.084064,0.0,0.0,0.014355,0.042644,0.0,0.0,3.38819,0.0,0.097611,3.592158,3.695994,0.014355,1.0,0.918386,7.075853,0.056584,0.321928,0.0,0.0,5.841973,3.598127,3.198494,2.891419,0.0,4.566206,0.056584,0.097611,0.0,3.288359,3.847997,2.611172,0.0,4.863443,0.0,0.028569,1.443607,3.344828,0.9855,0.0,1.02148,0.298658,4.059182,0.298658,0.15056,6.040673,7.965207,0.422233,0.0,2.182692,7.047124,5.638943,0.097611,6.536053,0.0,0.389567,6.732541,3.252476,4.418865,0.526069,5.417177,0.014355,0.028569,1.505891,0.263034,4.714246,4.036503,3.825786,0.505891,0.475085,3.620586,4.1152,0.941106,0.070389,2.477677,0.0,0.097611,0.536053,3.485427,3.732269,2.223423,0.042644,3.496974,6.57107,4.522307,0.111031,0.0,1.400538,0.163499,0.084064,0.189034,3.192194,3.007196,1.807355,0.028569,3.836934,5.078524,2.140779,3.514753,0.201634,0.056584,5.111449,0.933573,5.642702,0.056584,8.422359,0.250962,0.0,0.0,7.948134,0.0,0.070389,0.028569,9.680817,1.292782,0.042644,1.704872,7.411596,6.095292,0.0,4.298658,3.153805,5.771093,4.432291,0.028569,0.356144,0.0,5.569552,1.232661,4.75007,4.214125,4.491853,3.982765,0.0,4.589763,3.257011,0.0,1.378512,2.316146,0.0,5.842979,3.9855,4.006298,0.014355,0.111031,0.0,0.238787,0.042644,2.100978,0.400538,5.252476,6.897603,0.0,1.565597,5.08151,4.493135,4.348374,3.481557,6.924456,9.606239,7.134632,0.056584,3.914565,0.056584,5.196135,0.028569,0.0,0.0,0.070389,0.669027,0.0,0.042644,0.0,0.124328,6.656639,0.0,0.632268,3.737687,4.942984,0.070389,0.014355,5.897482,1.773996,0.0,0.956057,2.137504,0.056584,2.769772,4.740928,0.411426,0.084064,0.214125,0.0,0.238787,0.0,6.564835,0.014355,0.0,0.0,0.084064,4.720826,0.0,4.322649,0.084064,2.837943,4.995485,0.0,0.941106,0.411426,0.432959,0.014355,0.014355,1.769772,0.941106,0.0,4.775051,5.0054,0.0,3.177918,0.0,0.028569,5.175125,0.0,0.0,3.212569,4.351204,0.189034,0.0,0.0,0.014355,0.014355,0.400538,0.0,0.042644,0.0,0.056584,0.0,0.275007,0.014355,0.0,3.283922,4.903038,0.014355,0.056584,1.895303,0.137504,2.100978,3.311794,2.792855,3.179511,0.014355,0.176323,0.0,0.15056,0.0,0.0,0.695994,0.0,1.650765,0.0,3.85997,1.510962,0.028569,5.710944,6.715756,4.067811,0.613532,0.0,2.849999,0.014355,4.68818,0.0,0.321928,1.510962,0.0,9.671576,0.0,3.099295,0.014355,0.0,0.356144,0.464668,0.0,0.0,0.014355,4.311794,5.424922,0.565597,0.111031,0.070389,0.028569,0.0,6.018145,1.823749,4.881665,0.014355,4.330558,0.0,3.786596,0.0,4.710944,0.0,2.100978,0.070389,8.24246,1.31034,3.740928,3.272023,0.0,0.0,0.0,0.0,3.713696,1.678072,0.0,0.028569,0.0,4.125155,0.014355,0.0,2.263034,0.790772,0.464668,4.023255,0.0,4.497612,6.434795,1.627607,5.138323,4.958843,4.766595,4.474436,0.659925,0.028569,4.512227,0.189034,0.263034,0.0
1269,A498,ACH-000555,0.042644,0.084064,0.056584,3.025029,0.0,6.922317,6.33396,7.592831,5.526382,1.111031,0.084064,3.124328,1.541019,3.371559,0.056584,3.516015,0.0,1.95977,3.258519,0.333424,0.15056,0.263034,0.028569,0.0,0.0,2.577731,0.695994,0.042644,0.014355,1.367371,0.0,0.014355,0.0,5.828073,4.776104,0.238787,0.014355,0.014355,5.938521,0.0,0.0,0.0,0.070389,0.201634,6.087675,5.036064,7.435379,3.887525,0.815575,0.014355,0.163499,3.234195,0.0,0.0,0.389567,0.014355,0.111031,4.351204,4.761285,0.0,0.028569,1.843984,5.732812,2.899176,6.035844,1.333424,1.157044,0.933573,2.316146,0.014355,0.0,3.892391,4.521051,0.0,2.632268,1.169925,0.263034,0.0,0.014355,2.91265,2.084064,10.22062,3.400538,0.356144,0.0,4.186659,0.0,2.584963,0.163499,0.238787,0.0,5.050502,0.070389,0.0,3.155425,0.028569,0.028569,2.223423,0.070389,5.879461,2.568032,0.400538,2.662205,2.405992,0.028569,0.0,0.028569,0.189034,2.799087,0.0,0.0,3.983678,5.407693,0.014355,0.0,1.049631,0.0,0.555816,4.221877,4.653633,1.157044,5.816344,6.358256,0.111031,0.0,0.042644,0.028569,0.014355,1.782409,0.084064,0.226509,0.0,2.550901,1.400538,5.344473,0.238787,5.719457,0.0,4.08151,0.084064,4.06953,0.137504,0.0,1.963474,3.671293,0.815575,3.102658,0.201634,2.908813,4.092546,0.214125,5.524503,9.875181,5.851749,5.546894,3.165108,1.275007,1.111031,0.0,0.084064,6.211207,0.0,7.303141,1.195348,7.305332,0.0,0.0,6.867032,1.933573,2.307429,1.744161,0.0,0.0,5.81455,0.042644,4.934517,0.014355,1.0,4.885574,0.575312,4.576522,0.0,5.108943,0.042644,0.028569,0.0,5.876517,1.226509,1.226509,0.0,0.028569,5.15583,2.9855,2.189034,4.69488,0.097611,0.956057,1.650765,0.111031,0.014355,0.056584,0.0,0.014355,0.0,0.014355,1.333424,4.596339,1.823749,0.014355,0.056584,3.447579,0.028569,0.042644,0.124328,0.0,0.0,0.0,0.014355,0.070389,5.180307,3.224966,5.517276,0.014355,0.056584,0.084064,5.457463,0.014355,4.537917,6.574404,0.687061,0.526069,0.014355,7.03848,6.049413,4.92837,0.097611,2.961623,0.0,2.185867,0.056584,0.807355,0.0,6.952916,1.9855,0.056584,0.0,0.028569,2.269033,0.0,0.0,4.071248,2.028569,1.035624,0.0,0.124328,5.590362,2.435629,1.063503,4.740388,0.042644,0.042644,4.013462,0.632268,5.888256,0.15056,0.0,0.0,0.799087,0.722466,4.168321,4.589763,4.759156,2.792855,1.687061,2.121015,3.550901,0.678072,2.153805,5.219556,1.744161,0.097611,4.329124,1.952334,0.871844,0.014355,0.0,7.442031,6.521365,1.669027,0.356144,6.858105,5.281327,0.545968,0.0,0.85599,0.028569,0.0,0.62293,0.042644,4.813012,0.773996,10.655441,8.821615,0.321928,0.321928,3.894333,0.084064,5.094236,0.879706,0.0,0.0,2.111031,0.0,0.014355,5.240314,0.014355,2.211012,6.81839,2.467279,1.752749,8.553898,0.042644,2.831877,0.565597,4.392317,7.472813,0.454176,2.277985,0.0,1.906891,5.87799,3.833902,0.056584,0.0,4.72792,3.454176,0.847997,0.0,0.028569,0.0,0.014355,0.028569,0.0,0.214125,0.0,0.0,2.980025,0.042644,4.507795,3.934517,0.214125,0.226509,1.104337,1.367371,6.537296,2.097611,0.189034,0.0,0.0,4.885574,3.234195,1.575312,3.460743,0.0,4.670727,0.226509,0.042644,0.0,3.903038,1.580145,0.042644,0.0,6.958611,0.0,0.0,0.250962,0.070389,0.0,0.028569,3.100978,0.137504,4.772414,0.056584,1.157044,5.341274,6.335926,0.0,0.084064,1.823749,6.972922,5.667324,0.070389,6.245458,0.0,0.124328,1.38405,2.575312,4.059182,0.056584,4.732812,0.014355,0.028569,0.495695,0.176323,4.106851,4.142413,3.702658,2.618239,0.014355,3.040892,6.923625,0.485427,0.344828,1.550901,0.0,0.124328,1.292782,2.438293,2.304511,3.24184,0.014355,2.922198,6.321567,4.59156,0.400538,0.782409,0.028569,3.344828,0.432959,2.488001,5.849999,3.788686,6.324451,0.056584,3.439623,5.062208,0.189034,2.503349,0.250962,0.0,4.360364,0.739848,3.979111,0.028569,7.589838,0.422233,0.042644,0.0,5.08534,0.0,0.757023,0.028569,1.914565,1.104337,0.970854,1.432959,1.244887,4.365972,0.432959,4.57289,3.771886,6.307793,0.516015,0.422233,0.565597,0.0,4.852498,0.432959,4.801676,3.776104,4.337711,3.044394,0.0,6.586314,2.797013,0.0,3.012569,0.782409,0.097611,5.399171,5.224581,4.726831,0.014355,0.887525,0.0,0.070389,7.876517,1.163499,0.0,5.46238,8.725298,0.0,0.163499,5.659354,5.540709,2.819668,5.841218,4.728465,8.356408,6.533252,0.189034,3.878725,0.0,5.362119,0.042644,0.0,0.0,5.989593,8.371864,0.0,0.028569,0.0,4.956986,6.196332,0.0,3.840967,4.452859,6.551516,0.084064,0.163499,5.092546,4.809929,0.0,1.372952,1.232661,0.0,1.608809,5.414474,0.62293,1.361768,0.056584,0.0,0.0,0.0,5.723012,0.014355,0.0,0.0,0.042644,4.82171,0.0,3.283922,0.250962,3.718088,5.070819,0.0,0.594549,0.15056,0.042644,0.0,0.014355,0.678072,0.344828,0.028569,7.21393,3.258519,0.422233,3.276497,0.0,0.0,3.982765,0.0,0.0,3.361768,3.575312,0.226509,0.0,0.0,0.056584,0.0,2.998196,0.014355,0.014355,1.117695,0.422233,0.0,1.014355,0.042644,0.0,3.382667,4.684819,0.014355,0.367371,0.475085,0.028569,0.014355,4.340562,3.9855,4.699885,0.0,0.056584,0.111031,0.176323,0.097611,0.056584,0.214125,0.070389,4.494416,0.0,1.967169,2.865919,0.0,4.845992,6.137504,3.833902,0.042644,0.0,2.372952,0.014355,5.132577,0.0,0.056584,1.655352,0.014355,9.381478,0.0,2.201634,0.014355,0.097611,0.201634,0.014355,0.0,0.0,4.334139,3.38819,4.508429,0.575312,0.0,0.189034,0.15056,0.056584,0.687061,0.464668,4.125982,0.0,4.680887,0.176323,4.147307,0.028569,4.769243,0.0,2.794936,0.014355,8.20921,1.169925,3.684819,3.127633,0.028569,0.014355,0.0,0.0,5.210233,3.053111,0.0,0.137504,0.0,3.864929,0.014355,0.0,1.510962,0.056584,1.189034,3.538538,0.028569,6.391974,8.085711,4.317594,4.779785,0.0,0.201634,3.617063,0.286881,0.111031,4.767655,0.604071,0.333424,0.0


In [60]:
print(drug_target_depmap_reduced.shape, len(set(drug_target_depmap_reduced['gene symbol'])))
# the first output is the DTI set, including 2332 DTIs, while only 679 targets/genes are included in these 2332 DTIs.

(2332, 3) 679


In [None]:
# the order of CCLE_expression_depmap_reduced is based on cellline2relid_dict

In [15]:
# after screening samples based on existing CCLE, current determined datasets include:
print('drugcomb_depmap_reduced.shape:', drugcomb_depmap_reduced.shape)
print('drug_target_depmap_reduced.shape:', drug_target_depmap_reduced.shape)

print('len(drug2absid_dict):', len(drug2absid_dict))
print('len(target2absid_dict):', len(target2absid_dict))
print('len(cellline2absid_dict):', len(cellline2absid_dict))

print('len(drug2relid_dict):', len(drug2relid_dict))
print('len(cellline2relid_dict):', len(cellline2relid_dict))

# next we need to determine the twosides and target sets according to the current determined datasets again

drugcomb_depmap_reduced.shape: (11166, 29)
drug_target_depmap_reduced.shape: (2332, 3)
len(drug2absid_dict): 213
len(target2absid_dict): 12802
len(cellline2absid_dict): 147
len(drug2relid_dict): 106
len(cellline2relid_dict): 60


In [None]:
# a chessboard of rel_drug*rel_drug*cell line number size
# due to the reduction of drug/drug-drug pairs, the adverse effect samples also decrease

In [18]:
# start to determine the twosides dataset
twosides_pairset = set(twosides['unified_name'])
drugcomb_depmap_reduced_pairset = set(drugcomb_depmap_reduced['unified_name'])
inter_depmap_reduced_pairset = list(set.intersection(twosides_pairset, drugcomb_depmap_reduced_pairset))
inter_depmap_reduced_pairset.sort()

twosides_depmap_reduced = []
for row in np.array(twosides):
    if(row[-1] in inter_depmap_reduced_pairset):
        twosides_depmap_reduced.append(row)

twosides_depmap_reduced = pd.DataFrame(twosides_depmap_reduced, columns=twosides.columns)
print('drug pair numbers in drugcomb and towsides:', len(set(drugcomb_depmap_reduced['unified_name'])), len(set(twosides_depmap_reduced['unified_name'])))
print('twosides_depmap_reduced.shape:', twosides_depmap_reduced.shape)

# after processing, 346 drug pairs are remained in drugcomb_depmap and twosides_depmap, while in twosides_depmap, 2446 samples are remained
# before processing: 2764 drug pairs are remained
# after processing, drug-drug-cell line pairs focus on fewer drug/drug-drug pairs
# although the total number of drug-drug-cell line pairs increase

# start to determine the target-target dataset
# based on our current selected meta-path types (DTD, DTTD, DTTTD),
# at least one target in target_target samples should be in the target set of drug_target_depmap_reduced
targetset4drug_target_depmap_reduced = set(drug_target_depmap_reduced['gene symbol'])

target_target_depmap_reduced = []
for row in np.array(target_target): 
    if (row[0] in targetset4drug_target_depmap_reduced) or (row[1] in targetset4drug_target_depmap_reduced):
        target_target_depmap_reduced.append(row)
target_target_depmap_reduced = pd.DataFrame(target_target_depmap_reduced, columns=target_target.columns)

targetset_reduced = set(target_target_depmap_reduced['gene1 symbol']).union(target_target_depmap_reduced['gene2 symbol'])
targetset_reduced = list(targetset_reduced.union(targetset4drug_target_depmap_reduced))
targetset_reduced.sort()
target2relid_dict = {target: i for i, target in enumerate(targetset_reduced)}

print('target_target_depmap_reduced.shape:', target_target_depmap_reduced.shape)
print('len(target2relid_dict):', len(target2relid_dict))
print('len(targetset_reduced):', len(targetset_reduced))

drug pair numbers in drugcomb and towsides: 346 346
twosides_depmap_reduced.shape: (2446, 7)
target_target_depmap_reduced.shape: (91785, 2)
len(target2relid_dict): 12217
len(targetset_reduced): 12217


In [23]:
# previous: 7089 drug-drug-cell lines, 18832 AE samples
# now: 11166 drug-drug-cell lines, 2446 AE samples

# previous: 2694 drug pairs, 159 drugs
# now: 346 drug pairs, 106 drugs

# each kind of drug pair corresponds to similar number of AE labels (previous and now), but the total drug pair varieties decrease dramatically
print(18832/2694, 2446/346) # AE

# although the number of AE that each drug pair corresponds to is similar, but for now each drug pair corresponds much more cell lines 
print(7089/2694, 11166/346) # TE

# previous vs now: for each drug pair, its averaging AE label number: unchanged, its averaging TE number: increasing a lot (3 to 30)

print('total drug, target, cell line numbers:', len(drug2relid_dict), len(target2relid_dict), len(cellline2relid_dict))

6.990348923533778 7.069364161849711
2.631403118040089 32.27167630057804
total drug, target, cell line numbers: 106 12217 60


In [24]:
# generate drug-drug adjacent matrices based on relative ids and drug lowercase names
# current do not double the drug-drug pairs by reversing A-B to B-A (thus current adjacent matices are not symmetric)
# to avoid data leakage, only to double drug-drug pairs in the specific training set

duplicated_te = []
drug_te_drug_matrix = np.zeros((len(drug2relid_dict), len(drug2relid_dict)))
for _, row in drugcomb_depmap_reduced.iterrows():
    # row
    temp1 = drug2relid_dict[row['drug1_lower']]
    # col
    temp2 = drug2relid_dict[row['drug2_lower']]
    # check whether exists A/B or B/A cases
    if(drug_te_drug_matrix[temp2, temp1] == 1):
        duplicated_te.append(row)
    drug_te_drug_matrix[temp1, temp2] = 1

duplicated_se = []
drug_se_drug_matrix = np.zeros((len(drug2relid_dict), len(drug2relid_dict)))
for _, row in twosides_depmap_reduced.iterrows():
    # row
    temp1 = drug2relid_dict[row['drug1_lower']]
    # col
    temp2 = drug2relid_dict[row['drug2_lower']]
    # check whether exists A/B or B/A cases
    if(drug_se_drug_matrix[temp2, temp1] == 1):
        duplicated_se.append(row)
    drug_se_drug_matrix[temp1, temp2] = 1

print(drug_se_drug_matrix.sum(), drug_te_drug_matrix.sum())
# *** no duplicated A-B/B-A drug pairs if the two lists are empty ***
# *** (every sample in current drugcomb and twosides does not have the reverse counterpart) ***
print(duplicated_te, duplicated_se)

# *** re-generate the drug_te_drug_matrix according to pre-defined threshold for synergy score values ***

# A p-value, or probability value, is a number describing how likely it is that your data would have occurred by random chance (i.e. that the null hypothesis is true).
# A p-value less than 0.05 (typically ≤ 0.05) is statistically significant. It indicates strong evidence against the null hypothesis, as there is less than a 5% probability the null is correct (and the results are random). Therefore, we reject the null hypothesis, and accept the alternative hypothesis.

# PPF of the standard normal distribution for the probability 1-a = 0.95
# scipy.stats.norm.ppf(0.95)=1.64, https://educationalresearchtechniques.com/2018/09/24/z-scores-and-inferential-stats-in-python/
# do not need to do 0-1 normalization
# based on loewe synergy score

duplicated_te = []
synergy_score_qualified = []
drug_te_drug_matrix = np.zeros((len(drug2relid_dict), len(drug2relid_dict)))
used_synergy_score = 'synergy_loewe'
mean = np.mean(drugcomb_depmap_reduced[used_synergy_score])
std = np.std(drugcomb_depmap_reduced[used_synergy_score])
for _, row in drugcomb_depmap_reduced.iterrows():
    # row
    temp1 = drug2relid_dict[row['drug1_lower']]
    # col
    temp2 = drug2relid_dict[row['drug2_lower']]
    z_score = (float(row[used_synergy_score]) - mean) / std # z-score for current sample
    # check A-B/B-A
    if(drug_te_drug_matrix[temp2, temp1] == 1):
        duplicated_te.append(row)
    if z_score >= 1.64:
        drug_te_drug_matrix[temp1, temp2] = 1
        synergy_score_qualified.append(float(row[used_synergy_score]))
        
print(duplicated_te)
# threshold: 17.06, synergy_score_qualified: total number of synergy score that meets the pre-defined threshold
# based on each drug-drug pair, maybe there are many drug-drug-cell line samples have a synergy score larger than pre-defined threshold
print(len(synergy_score_qualified), np.max(synergy_score_qualified),
      np.min(synergy_score_qualified), np.mean(synergy_score_qualified))
# 36/346 of drug-drug pairs have the te edge in drug_te_drug_matrix
print(drug_te_drug_matrix.sum())

346.0 346.0
[] []
[]
84 70.1360399671155 17.0599025704251 24.690158328988062
37.0


In [25]:
# after generating asymmetric drug-drug matrices, generate target-target (symmetric) and drug-target (asymmetric) matrices
target_target_matrix = np.zeros((len(target2relid_dict), len(target2relid_dict)))
for row in np.array(target_target_depmap_reduced):
    # row
    temp1 = target2relid_dict[row[0]]
    # col
    temp2 = target2relid_dict[row[1]]
    target_target_matrix[temp1, temp2] = 1
    target_target_matrix[temp2, temp1] = 1

drug_target_matrix = np.zeros((len(drug2relid_dict), len(target2relid_dict)))
for row in np.array(drug_target_depmap_reduced):
    # drug
    temp1 = drug2relid_dict[row[1]]
    # target
    temp2 = target2relid_dict[row[2]]
    drug_target_matrix[temp1, temp2] = 1

In [26]:
# four main matrices to be used:
print('drug_te_drug_matrix.shape:', drug_te_drug_matrix.shape)
print('drug_se_drug_matrix.shape:', drug_se_drug_matrix.shape)
print('target_target_matrix.shape:', target_target_matrix.shape)
print('drug_target_matrix.shape:', drug_target_matrix.shape)

drug_te_drug_matrix.shape: (106, 106)
drug_se_drug_matrix.shape: (106, 106)
target_target_matrix.shape: (12217, 12217)
drug_target_matrix.shape: (106, 12217)


In [44]:
from scipy import sparse

prefix = 'D:/B/PROJECT B2_2/dataset/Muthene_dataset/'
midfix = 'common files/'

# transform the above generated dense matrices to sparse ones
# the ids in these matrics are based on drug2rel_dict and target2rel_dict

drug_se_drug_coomatrix = sparse.coo_matrix(drug_se_drug_matrix)
drug_te_drug_coomatrix = sparse.coo_matrix(drug_te_drug_matrix)
drug_target_coomatrix = sparse.coo_matrix(drug_target_matrix)
target_target_coomatrix = sparse.coo_matrix(target_target_matrix)

# store the files generated above to the specified folder (currently same to the original data folder)
sparse.save_npz(prefix + midfix + 'drug_se_drug_coomatrix.npz', 
                drug_se_drug_coomatrix) # asymmetric
sparse.save_npz(prefix + midfix + 'drug_te_drug_coomatrix.npz',
                drug_te_drug_coomatrix) # asymmetric
sparse.save_npz(prefix + midfix + 'drug_target_coomatrix.npz',
                drug_target_coomatrix) # asymmetric
sparse.save_npz(prefix + midfix + 'target_target_coomatrix.npz',
                target_target_coomatrix) # symmetric

# drug and target files before processing based on depmap reduced (but after the correction of false/redundant samples)
# based on absid_dicts
drugcomb.to_csv(prefix + midfix + 'drugcomb.csv', index=False)
twosides.to_csv(prefix + midfix + 'twosides.csv', index=False)
drug_target.to_csv(prefix + midfix + 'drug_target.csv', index=False)
target_target.to_csv(prefix + midfix + 'target_target.csv', index=False)

# drug and target files after processing based on depmap reduced
# based on relid_dicts
drugcomb_depmap_reduced.to_csv(prefix + midfix + 'drugcomb_depmap.csv', index=False)
twosides_depmap_reduced.to_csv(prefix + midfix + 'twosides_depmap.csv', index=False)
drug_target_depmap_reduced.to_csv(prefix + midfix + 'drug_target_depmap.csv', index=False)
target_target_depmap_reduced.to_csv(prefix + midfix + 'target_target_depmap.csv', index=False)

# six mapping dict generated in this file
with open(prefix + midfix + 'drug2relid_dict.pickle', 'wb') as out_file:
    pickle.dump(drug2relid_dict, out_file)
with open(prefix + midfix + 'target2relid_dict.pickle', 'wb') as out_file:
    pickle.dump(target2relid_dict, out_file)
with open(prefix + midfix + 'cellline2relid_dict.pickle', 'wb') as out_file:
    pickle.dump(cellline2relid_dict, out_file)
with open(prefix + midfix + 'drug2absid_dict.pickle', 'wb') as out_file:
    pickle.dump(drug2absid_dict, out_file)
with open(prefix + midfix + 'target2absid_dict.pickle', 'wb') as out_file:
    pickle.dump(target2absid_dict, out_file)
with open(prefix + midfix + 'cellline2absid_dict.pickle', 'wb') as out_file:
    pickle.dump(cellline2absid_dict, out_file)

In [28]:
print(CCLE_expression_depmap_reduced.shape)
CCLE_expression_depmap_reduced.head()

(60, 679)


Unnamed: 0,cellline_name,depmap_id,CHRNA4 (1137),CHRNA2 (1135),FABP7 (2173),TGFBR1 (7046),SCN10A (6336),MMP14 (4323),PSMD1 (5707),CA12 (771),TBXAS1 (6916),PTGER4 (5734),CHRNA6 (8973),HIPK3 (10114),SLC47A1 (55244),DCK (1633),KIT (3815),DHRS1 (115817),DHRS7C (201140),SCN8A (6334),OGG1 (4968),HPGD (3248),CHRNE (1145),ZAP70 (7535),GPR27 (2850),FLT1 (2321),KCNA1 (3736),DHODH (1723),KCNQ1 (3784),GNRHR (2798),FGR (2268),PDE11A (50940),GPR12 (2835),SCN11A (11280),TSSK2 (23617),CA2 (760),MAP3K11 (4296),HTR6 (3362),GPR84 (53831),GPR151 (134391),RDH10 (157506),RDH8 (50700),TAAR6 (319100),CHRNA1 (1134),SSTR2 (6752),AR (367),MAP4K4 (9448),GAK (2580),FDPS (2224),SCAP (22937),FABP4 (2167),FLT3 (2322),NOS2 (4843),SYK (6850),OPRM1 (4988),GPR142 (350383),SBK1 (388228),HRH2 (3274),UTS2R (2837),LYN (4067),PBK (55872),GPR6 (2830),EPHA3 (2042),PLD1 (5337),FGFR4 (2264),LTB4R (1241),AURKA (6790),RBP5 (83758),CACNA1G (8913),JAK3 (3718),PASK (23178),CYP2C9 (1559),SLC6A20 (54716),ERBB2 (2064),NQO2 (4835),NMUR2 (56923),THRB (7068),GPR85 (54329),SLC22A2 (6582),MC4R (4160),CYP2B6 (1555),RIPK1 (8737),CA13 (377677),ANXA1 (301),MAP3K21 (84451),NR3C2 (4306),NPFFR2 (10886),HMGCR (3156),MC2R (4158),MAP3K9 (4293),GPR61 (83873),RDH12 (145226),TAAR1 (134864),NR3C1 (2908),HSD11B1 (3290),LPAR3 (23566),STYK1 (55359),PDE10A (10846),EPX (8288),SIK3 (23387),GPR37L1 (9283),HDAC2 (3066),AOX1 (316),PDE1A (5136),NR2C2 (7182),IRAK4 (51135),GPR21 (2844),HTR3C (170572),MLNR (2862),GALR2 (8811),POLA2 (23649),TLR7 (51284),RGR (5995),MKNK1 (8569),FGFRL1 (53834),CDH5 (1003),NMUR1 (10316),CA5B (11238),NR2E1 (7101),CA3 (761),CCNC (892),LIMK2 (3985),CHRFAM7A (89832),FABP6 (2172),TRIB3 (57761),NTRK2 (4915),CHRNG (1146),CA7 (766),NR1I2 (8856),HTR2C (3358),FYN (2534),CA4 (762),EPHB1 (2047),TLR8 (51311),CDK19 (23097),ADRA1B (147),MELK (9833),FABP3 (2170),KCNMA1 (3778),SLC5A7 (60482),HSD17B14 (51171),TIE1 (7075),TUBB2A (7280),NIM1K (167359),SLC6A7 (6534),TUBD1 (51174),PDPK1 (5170),PHKG1 (5260),LPAR1 (1902),PDE4C (5143),MAP2K5 (5607),DHRSX (207063),HIPK4 (147746),NR1H2 (7376),TUBA1C (84790),RRM1 (6240),PIN1 (5300),CA9 (768),MAPK15 (225689),CCR1 (1230),AGTR2 (186),FABP1 (2168),DECR1 (1666),RIPK3 (11035),ANPEP (290),NPY1R (4886),PSMB5 (5693),GPR52 (9293),GPR148 (344561),ATIC (471),FGFR3 (2261),POLA1 (5422),TBXA2R (6915),CA6 (765),SERPINA7 (6906),ADORA1 (134),MUSK (4593),EPHB4 (2050),GC (2638),HTR2B (3357),MAPK11 (5600),SLC6A3 (6531),RARG (5916),RXFP3 (51289),DECR2 (26063),CYP3A4 (1576),HTR3E (285242),ADRA1A (148),CSNK1E (1454),GPR19 (2842),MATK (4145),NTSR2 (23620),SLC6A4 (6532),MAP3K20 (51776),STK10 (6793),SIK2 (23235),RARA (5914),NPC1L1 (29881),TRIB2 (28951),PDE2A (5138),KCNH2 (3757),SSTR3 (6753),OPRD1 (4985),FABP2 (2169),DRD1 (1812),FABP9 (646480),MCHR1 (2847),LRRK2 (120892),RDH14 (57665),ACVR2A (92),ADRB2 (154),SLC12A3 (6559),PLK4 (10733),CCR5 (1234),TNF (7124),BTK (695),APLNR (187),DRD5 (1816),HTR1A (3350),ADRA1D (146),PTGER2 (5732),EPHA2 (1969),CHRNB1 (1140),CMPK1 (51727),CCR2 (729230),IDO1 (3620),EPHA5 (2044),EGFR (1956),GPR83 (10888),DHRS4L2 (317749),CTNNB1 (1499),NR6A1 (2649),DHRS2 (10202),CHRND (1144),IRAK1 (3654),AURKB (9212),RDH11 (51109),TRHR (7201),PDE5A (8654),EPHA8 (2046),GPR37 (2861),UPP2 (151531),MERTK (10461),PGR (5241),DHRS3 (9249),NEK11 (79858),PXDNL (137902),CRABP1 (1381),BRS3 (680),PTK6 (5753),RBP7 (116362),MMP8 (4317),NFKB1 (4790),TUBB2B (347733),TXK (7294),ESRRB (2103),PDE4B (5142),HPRT1 (3251),BRAF (673),EPHA4 (2043),PIM1 (5292),LPO (4025),TUBA3C (7278),STAT5B (6777),HUNK (30811),SLCO2B1 (11309),HCK (3055),PMP2 (5375),SRMS (6725),GPR3 (2827),SLC6A16 (28968),THRA (7067),CSK (1445),TESK1 (7016),PDSS1 (23590),TSSK6 (83983),STK35 (140901),FGFR2 (2263),PTGS1 (5742),PDSS2 (57107),PKDCC (91461),PDGFRL (5157),RRH (10692),ABL2 (27),QRFPR (84109),SCN2A (6326),TPO (7173),MC3R (4159),CBR1 (873),TYMS (7298),TEC (7006),NPY4R (5540),CSNK1A1 (1452),BDH2 (56898),AGTR1 (185),CYP2C19 (1557),TNNI3K (51086),GPR22 (2845),SLC6A19 (340024),PDE6B (5158),ADORA3 (140),CXCR4 (7852),MYT1 (4661),TUBA1B (10376),PTGR1 (22949),TEK (7010),NPY5R (4889),TNK2 (10188),BMX (660),STK11 (6794),ALOX5 (240),NPPB (4879),CHRM2 (1129),PHOSPHO1 (162466),CCKAR (886),PTPRZ1 (5803),NR0B1 (190),HTR7 (3363),CDKL3 (51265),HIF1A (3091),IRAK2 (3656),IGF1R (3480),TUBB4B (10383),ERBB4 (2066),MAP3K3 (4215),GPR63 (81491),CACNA1H (8912),PXDN (7837),AURKC (6795),HRH1 (3269),OPN1MW (2652),ROR1 (4919),NPC1 (4864),GSK3B (2932),SV2A (9900),RBP2 (5948),SIK1 (150094),RPS6KB1 (6198),TF (7018),DRD2 (1813),STMN4 (81551),HCRTR2 (3062),HTR1F (3355),WEE2 (494551),SLC6A11 (6538),SLC6A13 (6540),SLC12A1 (6557),NPY2R (4887),SLC6A9 (6536),EPHA10 (284656),VCAM1 (7412),GPR176 (11245),EPHB3 (2049),CDKL2 (8999),GPR135 (64582),ITGB2 (3689),FABP5 (2171),ADRA2C (152),DRD4 (1815),SLC22A7 (10864),PRLHR (2834),TOP2B (7155),MLKL (197259),BLM (641),PPARD (5467),TAAR5 (9038),CYP51A1 (1595),PTGFR (5737),ESR1 (2099),MAP3K19 (80122),MAP4K3 (8491),PIM2 (11040),CHRM3 (1131),GPR88 (54112),SRC (6714),TAAR8 (83551),HTR1B (3351),AVPR2 (554),TRPM2 (7226),MAOB (4129),CNR2 (1269),GPR39 (2863),NTRK1 (4914),NR1H3 (10062),PDE7B (27115),EPHA6 (285220),AXL (558),CALM1 (801),CHRM1 (1128),FABP12 (646486),HSD17B1 (3292),TUBB6 (84617),MELTF (4241),SLC6A12 (6539),GART (2618),HTR5A (3361),BMPR1B (658),KCNN4 (3783),PTPRG (5793),STK36 (27148),XDH (7498),RUSC1 (23623),IRAK3 (11213),OPRK1 (4986),NALCN (259232),KCNE1 (3753),YES1 (7525),ADORA2B (136),CLK4 (57396),TRPA1 (8989),CA8 (767),CBR4 (84869),ABCC2 (1244),NR1I3 (9970),OPN1SW (611),C2orf81 (388963),MCHR2 (84539),SLCO1B3 (28234),OPRL1 (4987),VDR (7421),CDK8 (1024),JUP (3728),PTGER3 (5733),NLK (51701),EBP (10682),GGPS1 (9453),ACVRL1 (94),SSTR5 (6755),NTSR1 (4923),PRTFDC1 (56952),ITGAL (3683),EPHB6 (2051),RIPK4 (54101),LPAR2 (9170),CRABP2 (1382),HSD17B13 (345275),TRIB1 (10221),CLK1 (1195),TUBB4A (10382),UPRT (139596),CHRNA3 (1136),LCK (3932),PPARG (5468),CYP2D6 (1565),ARAF (369),NR0B2 (8431),PSMB1 (5689),TNNC2 (7125),CACNA1S (779),PTGIR (5739),TUBB3 (10381),MPO (4353),BDKRB1 (623),TUBA3E (112714),GSTP1 (2950),BCL2 (596),ERN2 (10595),JAK2 (3717),ERBB3 (2065),RAF1 (5894),CHRNB4 (1143),TYRO3 (7301),EPHB2 (2048),SLC6A8 (6535),DDR2 (4921),HTR1D (3352),CACNB2 (783),TNFSF11 (8600),GSK3A (2931),TSSK4 (283629),MINK1 (50488),TUBG2 (27175),NR2F6 (2063),MC1R (4157),SLC6A2 (6530),MET (4233),MAP3K4 (4216),SLC6A1 (6529),TNK1 (8711),TESK2 (10420),FLT4 (2324),CDK7 (1022),FDXR (2232),DHRS7B (25979),INSRR (3645),CHRM4 (1132),DRD3 (1814),RXFP4 (339403),ACKR3 (57007),PDGFRB (5159),CHRNA9 (55584),DDR1 (780),PGD (5226),MC5R (4161),PDGFRA (5156),UPP1 (7378),HSD17B11 (51170),CIT (11113),RIPK2 (8767),TOP1 (7150),LMNA (4000),TOP2A (7153),ABCC8 (6833),MAPK14 (1432),FFAR4 (338557),PKMYT1 (9088),PTGER1 (5731),GPR150 (285601),CYP11B2 (1585),SLC47A2 (146802),TUBA4A (7277),GPR139 (124274),CHRM5 (1133),SLC6A18 (348932),GJA1 (2697),PSMB2 (5690),ADRB3 (155),RARB (5915),PLD2 (5338),MKNK2 (2872),ELN (2006),CCR3 (1232),RECQL (5965),OPN3 (23596),HTR3A (3359),TUBA8 (51807),INSR (3643),CA5A (763),DHFR2 (200895),HIPK2 (28996),CACNA1A (773),FRK (2444),GRPR (2925),CHRNB3 (1142),SCN5A (6331),GPR119 (139760),TYK2 (7297),HRH3 (11255),GPR26 (2849),CYP1A2 (1544),ESR2 (2100),SLC6A6 (6533),AVPR1A (552),TUBE1 (51175),SCN3A (6328),MAP3K2 (10746),HSDL2 (84263),HTR2A (3356),CHRNA7 (1139),ACE (1636),GPR62 (118442),OPN5 (221391),NPFFR1 (64106),CACNA1D (776),TUBB1 (81027),RHO (6010),VEGFA (7422),COQ8A (56997),RBP1 (5947),PECR (55825),GPR65 (8477),SSTR4 (6754),ESRRA (2101),MMP20 (9313),NPBWR2 (2832),ACVR1B (91),RXRB (6257),PDE6A (5145),GHSR (2693),MOS (4342),SLCO1B1 (10599),CCR9 (10803),ADORA2A (135),ITK (3702),RET (5979),GPR45 (11250),CACNA1C (775),IDO2 (169355),EPHA1 (2041),TSSK1B (83942),TAAR2 (9287),MAP3K10 (4294),PIM3 (415116),HRH4 (59340),TUBB8 (347688),ACVR2B (93),PDE6C (5146),KDR (3791),ACVR1 (90),SRD5A1 (6715),RXRA (6256),CCR4 (1233),CXCR6 (10663),GPR78 (27201),SLC6A17 (388662),ACKR2 (1238),PTGDR (5729),OXTR (5021),NMBR (4829),NR2F1 (7025),GPR101 (83550),CATSPER1 (117144),DHRS12 (79758),SDR16C5 (195814),DHFR (1719),TUBG1 (7283),TAOK3 (51347),ALK (238),CACNA1F (778),CHRNA5 (1138),SSTR1 (6751),CTDSP1 (58190),GALR1 (2587),ADRB1 (153),ERN1 (2081),CCKBR (887),TUBB (203068),CA10 (56934),DHRS13 (147015),HCRTR1 (3061),CA1 (759),LTK (4058),NTRK3 (4916),KISS1R (84634),OPN4 (94233),NR1H4 (9971),PRKAB1 (5564),MAP2K1 (5604),PTGS2 (5743),ADRA2A (150),CYP19A1 (1588),TACR1 (6869),SRD5A2 (6716),MMP2 (4313),TSSK3 (81629),PIP4K2C (79837),GPR173 (54328),CDC42BPB (9578),CYP17A1 (1586),MAP4K5 (11183),PROKR1 (10887),ABL1 (25),SLC6A14 (11254),CA11 (770),ADRA2B (151),PSMD2 (5708),ENPP1 (5167),CBR3 (874),PDE7A (5150),KCNA3 (3738),ALOX15 (246),HTR3B (9177),HTR3D (200909),MAPK12 (6300),PPARA (5465),PROKR2 (128674),TUBA3D (113457),HTR1E (3354),MAPK8 (5599),CACNA1B (774),SLC6A5 (9152),LTB4R2 (56413),CHRNB2 (1141),CHRNA10 (57053),TAOK1 (57551),GALR3 (8484),JAK1 (3716),TUBA1A (7846),ABCB1 (5243),UCKL1 (54963),RXRG (6258),SLC6A15 (55117),NR2C1 (7181),TNNC1 (7134),BLK (640),NR2F2 (7026),ESRRG (2104),CSF1R (1436),OPN1LW (5956)
694,786-0,ACH-000649,0.0,0.014355,0.0,4.330558,0.0,7.324901,7.238787,6.603923,3.975447,2.809414,0.0,3.084064,0.028569,5.013016,0.056584,3.69488,0.0,0.042644,3.841973,1.02148,0.0,0.084064,0.042644,0.014355,0.0,3.488001,0.0,0.124328,0.0,0.941106,0.0,0.0,0.263034,5.264912,4.819668,0.0,0.0,0.0,2.594549,0.0,0.0,0.0,0.084064,0.028569,6.596488,6.001127,7.904183,4.684819,0.0,0.0,0.0,3.499527,0.0,0.0,0.084064,0.0,0.0,5.69655,5.807097,0.0,0.014355,3.904966,3.975447,1.238787,7.538538,0.782409,0.0,0.31034,3.374344,0.0,0.0,3.705978,5.824004,0.0,2.046142,1.521051,0.286881,0.0,0.0,4.009885,2.247928,9.462952,4.146492,0.070389,0.070389,5.464015,0.0,2.140779,0.695994,0.0,0.0,4.734981,0.378512,0.042644,3.481557,4.3875,0.0,2.722466,0.124328,7.206917,2.763412,0.176323,4.137504,3.974529,0.0,0.028569,0.0,0.028569,4.658211,0.0,0.014355,4.812498,6.27221,0.028569,0.0,1.536053,0.0,0.014355,6.178117,4.191405,0.0,2.370164,6.449561,0.0,0.014355,0.0,0.0,0.0,2.24184,0.0,0.333424,0.0,3.460743,1.604071,6.32301,0.137504,6.514122,0.0,0.084064,0.263034,6.261907,0.042644,0.0,3.049631,4.263786,0.485427,4.064366,0.0,2.916477,4.404631,0.014355,4.830864,11.218805,6.683135,6.886062,0.0,0.0,0.0,0.0,0.0,6.228434,0.0,3.70044,0.298658,6.97728,0.0,0.0,7.520108,1.974529,4.123501,0.201634,0.0,0.0,4.721919,0.014355,0.321928,0.111031,0.238787,2.411426,0.0,3.0,0.0,3.956986,0.097611,0.0,0.0,6.584812,1.718088,0.124328,0.0,0.0,5.140779,3.866908,2.321928,3.513491,0.028569,0.176323,0.31034,3.485427,0.042644,0.0,0.0,0.0,0.0,0.0,1.367371,4.861955,1.956057,0.028569,0.056584,5.255123,0.0,3.971773,0.070389,0.0,0.0,0.0,0.042644,1.448901,6.450881,1.9855,7.356232,0.0,0.028569,0.15056,5.373996,0.014355,2.937344,7.334407,1.432959,0.659925,0.0,8.191257,7.147001,5.509696,0.042644,0.555816,0.0,0.0,0.028569,0.454176,0.0,1.124328,1.646163,1.618239,0.0,0.0,0.356144,0.263034,0.028569,5.417515,2.395063,0.124328,0.028569,0.189034,6.60585,3.102658,2.035624,4.243364,0.0,0.0,3.331992,0.0,0.594549,0.056584,0.0,0.0,0.757023,0.0,1.536053,5.372256,4.130931,4.555816,0.669027,2.891419,2.722466,0.485427,3.100978,2.31034,0.650765,0.056584,4.137504,1.823749,0.028569,0.0,0.0,6.38111,8.10376,1.803227,0.992768,7.328047,2.634593,0.014355,0.0,0.0,0.124328,0.014355,0.056584,0.042644,0.189034,0.014355,11.895462,5.704319,0.028569,0.084064,2.863938,0.0,5.51885,0.014355,0.226509,0.0,0.367371,0.028569,0.028569,0.321928,1.042644,0.815575,3.710393,2.797013,2.752749,9.716511,0.0,3.812498,1.176323,0.014355,3.122673,0.344828,2.771886,0.0,4.210233,6.201634,4.135863,0.411426,0.0,0.807355,3.879706,0.176323,0.056584,0.0,0.0,0.0,0.0,0.014355,0.070389,0.0,0.0,2.179511,0.0,5.124742,5.460087,0.014355,0.15056,1.144046,1.344828,8.597978,0.0,0.111031,0.014355,0.0,6.161283,4.055716,3.31904,3.50716,0.0,5.730096,1.799087,0.042644,0.0,4.041769,3.576522,0.0,0.0,4.586765,0.0,0.0,0.0,1.201634,0.356144,0.014355,3.125982,0.084064,2.735522,0.0,0.863938,6.938168,8.64958,0.0,0.0,0.286881,7.623004,3.716991,0.250962,6.826803,0.0,1.673556,0.516015,3.82985,3.454176,0.111031,5.720005,0.028569,0.0,0.807355,0.028569,6.100978,2.0,3.650765,1.516015,0.226509,3.185867,1.298658,0.124328,0.0,0.516015,0.0,0.111031,0.111031,1.531069,3.917432,1.117695,0.014355,2.895303,7.793961,4.70044,0.028569,0.0,0.014355,2.788686,0.0,0.014355,5.340562,1.709291,2.689299,0.014355,3.01614,5.910493,0.042644,3.240314,0.454176,0.454176,3.023255,0.163499,4.857981,0.042644,8.541445,0.070389,0.0,0.028569,7.448488,0.0,1.871844,0.070389,8.906921,1.356144,0.070389,2.049631,0.321928,5.678917,0.0,4.093391,3.674687,5.955359,0.333424,0.214125,0.432959,0.0,5.127221,0.918386,3.920293,2.794936,4.216455,1.632268,0.0,7.508587,4.296457,0.0,0.545968,0.659925,0.111031,4.619413,3.237258,4.475085,0.0,0.028569,0.0,0.0,4.908333,0.545968,0.014355,3.347666,7.526695,0.0,0.0,4.789729,4.778209,4.769243,5.821455,6.096346,8.191306,7.426936,0.042644,5.013016,0.0,6.162895,0.028569,0.014355,0.0,0.056584,8.064689,0.0,0.028569,0.0,4.492494,7.468665,0.0,0.124328,3.367371,5.612058,0.111031,0.0,6.821328,3.905928,0.0,1.405992,0.028569,0.0,1.799087,5.11395,0.263034,0.757023,0.163499,0.0,0.014355,0.0,5.526382,0.014355,0.0,0.0,0.014355,5.074249,0.0,2.974529,0.226509,3.845992,5.626147,0.0,0.0,0.111031,0.014355,0.0,0.0,0.298658,0.545968,0.0,6.998872,2.865919,0.286881,3.943921,0.0,0.0,4.018812,0.0,0.0,3.185867,4.05745,0.176323,0.056584,0.0,0.014355,0.0,1.195348,0.0,0.042644,1.356144,0.163499,0.0,0.333424,0.014355,0.0,2.883621,5.228049,0.0,0.028569,1.111031,0.014355,0.042644,4.438958,5.132166,4.566815,0.0,0.111031,0.0,0.014355,0.028569,0.0,1.104337,0.0,0.411426,0.0,1.646163,0.526069,0.014355,5.44228,6.572283,4.01614,0.0,0.0,3.887525,0.014355,5.115616,0.0,0.0,1.748461,0.028569,10.282857,0.0,1.565597,0.0,0.687061,0.014355,0.815575,0.0,0.014355,0.0,4.42156,6.148934,0.214125,0.0,0.0,0.014355,0.0,4.713696,1.111031,4.650765,0.963474,5.075533,0.0,4.280956,0.0,5.687621,0.0,0.15056,0.0,9.403289,3.215679,3.844988,3.545968,0.0,0.014355,0.0,0.0,3.983678,2.931683,0.0,0.189034,0.0,5.950702,0.0,0.0,0.879706,0.070389,0.748461,3.528571,0.0,7.008429,4.465322,4.398487,4.641546,0.0,0.137504,4.793896,0.070389,0.028569,3.880686,0.097611,0.815575,0.0
1316,A2058,ACH-000788,0.0,0.0,4.313971,3.539779,0.0,7.786531,6.597829,0.097611,4.460743,0.584963,0.070389,3.41007,2.543496,4.514753,0.275007,4.08151,0.0,1.056584,4.036503,1.70044,0.084064,0.042644,0.014355,3.489286,0.0,3.70044,0.014355,0.163499,0.028569,0.575312,0.0,0.0,0.0,0.111031,5.928133,0.070389,0.056584,0.014355,4.684819,0.014355,0.0,0.014355,0.250962,0.014355,6.261719,6.258896,8.043793,5.1534,0.0,0.042644,0.028569,0.042644,0.0,0.0,0.163499,0.0,0.0,4.586164,6.735116,0.0,4.469235,4.450221,4.110196,3.063503,6.710944,1.049631,0.111031,0.084064,3.966246,0.0,0.042644,4.754888,5.855242,0.0,1.589763,0.464668,0.0,0.042644,0.0,4.621173,0.713696,8.449479,0.163499,0.214125,0.0,4.988685,0.0,0.298658,0.411426,0.014355,0.0,4.017031,1.910733,3.090853,0.378512,5.878725,0.0,2.9855,0.014355,7.179312,0.214125,0.042644,4.305241,2.817623,0.056584,0.0,0.250962,0.070389,4.960234,0.014355,0.014355,4.346957,6.808256,0.201634,0.097611,0.863938,2.392317,0.014355,5.40973,3.38405,0.992768,1.207893,5.410748,0.226509,0.028569,0.0,0.0,0.0,6.346602,0.0,0.124328,0.0,3.360364,0.111031,5.607626,0.669027,0.823749,0.0,0.526069,1.144046,7.042425,1.063503,0.0,3.046142,3.904002,0.731183,2.100978,0.070389,3.451541,3.997292,0.056584,5.422906,10.2182,6.700856,5.673556,2.157044,0.238787,0.097611,0.0,0.15056,6.45253,0.014355,6.905928,0.0,7.953614,0.084064,0.0,7.476139,2.941106,4.149747,0.925999,0.0,0.0,1.378512,0.0,5.114367,0.0,0.773996,3.399171,0.0,4.44427,0.0,5.14323,0.014355,0.0,0.0,7.183784,0.992768,0.014355,0.0,0.042644,3.58376,4.084064,3.72465,4.97728,0.0,5.776367,0.632268,0.176323,0.028569,1.748461,0.111031,0.0,0.0,0.0,2.403268,4.375039,2.353323,0.432959,0.0,4.502076,0.014355,0.097611,0.163499,0.028569,0.0,0.0,0.014355,0.070389,5.128458,2.367371,6.074034,0.028569,0.0,0.201634,0.163499,0.042644,3.431623,8.254556,1.292782,2.137504,0.014355,6.912051,6.8098,6.215873,0.226509,1.555816,0.0,2.207893,0.0,0.765535,0.0,5.50462,0.941106,0.028569,0.464668,0.0,0.250962,0.124328,5.566511,5.396776,6.158862,2.750607,0.042644,5.449891,6.453847,2.819668,4.228819,2.513491,0.0,0.495695,4.593354,0.084064,0.070389,0.0,0.321928,0.042644,3.061776,0.056584,3.926948,5.986183,3.629939,4.560104,1.189034,2.790772,0.411426,0.389567,3.560715,5.443938,3.094236,0.084064,4.829342,2.523562,0.238787,0.014355,0.0,6.907251,8.318678,0.704872,0.0,6.759156,4.805808,0.042644,0.0,0.0,0.042644,0.014355,1.361768,0.0,0.15056,0.367371,11.191923,6.119771,0.097611,0.0,4.203984,0.31034,4.103498,0.014355,0.0,0.0,0.0,0.0,4.254745,3.370164,2.641546,1.207893,7.631323,1.819668,3.998196,8.902888,0.505891,4.168321,0.014355,0.344828,6.614563,0.422233,1.367371,0.0,2.983678,4.931683,4.646163,4.910733,0.15056,0.565597,4.506526,3.635754,0.389567,0.0,0.0,0.0,0.0,0.0,0.275007,0.0,0.014355,1.879706,0.0,0.097611,3.295723,3.084064,0.163499,1.480265,0.443607,7.678283,0.0,0.163499,0.0,0.0,5.8089,3.075533,3.196922,4.110196,0.0,5.738768,0.298658,0.070389,0.014355,3.412782,3.454176,2.773996,0.014355,4.301588,0.0,0.0,0.137504,0.485427,0.028569,0.0,0.903038,0.970854,2.83996,3.38405,0.536053,6.597084,7.908513,0.0,0.0,1.459432,7.137401,6.663914,0.056584,7.022812,0.0,1.176323,6.746716,3.730096,4.130931,0.226509,5.493775,0.028569,0.0,2.957915,0.669027,5.106851,3.095924,3.283922,0.782409,0.028569,3.229588,1.378512,0.516015,0.400538,0.847997,0.0,0.014355,0.641546,2.970854,3.978196,1.454176,0.097611,3.938286,5.833649,4.752749,0.495695,0.0,0.176323,0.111031,0.137504,0.014355,4.734439,2.017922,3.177918,0.111031,3.755956,5.444601,0.956057,3.134221,0.275007,0.0,1.83996,1.422233,5.216843,0.0,8.350541,0.0,0.0,0.014355,6.863319,0.545968,0.201634,0.070389,9.414432,1.803227,0.0,1.782409,7.294529,5.736605,0.0,5.255501,0.097611,5.634012,5.191405,0.695994,0.757023,0.028569,5.593354,1.584963,5.130519,4.550901,4.346957,3.590961,0.014355,4.463361,4.207112,0.0,2.275007,1.182692,0.111031,5.071677,3.153805,4.409391,0.014355,0.389567,0.0,0.226509,0.042644,0.650765,0.432959,6.294621,8.095344,0.0,0.464668,6.534809,5.203984,4.531069,4.613532,5.963936,8.739679,7.334318,0.0,5.05398,0.014355,5.361417,0.0,0.014355,0.0,0.111031,1.735522,0.0,0.028569,0.0,0.111031,6.14323,0.0,0.250962,3.799087,4.361768,0.014355,0.0,5.623223,4.524189,0.0,0.575312,0.124328,0.0,1.914565,5.185074,0.163499,0.356144,0.201634,0.0,0.014355,0.0,5.427271,0.0,0.0,0.0,0.298658,4.62527,0.042644,4.067811,0.014355,3.044394,4.64789,0.0,0.443607,0.378512,0.298658,0.0,0.0,1.028569,0.275007,0.0,5.747656,3.587365,0.641546,3.943921,0.111031,0.0,5.048759,0.0,0.0,3.072106,5.128046,0.226509,0.042644,0.0,0.0,0.014355,0.823749,0.014355,0.056584,0.176323,0.014355,0.0,0.739848,0.014355,0.0,3.372952,4.662205,0.0,0.137504,1.599318,0.111031,1.189034,4.42156,3.961623,3.533563,0.0,0.137504,0.0,0.15056,0.014355,0.0,0.400538,0.15056,1.786596,0.0,1.871844,2.715893,0.014355,5.387156,7.051481,4.55888,0.137504,0.0,4.074677,0.0,4.82273,0.0,0.226509,2.060047,0.0,10.696359,0.0,4.324811,0.0,0.070389,0.070389,0.0,0.097611,0.0,0.014355,4.319762,5.555203,2.280956,0.214125,0.0,0.084064,0.0,6.414812,1.443607,4.269781,0.028569,5.103078,0.0,4.570463,0.632268,4.873321,0.0,2.646163,0.014355,8.270622,2.007196,5.078524,3.496974,0.0,0.014355,0.070389,0.0,4.619413,2.531069,0.0,0.238787,0.0,4.24184,0.028569,0.0,2.443607,0.15056,1.137504,3.201634,0.028569,4.185867,5.175525,0.042644,4.926948,3.01614,4.233428,4.025915,0.097611,0.0,4.897724,0.632268,0.056584,0.0
998,A2780,ACH-000657,1.286881,0.097611,0.028569,3.61471,0.0,1.531069,7.395063,2.889474,0.176323,0.111031,0.0,3.308885,3.193772,4.402586,0.084064,2.639232,0.0,0.163499,5.004501,0.163499,0.097611,0.124328,0.042644,0.0,0.014355,3.763412,0.097611,0.014355,0.042644,0.464668,0.0,0.028569,0.0,4.22265,4.487358,0.695994,1.989139,0.014355,6.496175,0.0,0.0,0.014355,0.250962,0.070389,5.253611,5.405312,8.34163,5.499527,0.286881,0.0,0.823749,0.056584,0.0,0.0,2.62293,0.014355,0.238787,4.01078,5.759422,0.0,4.818135,0.163499,4.705425,2.397803,6.570766,0.333424,2.31904,1.31034,4.196922,0.0,0.214125,5.331992,5.350144,0.028569,0.137504,1.400538,0.014355,0.014355,0.014355,3.681449,0.226509,2.641546,0.028569,0.0,0.31034,5.652486,0.0,1.778209,0.137504,0.084064,0.028569,0.097611,0.0,1.819668,0.344828,0.084064,0.028569,3.922198,0.014355,6.560868,0.201634,2.364572,4.281698,0.731183,0.028569,0.028569,0.042644,0.226509,4.965323,0.0,0.070389,3.807355,3.992768,0.014355,0.070389,0.495695,1.286881,0.201634,5.502076,3.527321,0.028569,0.042644,4.754353,0.014355,0.028569,0.070389,0.0,0.028569,2.295723,0.124328,0.014355,0.0,2.107688,0.0,5.44062,2.709291,1.664483,0.014355,4.397803,0.124328,3.527321,0.176323,0.0,3.629939,3.929791,0.485427,0.028569,2.611172,3.023255,3.578939,0.214125,4.904002,8.866042,6.377991,6.453518,1.941106,1.575312,6.443441,0.0,0.356144,5.002703,0.097611,0.226509,0.475085,8.486473,0.028569,0.0,7.454505,2.655352,3.974529,1.739848,0.0,0.0,1.292782,0.0,5.140779,0.111031,1.952334,3.726831,0.084064,5.830103,0.0,4.28244,0.0,0.028569,0.0,7.011339,1.599318,3.903038,0.042644,0.176323,3.339137,3.609991,3.32625,4.060047,0.070389,0.070389,0.176323,3.017922,0.0,0.014355,0.0,0.0,2.372952,0.163499,0.863938,4.32553,1.555816,0.0,0.028569,4.709291,0.807355,0.056584,0.056584,0.201634,0.0,0.464668,0.0,0.333424,4.791814,2.950468,5.122673,0.0,1.664483,0.948601,1.454176,0.014355,3.357552,7.298017,4.65019,2.589763,0.014355,6.226123,7.210525,5.951168,0.014355,0.757023,1.85599,0.070389,0.0,3.294253,0.0,2.419539,0.847997,0.0,5.413459,0.0,0.214125,0.0,2.160275,4.447579,1.941106,0.250962,0.056584,0.238787,6.071891,3.288359,0.214125,5.362821,0.124328,0.0,4.178715,0.111031,0.014355,0.056584,0.111031,0.042644,2.763412,2.094236,3.664483,5.781097,4.042644,3.817623,2.140779,3.745237,0.189034,0.014355,2.748461,4.05398,4.165108,0.084064,3.160275,1.735522,1.970854,0.0,0.0,1.117695,7.928548,1.117695,0.0,6.474598,3.802193,0.176323,0.0,0.056584,0.014355,0.0,0.084064,0.0,1.867896,0.378512,10.731828,6.225159,0.028569,0.042644,3.896272,0.0,5.159064,0.163499,0.056584,0.0,0.526069,0.0,0.028569,0.014355,0.042644,1.422233,6.006522,1.137504,1.226509,8.718053,0.739848,3.443607,1.815575,0.137504,0.176323,0.495695,0.014355,0.0,0.014355,4.090853,4.120186,5.126808,0.056584,2.070389,4.670161,0.298658,0.014355,0.0,0.028569,1.130931,0.0,0.0,0.201634,0.042644,0.070389,4.436961,0.422233,0.516015,0.454176,2.521051,0.097611,1.608809,0.111031,7.411002,2.336283,0.432959,0.0,0.0,6.156842,0.333424,3.41684,3.673556,0.0,5.152183,0.0,0.028569,0.0,3.275007,3.539779,0.111031,0.014355,4.128458,0.0,0.0,0.084064,0.070389,0.070389,0.014355,0.014355,0.201634,4.417515,0.0,0.526069,3.85997,8.252902,0.0,0.0,3.448901,7.862637,3.464668,0.641546,7.089583,0.0,0.084064,0.516015,3.970854,4.39163,0.0,6.004277,0.070389,0.028569,0.042644,0.286881,5.487679,3.152183,3.539779,0.056584,0.042644,2.782409,0.356144,0.918386,0.214125,1.786596,0.0,0.042644,1.144046,0.650765,4.078097,5.0387,0.084064,2.263034,6.575917,4.508429,0.056584,0.0,0.163499,1.411426,0.189034,1.049631,0.028569,2.257011,8.314289,0.124328,1.910733,4.522307,3.360364,2.809414,2.536053,0.0,0.028569,1.007196,5.206331,0.0,7.308157,0.356144,0.014355,0.176323,3.097611,0.097611,0.014355,0.056584,9.310976,1.565597,0.028569,1.438293,1.827819,5.971314,0.014355,3.765535,0.782409,4.950468,6.429281,0.070389,0.831877,0.014355,5.897724,1.851999,5.12143,3.697107,6.032542,2.847997,0.0,0.333424,3.019702,0.028569,0.344828,1.411426,3.465974,5.111866,4.370164,3.80426,0.042644,0.505891,0.0,0.028569,0.056584,3.129283,0.594549,3.496974,7.517748,0.536053,5.32301,3.385431,6.135248,3.762349,4.330558,6.509062,5.638364,7.046469,0.555816,4.505256,0.014355,5.334139,0.124328,0.0,0.0,0.028569,0.933573,0.0,0.028569,0.014355,8.533485,6.694184,0.014355,0.963474,3.925999,6.345538,0.014355,0.632268,5.082362,1.541019,0.0,0.378512,2.974529,0.0,2.140779,1.02148,0.389567,0.014355,0.0,0.0,0.432959,0.0,6.079378,0.495695,0.0,0.0,0.070389,2.742006,0.028569,3.443607,2.946731,2.726831,4.333424,0.014355,0.097611,0.275007,0.014355,0.014355,0.0,0.042644,0.275007,0.0,5.964861,4.257011,2.550901,4.604071,0.014355,0.0,5.025029,0.070389,0.0,2.715893,4.727376,0.028569,0.0,0.0,0.014355,0.028569,0.765535,0.0,0.765535,0.028569,1.298658,0.070389,0.505891,0.0,0.0,2.659925,4.402586,0.042644,0.669027,2.765535,0.124328,0.014355,3.658783,3.354734,4.382667,0.014355,0.286881,0.084064,0.042644,0.189034,0.0,0.286881,0.028569,7.550901,0.0,0.028569,2.378512,0.014355,5.922674,7.019702,1.944858,0.028569,0.014355,3.465974,0.0,6.007644,0.0,0.584963,1.695994,0.31034,9.847057,0.0,4.104337,0.014355,0.056584,0.321928,0.070389,0.933573,0.0,0.0,3.750607,5.303781,0.344828,0.014355,0.014355,0.014355,0.014355,0.422233,0.85599,3.915521,0.097611,5.941106,0.0,4.672425,0.0,5.047015,0.214125,5.992995,0.028569,8.769706,0.056584,1.555816,3.863938,0.014355,0.263034,0.0,0.0,5.999324,1.963474,0.0,0.226509,0.014355,4.313971,1.871844,0.0,2.301588,0.238787,0.485427,3.836934,0.124328,3.030336,5.47476,0.097611,4.739308,0.0,0.713696,4.882154,5.135453,0.056584,2.198494,3.196922,0.014355,0.0
1185,A375,ACH-000219,0.0,0.0,3.385431,2.82171,0.0,5.535431,6.361066,0.201634,3.518535,0.650765,0.189034,2.989139,2.217231,4.093391,0.014355,3.794936,0.0,0.948601,4.250204,0.62293,0.097611,0.0,0.042644,3.463361,0.014355,3.830864,0.028569,0.028569,0.028569,0.163499,0.0,0.014355,0.0,0.400538,5.425258,0.238787,0.042644,0.0,2.845992,0.070389,0.0,0.014355,0.176323,0.704872,5.810443,6.07596,7.496335,5.192589,0.163499,0.028569,0.137504,0.084064,0.0,0.0,0.15056,0.014355,0.0,2.799087,6.114783,0.0,4.31034,2.978196,3.411426,2.794936,6.839456,1.117695,0.042644,0.298658,2.807355,0.0,0.0,4.488001,4.244887,0.0,2.100978,0.678072,0.0,0.214125,0.042644,3.44228,1.195348,10.283088,1.636915,0.163499,0.604071,5.710944,0.0,1.831877,0.201634,0.238787,0.0,3.83289,0.0,3.297191,1.195348,4.963936,0.028569,3.215679,0.014355,6.887891,1.0,0.014355,4.369466,2.695994,0.028569,0.0,0.0,0.028569,4.683135,0.0,0.516015,4.628774,6.177121,0.028569,0.014355,3.973611,0.111031,0.201634,5.725196,3.386811,0.918386,3.385431,4.893362,0.111031,0.014355,0.028569,0.042644,0.0,5.279471,0.0,2.094236,0.0,2.560715,0.910733,5.468583,0.201634,3.78136,0.0,0.263034,0.555816,4.962086,1.014355,0.0,3.192194,4.004501,0.526069,0.815575,0.286881,3.382667,2.538538,0.028569,5.793896,9.904605,6.242603,6.501121,2.414136,0.176323,0.0,0.014355,0.641546,5.105594,0.124328,5.798828,0.367371,7.792074,0.0,0.0,7.203397,2.094236,4.110196,1.007196,0.0,0.0,3.50716,0.0,4.9855,0.0,0.15056,2.370164,0.0,5.215679,0.15056,3.834913,0.028569,0.0,0.0,6.632995,2.229588,0.0,0.0,0.070389,2.776104,5.169925,2.636915,4.393004,0.111031,6.263034,0.505891,0.070389,0.0,2.996389,0.014355,0.0,0.0,0.028569,2.361768,4.33985,1.910733,1.090853,0.070389,4.215679,0.0,0.0,0.014355,0.042644,0.0,0.0,0.124328,0.111031,5.915043,3.415488,6.292966,0.014355,0.0,0.056584,1.49057,0.028569,3.508429,7.587515,0.925999,3.198494,0.0,7.981168,7.01022,5.597531,0.028569,1.238787,0.0,1.883621,0.0,0.31034,0.070389,5.913608,0.713696,0.070389,0.0,0.0,0.111031,0.344828,2.117695,4.998196,3.114367,3.061776,0.189034,1.847997,5.968321,3.397803,2.130931,2.568032,0.0,0.124328,3.682573,0.014355,0.0,0.014355,0.042644,0.0,3.200065,0.15056,3.533563,5.981168,3.587365,4.203201,1.752749,3.193772,0.565597,1.144046,2.865919,3.001802,1.157044,0.238787,4.439623,2.885574,0.695994,0.0,0.0,6.30305,7.480911,0.641546,0.0,7.070389,4.217231,0.238787,0.0,0.0,0.014355,0.0,1.438293,0.0,0.084064,0.333424,11.044053,4.732812,0.042644,0.0,4.139961,0.15056,4.420887,0.028569,0.070389,0.163499,0.565597,0.0,2.38405,0.475085,3.635754,0.400538,6.693626,1.495695,4.503985,9.1484,0.389567,3.914565,0.555816,0.0,3.851999,0.389567,1.713696,0.0,1.427606,4.410748,5.695159,4.59156,0.124328,0.014355,4.347666,2.925999,1.459432,0.0,0.084064,0.0,0.0,0.014355,0.042644,0.0,0.0,3.38819,0.0,0.097611,3.592158,3.695994,0.014355,1.0,0.918386,7.075853,0.056584,0.321928,0.0,0.0,5.841973,3.598127,3.198494,2.891419,0.0,4.566206,0.056584,0.097611,0.0,3.288359,3.847997,2.611172,0.0,4.863443,0.0,0.028569,1.443607,3.344828,0.9855,0.0,1.02148,0.298658,4.059182,0.298658,0.15056,6.040673,7.965207,0.422233,0.0,2.182692,7.047124,5.638943,0.097611,6.536053,0.0,0.389567,6.732541,3.252476,4.418865,0.526069,5.417177,0.014355,0.028569,1.505891,0.263034,4.714246,4.036503,3.825786,0.505891,0.475085,3.620586,4.1152,0.941106,0.070389,2.477677,0.0,0.097611,0.536053,3.485427,3.732269,2.223423,0.042644,3.496974,6.57107,4.522307,0.111031,0.0,1.400538,0.163499,0.084064,0.189034,3.192194,3.007196,1.807355,0.028569,3.836934,5.078524,2.140779,3.514753,0.201634,0.056584,5.111449,0.933573,5.642702,0.056584,8.422359,0.250962,0.0,0.0,7.948134,0.0,0.070389,0.028569,9.680817,1.292782,0.042644,1.704872,7.411596,6.095292,0.0,4.298658,3.153805,5.771093,4.432291,0.028569,0.356144,0.0,5.569552,1.232661,4.75007,4.214125,4.491853,3.982765,0.0,4.589763,3.257011,0.0,1.378512,2.316146,0.0,5.842979,3.9855,4.006298,0.014355,0.111031,0.0,0.238787,0.042644,2.100978,0.400538,5.252476,6.897603,0.0,1.565597,5.08151,4.493135,4.348374,3.481557,6.924456,9.606239,7.134632,0.056584,3.914565,0.056584,5.196135,0.028569,0.0,0.0,0.070389,0.669027,0.0,0.042644,0.0,0.124328,6.656639,0.0,0.632268,3.737687,4.942984,0.070389,0.014355,5.897482,1.773996,0.0,0.956057,2.137504,0.056584,2.769772,4.740928,0.411426,0.084064,0.214125,0.0,0.238787,0.0,6.564835,0.014355,0.0,0.0,0.084064,4.720826,0.0,4.322649,0.084064,2.837943,4.995485,0.0,0.941106,0.411426,0.432959,0.014355,0.014355,1.769772,0.941106,0.0,4.775051,5.0054,0.0,3.177918,0.0,0.028569,5.175125,0.0,0.0,3.212569,4.351204,0.189034,0.0,0.0,0.014355,0.014355,0.400538,0.0,0.042644,0.0,0.056584,0.0,0.275007,0.014355,0.0,3.283922,4.903038,0.014355,0.056584,1.895303,0.137504,2.100978,3.311794,2.792855,3.179511,0.014355,0.176323,0.0,0.15056,0.0,0.0,0.695994,0.0,1.650765,0.0,3.85997,1.510962,0.028569,5.710944,6.715756,4.067811,0.613532,0.0,2.849999,0.014355,4.68818,0.0,0.321928,1.510962,0.0,9.671576,0.0,3.099295,0.014355,0.0,0.356144,0.464668,0.0,0.0,0.014355,4.311794,5.424922,0.565597,0.111031,0.070389,0.028569,0.0,6.018145,1.823749,4.881665,0.014355,4.330558,0.0,3.786596,0.0,4.710944,0.0,2.100978,0.070389,8.24246,1.31034,3.740928,3.272023,0.0,0.0,0.0,0.0,3.713696,1.678072,0.0,0.028569,0.0,4.125155,0.014355,0.0,2.263034,0.790772,0.464668,4.023255,0.0,4.497612,6.434795,1.627607,5.138323,4.958843,4.766595,4.474436,0.659925,0.028569,4.512227,0.189034,0.263034,0.0
1269,A498,ACH-000555,0.042644,0.084064,0.056584,3.025029,0.0,6.922317,6.33396,7.592831,5.526382,1.111031,0.084064,3.124328,1.541019,3.371559,0.056584,3.516015,0.0,1.95977,3.258519,0.333424,0.15056,0.263034,0.028569,0.0,0.0,2.577731,0.695994,0.042644,0.014355,1.367371,0.0,0.014355,0.0,5.828073,4.776104,0.238787,0.014355,0.014355,5.938521,0.0,0.0,0.0,0.070389,0.201634,6.087675,5.036064,7.435379,3.887525,0.815575,0.014355,0.163499,3.234195,0.0,0.0,0.389567,0.014355,0.111031,4.351204,4.761285,0.0,0.028569,1.843984,5.732812,2.899176,6.035844,1.333424,1.157044,0.933573,2.316146,0.014355,0.0,3.892391,4.521051,0.0,2.632268,1.169925,0.263034,0.0,0.014355,2.91265,2.084064,10.22062,3.400538,0.356144,0.0,4.186659,0.0,2.584963,0.163499,0.238787,0.0,5.050502,0.070389,0.0,3.155425,0.028569,0.028569,2.223423,0.070389,5.879461,2.568032,0.400538,2.662205,2.405992,0.028569,0.0,0.028569,0.189034,2.799087,0.0,0.0,3.983678,5.407693,0.014355,0.0,1.049631,0.0,0.555816,4.221877,4.653633,1.157044,5.816344,6.358256,0.111031,0.0,0.042644,0.028569,0.014355,1.782409,0.084064,0.226509,0.0,2.550901,1.400538,5.344473,0.238787,5.719457,0.0,4.08151,0.084064,4.06953,0.137504,0.0,1.963474,3.671293,0.815575,3.102658,0.201634,2.908813,4.092546,0.214125,5.524503,9.875181,5.851749,5.546894,3.165108,1.275007,1.111031,0.0,0.084064,6.211207,0.0,7.303141,1.195348,7.305332,0.0,0.0,6.867032,1.933573,2.307429,1.744161,0.0,0.0,5.81455,0.042644,4.934517,0.014355,1.0,4.885574,0.575312,4.576522,0.0,5.108943,0.042644,0.028569,0.0,5.876517,1.226509,1.226509,0.0,0.028569,5.15583,2.9855,2.189034,4.69488,0.097611,0.956057,1.650765,0.111031,0.014355,0.056584,0.0,0.014355,0.0,0.014355,1.333424,4.596339,1.823749,0.014355,0.056584,3.447579,0.028569,0.042644,0.124328,0.0,0.0,0.0,0.014355,0.070389,5.180307,3.224966,5.517276,0.014355,0.056584,0.084064,5.457463,0.014355,4.537917,6.574404,0.687061,0.526069,0.014355,7.03848,6.049413,4.92837,0.097611,2.961623,0.0,2.185867,0.056584,0.807355,0.0,6.952916,1.9855,0.056584,0.0,0.028569,2.269033,0.0,0.0,4.071248,2.028569,1.035624,0.0,0.124328,5.590362,2.435629,1.063503,4.740388,0.042644,0.042644,4.013462,0.632268,5.888256,0.15056,0.0,0.0,0.799087,0.722466,4.168321,4.589763,4.759156,2.792855,1.687061,2.121015,3.550901,0.678072,2.153805,5.219556,1.744161,0.097611,4.329124,1.952334,0.871844,0.014355,0.0,7.442031,6.521365,1.669027,0.356144,6.858105,5.281327,0.545968,0.0,0.85599,0.028569,0.0,0.62293,0.042644,4.813012,0.773996,10.655441,8.821615,0.321928,0.321928,3.894333,0.084064,5.094236,0.879706,0.0,0.0,2.111031,0.0,0.014355,5.240314,0.014355,2.211012,6.81839,2.467279,1.752749,8.553898,0.042644,2.831877,0.565597,4.392317,7.472813,0.454176,2.277985,0.0,1.906891,5.87799,3.833902,0.056584,0.0,4.72792,3.454176,0.847997,0.0,0.028569,0.0,0.014355,0.028569,0.0,0.214125,0.0,0.0,2.980025,0.042644,4.507795,3.934517,0.214125,0.226509,1.104337,1.367371,6.537296,2.097611,0.189034,0.0,0.0,4.885574,3.234195,1.575312,3.460743,0.0,4.670727,0.226509,0.042644,0.0,3.903038,1.580145,0.042644,0.0,6.958611,0.0,0.0,0.250962,0.070389,0.0,0.028569,3.100978,0.137504,4.772414,0.056584,1.157044,5.341274,6.335926,0.0,0.084064,1.823749,6.972922,5.667324,0.070389,6.245458,0.0,0.124328,1.38405,2.575312,4.059182,0.056584,4.732812,0.014355,0.028569,0.495695,0.176323,4.106851,4.142413,3.702658,2.618239,0.014355,3.040892,6.923625,0.485427,0.344828,1.550901,0.0,0.124328,1.292782,2.438293,2.304511,3.24184,0.014355,2.922198,6.321567,4.59156,0.400538,0.782409,0.028569,3.344828,0.432959,2.488001,5.849999,3.788686,6.324451,0.056584,3.439623,5.062208,0.189034,2.503349,0.250962,0.0,4.360364,0.739848,3.979111,0.028569,7.589838,0.422233,0.042644,0.0,5.08534,0.0,0.757023,0.028569,1.914565,1.104337,0.970854,1.432959,1.244887,4.365972,0.432959,4.57289,3.771886,6.307793,0.516015,0.422233,0.565597,0.0,4.852498,0.432959,4.801676,3.776104,4.337711,3.044394,0.0,6.586314,2.797013,0.0,3.012569,0.782409,0.097611,5.399171,5.224581,4.726831,0.014355,0.887525,0.0,0.070389,7.876517,1.163499,0.0,5.46238,8.725298,0.0,0.163499,5.659354,5.540709,2.819668,5.841218,4.728465,8.356408,6.533252,0.189034,3.878725,0.0,5.362119,0.042644,0.0,0.0,5.989593,8.371864,0.0,0.028569,0.0,4.956986,6.196332,0.0,3.840967,4.452859,6.551516,0.084064,0.163499,5.092546,4.809929,0.0,1.372952,1.232661,0.0,1.608809,5.414474,0.62293,1.361768,0.056584,0.0,0.0,0.0,5.723012,0.014355,0.0,0.0,0.042644,4.82171,0.0,3.283922,0.250962,3.718088,5.070819,0.0,0.594549,0.15056,0.042644,0.0,0.014355,0.678072,0.344828,0.028569,7.21393,3.258519,0.422233,3.276497,0.0,0.0,3.982765,0.0,0.0,3.361768,3.575312,0.226509,0.0,0.0,0.056584,0.0,2.998196,0.014355,0.014355,1.117695,0.422233,0.0,1.014355,0.042644,0.0,3.382667,4.684819,0.014355,0.367371,0.475085,0.028569,0.014355,4.340562,3.9855,4.699885,0.0,0.056584,0.111031,0.176323,0.097611,0.056584,0.214125,0.070389,4.494416,0.0,1.967169,2.865919,0.0,4.845992,6.137504,3.833902,0.042644,0.0,2.372952,0.014355,5.132577,0.0,0.056584,1.655352,0.014355,9.381478,0.0,2.201634,0.014355,0.097611,0.201634,0.014355,0.0,0.0,4.334139,3.38819,4.508429,0.575312,0.0,0.189034,0.15056,0.056584,0.687061,0.464668,4.125982,0.0,4.680887,0.176323,4.147307,0.028569,4.769243,0.0,2.794936,0.014355,8.20921,1.169925,3.684819,3.127633,0.028569,0.014355,0.0,0.0,5.210233,3.053111,0.0,0.137504,0.0,3.864929,0.014355,0.0,1.510962,0.056584,1.189034,3.538538,0.028569,6.391974,8.085711,4.317594,4.779785,0.0,0.201634,3.617063,0.286881,0.111031,4.767655,0.604071,0.333424,0.0


In [29]:
# store the cell line information (based on numpy)
# the order in cell line information is already consistent with cellline2relid_dict
np_CCLE_expression_depmap_reduced = []
for key in cellline2relid_dict.keys():
    # retrieve by cellline2relid_dict keys
    temp = np.array(CCLE_expression_depmap_reduced[CCLE_expression_depmap_reduced['cellline_name']==key])
    np_CCLE_expression_depmap_reduced.append(temp)
    
# *** but currently it does not experience 0-1 normalization ***
np_CCLE_expression_depmap_reduced = np.concatenate(np_CCLE_expression_depmap_reduced)[:, 2:]

# save the gene expression data for each cell line, still follow the order of cellline2relid_dict
np.save(prefix + midfix + 'cellline_expression.npy', np_CCLE_expression_depmap_reduced)

In [None]:
print('np_CCLE_expression_depmap_reduced.shape:', np_CCLE_expression_depmap_reduced.shape) # final gene number for each cell line
CCLE_expression_depmap_reduced[CCLE_expression_depmap_reduced['cellline_name']=='786-0']

# obtain and further process the drug molecular graph related information for ablation experiments
drugcomb_alldruginfo_dict_lower={}
for key in drugcomb_alldruginfo_dict.keys():
    drugcomb_alldruginfo_dict_lower[key.lower()]=drugcomb_alldruginfo_dict[key]   

In [53]:
import dgl
from dgl.data import DGLDataset
import torch
import os


relid2drug_dict = {value: key for key, value in drug2relid_dict.items()}
drug_graph_edges = []
drug_graph_properties = []
# store node feature
drug_graph_nodes = []
drugid2morgan = {}
for drugid in relid2drug_dict.keys():
    # drugid: current drug id, drugcomb_alldruginfo_dict_lower: collected composite data
    druginfo = drugcomb_alldruginfo_dict_lower[relid2drug_dict[drugid]]
    drugid2morgan[drugid] = druginfo['morgan_bit']
    counter = -1
    # row in adjacent matrix
    for row in druginfo['adjacent_matrix']:
        counter += 1
        # obtain edges from current adjacent matrix
        for dst in row.nonzero()[0]:
            drug_graph_edges.append([drugid, counter, dst])

    # add self-loop
    temp = druginfo['adjacent_matrix'].shape[0]
    self_loop = [[drugid, i, i] for i in range(temp)]
    drug_graph_edges.extend(self_loop)
    # create label (graph_id) for current drug
    drug_graph_properties.append([drugid, drugid, temp])

    # store the atom numbers
    for atom in druginfo['atom_num']:
        drug_graph_nodes.append([drugid, atom])

drug_graph_edges = pd.DataFrame(drug_graph_edges, columns=['graph_id', 'src', 'dst'])

drug_graph_properties = pd.DataFrame(drug_graph_properties, columns=['graph_id', 'label', 'num_nodes'])

drug_graph_nodes = pd.DataFrame(drug_graph_nodes, columns=['graph_id', 'atom_num'])

In [54]:
drug_graph_properties.head() # label and atom nodes for each molecular graph

Unnamed: 0,graph_id,label,num_nodes
0,0,0,9
1,1,1,11
2,2,2,90
3,3,3,16
4,4,4,19


In [69]:
# count the atom number for each drug molecule
atom_set=list(set(drug_graph_nodes['atom_num']))
atom_set.sort()
atomnum2id={atom: i for i,atom in enumerate(atom_set)}
print(atomnum2id)

# test for embedding atom numbers
atom_embedding=torch.nn.Embedding(len(atom_set),64)
atom_rel_list=[atomnum2id[i] for i in atom_set]
print(atom_rel_list)

atom_embedding=atom_embedding(torch.LongTensor(atom_rel_list))
print(atom_embedding.shape)
print(torch.LongTensor(atom_rel_list).size())

print('set(drug_graph_nodes[atom_num]):', set(drug_graph_nodes['atom_num']))

# store drug related domain knowledge
with open(prefix + midfix + 'atomnum2id_dict.pickle','wb') as out_file:
    pickle.dump(atomnum2id,out_file)

# mapping from relative drug ids to correspongding ECFP6
with open(prefix + midfix + 'drugid2morgan.pickle','wb') as out_file:
    pickle.dump(drugid2morgan, out_file)

# save the molecular graph information related to involved drugs into the original data folder 
drug_graph_edges.to_csv(prefix + midfix + 'drug_graph_edges.csv',index=0)
drug_graph_properties.to_csv(prefix + midfix + 'drug_graph_properties.csv',index=0)
drug_graph_nodes.to_csv(prefix + midfix + 'drug_graph_nodes.csv',index=0)

{5: 0, 6: 1, 7: 2, 8: 3, 9: 4, 15: 5, 16: 6, 17: 7, 35: 8}
[0, 1, 2, 3, 4, 5, 6, 7, 8]
torch.Size([9, 64])
torch.Size([9])
set(drug_graph_nodes[atom_num]): {35, 5, 6, 7, 8, 9, 15, 16, 17}


In [48]:
# another test for generate drug molecular files
class DrugStrucDataset(DGLDataset):
    def __init__(self):
        super().__init__(name='drugstruc')

    def process(self):
        # read the molecular graph information related to involved drugs from the original data folder 
        edges = pd.read_csv(prefix + midfix + 'drug_graph_edges.csv')
        properties = pd.read_csv(prefix + midfix + 'drug_graph_properties.csv')
        nodes = pd.read_csv(prefix + midfix + 'drug_graph_nodes.csv')
        self.graphs = []
        self.labels = []

        # Create a graph for each graph ID from the edges table.
        # First process the properties table into two dictionaries with graph IDs as keys.
        # The label and number of nodes are values.
        label_dict = {}
        num_nodes_dict = {}
        for _, row in properties.iterrows():
            label_dict[row['graph_id']] = row['label']
            num_nodes_dict[row['graph_id']] = row['num_nodes']

        # For the edges, first group the table by graph IDs.
        edges_group = edges.groupby('graph_id')
        nodes_group = nodes.groupby('graph_id')

        # For each graph ID...
        for graph_id in edges_group.groups:
            # Find the edges as well as the number of nodes and its label.
            edges_of_id = edges_group.get_group(graph_id)
            nodes_of_id = nodes_group.get_group(graph_id)
            src = edges_of_id['src'].to_numpy()
            dst = edges_of_id['dst'].to_numpy()
            num_nodes = num_nodes_dict[graph_id]
            label = label_dict[graph_id]
            atom_features=torch.from_numpy(nodes_of_id['atom_num'].to_numpy())
            atom_features = atom_features.type(torch.float32)

            # Create a graph and add it to the list of graphs and labels.
            # in other words, create the dgl graph correspondinf to each drug molecular sub-graph and add node features for each graph here
            g = dgl.graph((src, dst), num_nodes=num_nodes)
            g.ndata['atom_num'] = atom_features
            self.graphs.append(g)
            self.labels.append(label) # each graph has a label created by its graph id

        # Convert the label list to tensor for saving.
        self.labels = torch.LongTensor(self.labels)

    def __getitem__(self, i):
        return self.graphs[i], self.labels[i]

    def __len__(self):
        return len(self.graphs)
    
# test
dataset = DrugStrucDataset()
graph, label = dataset[10]
print(graph, label) # dgl graph object for the 11th molecular graph + 11th numerical label
print('dataset.labels:', dataset.labels) # all numerical labels for every molecular graph

Graph(num_nodes=13, num_edges=39,
      ndata_schemes={'atom_num': Scheme(shape=(), dtype=torch.float32)}
      edata_schemes={}) tensor(10)
dataset.labels: tensor([  0,   1,   2,   3,   4,   5,   6,   7,   8,   9,  10,  11,  12,  13,
         14,  15,  16,  17,  18,  19,  20,  21,  22,  23,  24,  25,  26,  27,
         28,  29,  30,  31,  32,  33,  34,  35,  36,  37,  38,  39,  40,  41,
         42,  43,  44,  45,  46,  47,  48,  49,  50,  51,  52,  53,  54,  55,
         56,  57,  58,  59,  60,  61,  62,  63,  64,  65,  66,  67,  68,  69,
         70,  71,  72,  73,  74,  75,  76,  77,  78,  79,  80,  81,  82,  83,
         84,  85,  86,  87,  88,  89,  90,  91,  92,  93,  94,  95,  96,  97,
         98,  99, 100, 101, 102, 103, 104, 105])


In [73]:
print('len(drug2relid_dict):', len(drug2relid_dict))
print('len(target2relid_dict):', len(target2relid_dict))
print('len(cellline2relid_dict):', len(cellline2relid_dict))

len(drug2relid_dict): 106
len(target2relid_dict): 12217
len(cellline2relid_dict): 60
