# GPR Annotation

### 1 - Generation of Orthologs List for Human and CHO genes with NIH gene IDs

A dataset containing the Ensembl IDs of orthologous genes between Human and Chinese Hamster was obtained from BioMart. Two datasets containing complete gene lists for the Human and Chinese Hamster organisms were obtained from NIH Datasets https://www.ncbi.nlm.nih.gov/datasets/. Furthermore, two datasets containing Ensembl and Entrez IDs for both Human and CHO were obtained from DAVID https://david.ncifcrf.gov/tools.jsp. The final "orthologs" dataset contains all the orthologous genes from Human and Hamster with their corresponding NIH IDs. Finally, one dataset containing CHO and Human gene orthologs from the InParanoid database https://inparanoid.sbc.su.se was used to fill in the genes that were still missing an ID.

In [8]:
import pandas as pd
import numpy as np

In [9]:
# Build the orthologs table from the BioMart export:
#   1. read the file,
#   2. discard every row that has a missing value,
#   3. remove the versioned gene ID column, which is not used,
#   4. give the remaining columns species-specific names.
orthologs = (
    pd.read_csv('../Data/GPR_Curation/mart_export-3.txt')
    .dropna()
    .drop(columns=['Gene stable ID version'])
    .rename(
        columns={
            'Gene stable ID': 'CHO Ensembl ID',
            'Gene name': 'CHO Gene Name',
            'Human gene stable ID': 'Human Ensembl ID',
            'Human gene name': 'Human Gene Name',
        }
    )
)

orthologs

Unnamed: 0,CHO Ensembl ID,CHO Gene Name,Human Ensembl ID,Human Gene Name
5,ENSCGRG00001000006,ND1,ENSG00000198888,MT-ND1
9,ENSCGRG00001000010,ND2,ENSG00000198763,MT-ND2
15,ENSCGRG00001000016,COX1,ENSG00000198804,MT-CO1
18,ENSCGRG00001000019,COX2,ENSG00000198712,MT-CO2
20,ENSCGRG00001000021,ATP8,ENSG00000228253,MT-ATP8
...,...,...,...,...
27530,ENSCGRG00001025067,Ero1b,ENSG00000086619,ERO1B
27531,ENSCGRG00001025068,Pcp4l1,ENSG00000248485,PCP4L1
27532,ENSCGRG00001025069,Slc30a1,ENSG00000170385,SLC30A1
27534,ENSCGRG00001025071,Zfp605,ENSG00000196458,ZNF605


Dictionaries built from the NCBI datasets are used to map gene names to Entrez Gene IDs.

In [10]:
# Human gene symbol -> Entrez Gene ID lookup, built from the NCBI gene list
human_genes = (
    pd.read_csv('../Data/GPR_Curation/human_ncbi_genes.txt', sep='\t')
    .rename(
        columns={
            'Symbol': 'Human Gene Name',
            'NCBI GeneID': 'Human GeneID',
        }
    )
)
# Index the IDs by symbol first, then turn the Series into a plain dict
human_id_by_symbol = human_genes.set_index('Human Gene Name')['Human GeneID']
human_dict = human_id_by_symbol.to_dict()
human_dict

{'TP53': 7157,
 'EGFR': 1956,
 'TNF': 7124,
 'APOE': 348,
 'VEGFA': 7422,
 'IL6': 3569,
 'TGFB1': 7040,
 'MTHFR': 4524,
 'ERBB2': 2064,
 'HIF1A': 3091,
 'ESR1': 2099,
 'IL10': 3586,
 'APP': 351,
 'ACE': 1636,
 'BRCA1': 672,
 'STAT3': 6774,
 'MMP9': 4318,
 'CRP': 1401,
 'KRAS': 3845,
 'BDNF': 627,
 'BRAF': 673,
 'ADIPOQ': 9370,
 'AR': 367,
 'AKT1': 207,
 'ABCB1': 5243,
 'HLA-DRB1': 3123,
 'NFKB1': 4790,
 'VDR': 7421,
 'IL1B': 3553,
 'CDKN2A': 1029,
 'PTEN': 5728,
 'LOC110806262': 110806262,
 'CTNNB1': 1499,
 'TLR4': 7099,
 'PTGS2': 5743,
 'NOS3': 4846,
 'CFTR': 1080,
 'COMT': 1312,
 'SNCA': 6622,
 'CXCL8': 3576,
 'CD274': 29126,
 'TERT': 7015,
 'PPARG': 5468,
 'SLC6A4': 6532,
 'MYC': 4609,
 'MAPT': 4137,
 'HLA-B': 3106,
 'MTOR': 2475,
 'CDH1': 999,
 'IGF1': 3479,
 'BCL2': 596,
 'LEP': 3952,
 'CXCR4': 7852,
 'GSTM1': 2944,
 'IFNG': 3458,
 'BRCA2': 675,
 'MDM2': 4193,
 'JAK2': 3717,
 'MMP2': 4313,
 'CD4': 920,
 'NFE2L2': 4780,
 'MAPK1': 5594,
 'CCND1': 595,
 'IL17A': 3605,
 'SERPINE1': 50

In [11]:
# CHO gene symbol -> Entrez Gene ID lookup, built from the NCBI gene list
cho_genes = (
    pd.read_csv('../Data/GPR_Curation/cho_ncbi_genes.txt', sep='\t')
    .rename(
        columns={
            'Symbol': 'CHO Gene Name',
            'NCBI GeneID': 'CHO GeneID',
        }
    )
)
# Index the IDs by symbol first, then turn the Series into a plain dict
cho_id_by_symbol = cho_genes.set_index('CHO Gene Name')['CHO GeneID']
cho_dict = cho_id_by_symbol.to_dict()
cho_dict

{'Scap': 100689048,
 'Nsf': 100770898,
 'Abcb1': 100682536,
 'Dhfr': 100689028,
 'Ercc2': 100689272,
 'Tubb': 100689091,
 'Pea15': 100736554,
 'Sar1b': 100758826,
 'Pex5': 100689015,
 'Rad51c': 100689078,
 'Hspa5': 100689305,
 'Hmgcr': 100756363,
 'Tp53': 100682525,
 'Mgat1': 100682529,
 'Rpsa': 100689045,
 'Eef2': 100689051,
 'Slc20a2': 100689023,
 'Hs6st1': 100689173,
 'Ubb': 100689268,
 'Cbr3': 100689021,
 'Kif2c': 100689309,
 'Mt1': 100689478,
 'Mir7a': 102466467,
 'Mt2': 100689479,
 'Polr2a': 100689016,
 'Srebf2': 100689017,
 'Dpagt1': 100689054,
 'Casp3': 100689061,
 'Ldha': 100689064,
 'Cxcl3': 100689100,
 'Eef1a1': 100689276,
 'Rps14': 100689292,
 'Akr1b8': 100689318,
 'Xrcc1': 100689414,
 'Npc1': 100689424,
 'Ptdss2': 100689448,
 'Parp1': 100689463,
 'Smu1': 100736555,
 'Prnp': 100762792,
 'Kars1': 100766627,
 'Mpdu1': 100689049,
 'Mbtps1': 100689417,
 'Bdnf': 100768664,
 'Ap3m1': 100689277,
 'Adam17': 100684971,
 'Pisd': 100689093,
 'Ugp2': 100689325,
 'Ldlr': 100689399,
 'Hs

Dictionaries built from the DAVID datasets are used to map Ensembl IDs to Entrez Gene IDs.

In [12]:
# DAVID conversion table for human genes: the 'From' column (Ensembl ID)
# becomes the key and the 'To' column (Entrez Gene ID) the value.
human_david = pd.read_csv(
    '../Data/GPR_Curation/david_output_human.txt',
    sep='\t',
)
human_entrez_by_ensembl = human_david.set_index('From')['To']
human_dict2 = human_entrez_by_ensembl.to_dict()
human_dict2

{'ENSG00000215203': 389207,
 'ENSG00000179029': 84314,
 'ENSG00000179023': 127707,
 'ENSG00000180011': 284273,
 'ENSG00000131089': 23229,
 'ENSG00000170689': 3219,
 'ENSG00000013810': 10460,
 'ENSG00000205884': 613210,
 'ENSG00000131080': 60401,
 'ENSG00000168374': 378,
 'ENSG00000179021': 285237,
 'ENSG00000156381': 122416,
 'ENSG00000182685': 283870,
 'ENSG00000182687': 8811,
 'ENSG00000143079': 55917,
 'ENSG00000180008': 122809,
 'ENSG00000025800': 23633,
 'ENSG00000143061': 3321,
 'ENSG00000156374': 84108,
 'ENSG00000131096': 5697,
 'ENSG00000181350': 388341,
 'ENSG00000131095': 2670,
 'ENSG00000131097': 51751,
 'ENSG00000168389': 84879,
 'ENSG00000131094': 10882,
 'ENSG00000182670': 7267,
 'ENSG00000168386': 11259,
 'ENSG00000144395': 284992,
 'ENSG00000143067': 90874,
 'ENSG00000182676': 116729,
 'ENSG00000180035': 197407,
 'ENSG00000155034': 80028,
 'ENSG00000179044': 283849,
 'ENSG00000118094': 11181,
 'ENSG00000179046': 205860,
 'ENSG00000157693': 203197,
 'ENSG00000168394': 6

In [13]:
# DAVID conversion table for CHO genes: the 'From' column (Ensembl ID)
# becomes the key and the 'To' column (Entrez Gene ID) the value.
cho_david = pd.read_csv(
    '../Data/GPR_Curation/david_output_cho.txt',
    sep='\t',
)
cho_entrez_by_ensembl = cho_david.set_index('From')['To']
cho_dict2 = cho_entrez_by_ensembl.to_dict()
cho_dict2

{'ENSCGRG00001018393': 100767767,
 'ENSCGRG00001017062': 100770447,
 'ENSCGRG00001018390': 100759155,
 'ENSCGRG00001017061': 100751868,
 'ENSCGRG00001018391': 100753400,
 'ENSCGRG00001017060': 100756731,
 'ENSCGRG00001017067': 100764339,
 'ENSCGRG00001017066': 100756003,
 'ENSCGRG00001018399': 100769638,
 'ENSCGRG00001005074': 100754819,
 'ENSCGRG00001005078': 113837268,
 'ENSCGRG00001005076': 100769225,
 'ENSCGRG00001017073': 100759646,
 'ENSCGRG00001017076': 100756306,
 'ENSCGRG00001017070': 100754902,
 'ENSCGRG00001017071': 100760100,
 'ENSCGRG00001017078': 100756850,
 'ENSCGRG00001017079': 100762299,
 'ENSCGRG00001005061': 100751441,
 'ENSCGRG00001014803': 100770376,
 'ENSCGRG00001005062': 103161413,
 'ENSCGRG00001014809': 100763237,
 'ENSCGRG00001014805': 100755256,
 'ENSCGRG00001006396': 100763695,
 'ENSCGRG00001005065': 100752292,
 'ENSCGRG00001014807': 100771751,
 'ENSCGRG00001005066': 100757565,
 'ENSCGRG00001017085': 100756377,
 'ENSCGRG00001017087': 100765826,
 'ENSCGRG00001

In [38]:
# Lookup built from the paranoid dataset obtained by Hooman in 2016.
# Keys are Human Gene IDs, values are the CHO Gene IDs of their "orthologs".
# The file has no header row, so the column names are supplied here, and
# every value is converted to a string.
cho_paranoid_df = pd.read_csv(
    '../Data/GPR_Curation/human.cho.id.final.with.mito.with.inparanoid',
    sep=';',
    names=['Human IDs', 'CHO IDs'],
).astype(str)
cho_id_by_human_id = cho_paranoid_df.set_index('Human IDs')['CHO IDs']
cho_paranoid_dict = cho_id_by_human_id.to_dict()
cho_paranoid_dict

{'10000': '100752454',
 '1000': '100689204',
 '10001': '100762349',
 '10002': '100752298',
 '10003': '100769032',
 '10004': '100768106',
 '10005': '100761464',
 '10006': '100772463',
 '10007': '100689210',
 '10008': '100755499',
 '10009': '100763419',
 '100': '100756254',
 '10010': '100764984',
 '100101267': '100762026',
 '100101467': '100766295',
 '1001': '100758473',
 '10011': '100753253',
 '100113407': '100763981',
 '100125288': '100761549',
 '100127206': '100772872',
 '100127889': '100762880',
 '100127983': '100771996',
 '100128569': '100762642',
 '100128731': '100762772',
 '100128927': '100752108',
 '100129094': '100762433',
 '100129271': '100756558',
 '100129361': '103159661',
 '100129480': '100768732',
 '100129520': '100754139',
 '100129583': '100760554',
 '100129669': '100761208',
 '100129792': '100763254',
 '100129924': '100773888',
 '100130097': '103161207',
 '100130274': '100763932',
 '100130301': '100763417',
 '100130311': '100770028',
 '100130348': '100767526',
 '100130361

In [54]:
# Map the lookup dictionaries onto the orthologs dataset.
#
# Each Entrez Gene ID is resolved from three sources, in order of priority:
#   1. NCBI gene list, keyed by gene name,
#   2. DAVID conversion table, keyed by Ensembl ID,
#   3. InParanoid Human <-> CHO pairs, keyed by the ID of the other species.
# The fallbacks are applied with vectorised `Series.where` calls: assigning to
# the `row` yielded by `DataFrame.iterrows()` is not guaranteed to write back
# to the frame.


def _mapped_ids(keys, id_lookup):
    """Map `keys` through `id_lookup` and return the IDs as clean strings.

    Parameters
    ----------
    keys : pd.Series
        Gene names or Ensembl IDs to look up.
    id_lookup : dict
        Mapping from key to gene ID.

    Returns
    -------
    pd.Series
        String IDs aligned with `keys`; keys without a match become ''.
    """
    return (
        keys.map(id_lookup)
        .fillna('')
        .astype(str)
        # Missing values make pandas upcast integer IDs to float ("7157.0");
        # strip only a trailing ".0" rather than any ".0" inside the string.
        .str.replace(r'\.0$', '', regex=True)
    )


# CHO Genes
cho_id_from_name = _mapped_ids(orthologs['CHO Gene Name'], cho_dict)
cho_id_from_david = _mapped_ids(orthologs['CHO Ensembl ID'], cho_dict2)

# Human Genes (the human Ensembl IDs must go through the *human* DAVID table)
human_id_from_name = _mapped_ids(orthologs['Human Gene Name'], human_dict)
human_id_from_david = _mapped_ids(orthologs['Human Ensembl ID'], human_dict2)

# Replace empty values with the values obtained from DAVID
cho_ids = cho_id_from_name.where(cho_id_from_name != '', cho_id_from_david)
human_ids = human_id_from_name.where(human_id_from_name != '', human_id_from_david)

# Replace the rest of the empty values with those from the InParanoid dataset.
# The InParanoid table was cast to str, so missing entries show up as 'nan'.
missing_markers = ('', 'nan')
paranoid_cho_by_human = {
    human_id: cho_id
    for human_id, cho_id in cho_paranoid_dict.items()
    if human_id not in missing_markers and cho_id not in missing_markers
}
# Reverse lookup; when several human genes share one CHO gene the first pair wins,
# so that each cell holds a single ID instead of a list.
paranoid_human_by_cho = {}
for human_id, cho_id in paranoid_cho_by_human.items():
    paranoid_human_by_cho.setdefault(cho_id, human_id)

cho_ids = cho_ids.where(cho_ids != '', human_ids.map(paranoid_cho_by_human).fillna(''))
human_ids = human_ids.where(human_ids != '', cho_ids.map(paranoid_human_by_cho).fillna(''))

orthologs = orthologs.assign(**{'CHO GeneID': cho_ids, 'Human GeneID': human_ids})

# Reorganize columns (helper columns, if any, are dropped by this selection)
orthologs = orthologs[['CHO Gene Name','CHO GeneID', 'CHO Ensembl ID', 'Human Gene Name', 'Human GeneID','Human Ensembl ID']]
orthologs = orthologs.reset_index(drop = True)

orthologs.to_excel('../Data/GPR_Curation/orthologs.xlsx')
orthologs

Unnamed: 0,CHO Gene Name,CHO GeneID,CHO Ensembl ID,Human Gene Name,Human GeneID,Human Ensembl ID
0,ND1,3979183,ENSCGRG00001000006,MT-ND1,4535,ENSG00000198888
1,ND2,3979184,ENSCGRG00001000010,MT-ND2,4536,ENSG00000198763
2,COX1,3979185,ENSCGRG00001000016,MT-CO1,4512,ENSG00000198804
3,COX2,3979186,ENSCGRG00001000019,MT-CO2,4513,ENSG00000198712
4,ATP8,3979187,ENSCGRG00001000021,MT-ATP8,4509,ENSG00000228253
...,...,...,...,...,...,...
18152,Ero1b,100764579,ENSCGRG00001025067,ERO1B,56605,ENSG00000086619
18153,Pcp4l1,100770275,ENSCGRG00001025068,PCP4L1,654790,ENSG00000248485
18154,Slc30a1,100751596,ENSCGRG00001025069,SLC30A1,7779,ENSG00000170385
18155,Zfp605,100767561,ENSCGRG00001025071,ZNF605,100289635,ENSG00000196458


### 2 - Finding CHO orthologs for Human GPRs in Recon3D

Using the "orthologs" dataset generated above, we map the human genes in the GPR column of the Recon3D dataset to their CHO orthologs and generate a new column, "CHO GPR".

In [1]:
import cobra
from cobra.io.mat import load_matlab_model

In [2]:
# Load the Recon3D model from its MATLAB file.
# NOTE(review): load_matlab_model() requires scipy; the recorded run of this cell
# failed with ImportError. `recon3d` is reassigned further down from
# recon3d_gprs.xlsx, so confirm whether this cell is still needed.
recon3d = load_matlab_model('../Data/GPR_Curation/Recon3D_301.mat')

ImportError: load_matlab_model() requires scipy.

In [55]:
# Build the Recon3D table: one row per reaction (groupby(...).first() keeps the
# first non-null entry of each column within a reaction), with missing gene
# reaction rules turned into empty strings.
recon3d = (
    pd.read_excel('../Data/GPR_Curation/recon3d_gprs.xlsx')
    .groupby('m_reaction')
    .first()
    .assign(
        m_gene_reaction_rule=lambda reactions: reactions['m_gene_reaction_rule'].fillna('')
    )
)
recon3d

Unnamed: 0_level_0,m_gene_reaction_rule,m_metabolites,m_subsystem,m_gene,seq_uniprot,seq_len,seq_file,seq_num_structures,seq_num_experimental_structures,struct_id,struct_chain_id,struct_chain_seq_coverage,struct_is_experimental,struct_pdb,struct_resolution,struct_chemicals,struct_file
m_reaction,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1
11DOCRTSLte,5243.1,h2o[c];atp[c];h[c];11docrtsl[c];11docrtsl[e];p...,"Transport, extracellular",5243.1,P08183-1,1280.0,P08183-1.fasta,21.0,21.0,3g61-A,A,80.5,1.0,3g61,4.35,2J8,3g61-A_clean.pdb
11DOCRTSTRNte,5243.1,atp[c];pi[c];11docrtstrn[c];h[c];11docrtstrn[e...,"Transport, extracellular",5243.1,P08183-1,1280.0,P08183-1.fasta,21.0,21.0,3g61-A,A,80.5,1.0,3g61,4.35,2J8,3g61-A_clean.pdb
12DHCHOLabc,8714.3 or 8647.1 or 8714.2 or 8714.1 or 1244.1...,atp[c];12dhchol[e];12dhchol[c];pi[c];h[c];h2o[...,"Transport, extracellular",1244.1,Q92887-1,1545.0,Q92887-1.fasta,0.0,0.0,,,,,,,,
12DHCHOLt,28234.1 or 10599.1 or 123264.1 or 200931.1,hco3[c];12dhchol[e];12dhchol[c];hco3[e],"Transport, extracellular",123264.1,Q9NPD5-1,702.0,Q9NPD5-1.fasta,0.0,0.0,,,,,,,,
12DHCHOLt2,6554.1 or 6555.1,na1[e];12dhchol[c];12dhchol[e];na1[c],"Transport, extracellular",6555.1,Q12908-1,348.0,Q12908-1.fasta,2.0,0.0,H19894-X,X,99.7,0.0,,,,NP_000443.1_model1_clean-X_clean.pdb
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
r2525,8501.1,gln_L[c];gln_L[e],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb
r2526,8501.1,ser_L[e];ser_L[c],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb
r2532,8501.1,asn_L[c];asn_L[e],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb
r2534,8501.1,thr_L[c];thr_L[e],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb


In [56]:
# Orthologs dict: Human Entrez Gene ID -> CHO Entrez Gene ID.
# Rows missing either ID are left out, so no '' key is created and an unmapped
# duplicate row cannot overwrite a valid mapping for the same human gene.
# When a human gene still appears in several rows, the last row wins.
has_both_ids = (orthologs['Human GeneID'] != '') & (orthologs['CHO GeneID'] != '')
orthologs_dict = (
    orthologs.loc[has_both_ids]
    .set_index('Human GeneID')['CHO GeneID']
    .to_dict()
)
orthologs_dict

{'4535': '3979183',
 '4536': '3979184',
 '4512': '3979185',
 '4513': '3979186',
 '4509': '3979187',
 '4508': '3979188',
 '4514': '3979189',
 '4537': '3979190',
 '4539': '3979178',
 '4538': '3979179',
 '4540': '3979180',
 '4541': '3979181',
 '4519': '3979182',
 '54859': '100764169',
 '203523': '100764457',
 '55813': '100761515',
 '901': '100753075',
 '9840': '100754149',
 '6919': '100768573',
 '5885': '100750544',
 '1910': '100762726',
 '26022': '100762391',
 '84432': '100768325',
 '90187': '100771706',
 '1763': '100761842',
 '4026': '100753874',
 '79184': '100753541',
 '64795': '100766802',
 '100507003': '100772084',
 '4841': '100757453',
 '84311': '100755070',
 '10864': '100757046',
 '6857': '100753843',
 '51268': '100765858',
 '59272': '100772552',
 '58516': '100760112',
 '645104': '100769210',
 '64857': '100761461',
 '165904': '100756551',
 '8722': '100756958',
 '1896': '100768945',
 '28959': '100764547',
 '125115': '100758909',
 '2188': '103161842',
 '144809': '113832672',
 '10873'

In [57]:
# Extract GPR info from Recon3D and swap gene IDs from human to CHO
import re

# One gene token inside a rule, e.g. "8714.3" (gene ID followed by a version suffix).
GENE_TOKEN = re.compile(r'[\d.]*\d+')


def _cho_gene_for(token_match):
    """Return the CHO gene ID for one matched human gene token.

    The part before the first '.' is looked up in `orthologs_dict`. Genes with
    no CHO ortholog (missing key or empty value) are kept as the human ID
    prefixed with 'h', so they stay recognisable in the translated rule.
    """
    human_g = token_match.group(0).split('.')[0]
    cho_g = orthologs_dict.get(human_g, '')
    if cho_g == '':
        return f'h{human_g}'
    return cho_g


# Substituting token by token keeps each replacement confined to its own match.
# A plain str.replace would also rewrite longer IDs that merely contain the
# token (e.g. "8714.1" inside "28714.1") and digits of already inserted CHO IDs.
cho_gpr = [
    GENE_TOKEN.sub(_cho_gene_for, rule) if rule != "" else ''
    for rule in recon3d['m_gene_reaction_rule']
]

In [59]:
# Attach the translated rules as the "CHO GPR" column and export the
# extended Recon3D table to Excel.
recon3d = recon3d.assign(**{'CHO GPR': cho_gpr})
recon3d.to_excel('../Data/GPR_Curation/recon3D_chogprs.xlsx')
recon3d

Unnamed: 0_level_0,m_gene_reaction_rule,m_metabolites,m_subsystem,m_gene,seq_uniprot,seq_len,seq_file,seq_num_structures,seq_num_experimental_structures,struct_id,struct_chain_id,struct_chain_seq_coverage,struct_is_experimental,struct_pdb,struct_resolution,struct_chemicals,struct_file,CHO GPR
m_reaction,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1
11DOCRTSLte,5243.1,h2o[c];atp[c];h[c];11docrtsl[c];11docrtsl[e];p...,"Transport, extracellular",5243.1,P08183-1,1280.0,P08183-1.fasta,21.0,21.0,3g61-A,A,80.5,1.0,3g61,4.35,2J8,3g61-A_clean.pdb,100682536
11DOCRTSTRNte,5243.1,atp[c];pi[c];11docrtstrn[c];h[c];11docrtstrn[e...,"Transport, extracellular",5243.1,P08183-1,1280.0,P08183-1.fasta,21.0,21.0,3g61-A,A,80.5,1.0,3g61,4.35,2J8,3g61-A_clean.pdb,100682536
12DHCHOLabc,8714.3 or 8647.1 or 8714.2 or 8714.1 or 1244.1...,atp[c];12dhchol[e];12dhchol[c];pi[c];h[c];h2o[...,"Transport, extracellular",1244.1,Q92887-1,1545.0,Q92887-1.fasta,0.0,0.0,,,,,,,,,100767558 or 100762480 or 100767558 or 1007675...
12DHCHOLt,28234.1 or 10599.1 or 123264.1 or 200931.1,hco3[c];12dhchol[e];12dhchol[c];hco3[e],"Transport, extracellular",123264.1,Q9NPD5-1,702.0,Q9NPD5-1.fasta,0.0,0.0,,,,,,,,,100774298 or 100774298 or 100751085 or 100753765
12DHCHOLt2,6554.1 or 6555.1,na1[e];12dhchol[c];12dhchol[e];na1[c],"Transport, extracellular",6555.1,Q12908-1,348.0,Q12908-1.fasta,2.0,0.0,H19894-X,X,99.7,0.0,,,,NP_000443.1_model1_clean-X_clean.pdb,100756998 or 100689396
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
r2525,8501.1,gln_L[c];gln_L[e],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb,100757617
r2526,8501.1,ser_L[e];ser_L[c],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb,100757617
r2532,8501.1,asn_L[c];asn_L[e],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb,100757617
r2534,8501.1,thr_L[c];thr_L[e],"Transport, extracellular",8501.1,O75387-1,559.0,O75387-1.fasta,2.0,0.0,H16666-X,X,100.0,0.0,,,,NP_003618.1_model1_clean-X_clean.pdb,100757617
