# Isozymes in E. coli

This notebook contains a preliminary study of isozymes in _E. coli_.

Benjamín J. Sánchez, 2020-02-04

## 1. Loading Model and Data

In [1]:
import cameo
import pandas as pd
import urllib

# E. coli model:
import cameo
model = cameo.load_model("iML1515")



In [2]:
# proteomics data:
df = pd.read_csv("s05_proteomics_data_raw.csv", index_col=0)
print(df)

        molecular_weight  chemostat_0.5_mean  chemostat_0.35_mean  \
P0A8T7      155045.00800                4780                 3900   
P0A8V2      150520.27580                5245                 4388   
P36683       93420.94570               15733                20261   
P15254      141295.89840                2285                 1730   
P09831      163176.31530                2321                 1959   
...                  ...                 ...                  ...   
P0ACS2       17121.07240                   1                    1   
P0AA97       20845.49274                   1                    1   
P0AB83       23529.40171                   4                    4   
P23862       20344.80503                   8                    8   
P77433       25178.92327                   0                    3   

        chemostat_0.2_mean  chemostat_0.12_mean  chemostat_0.5_uncertainty  \
P0A8T7                3477                 3000                       8.68   
P0A8V2         

In [3]:
# uniprot mapper of all uniprot codes in the data:
url = "https://www.uniprot.org/uploadlists/"
params = {
"from": "ACC+ID",
"to": "GENENAME",
"format": "tab",
"query": " ".join(df.index.tolist())  # all 
}
data = urllib.parse.urlencode(params).encode("utf-8")
req = urllib.request.Request(url, data)
f = urllib.request.urlopen(req)
response = f.read().decode("utf-8")
uniprot_file = open("uniprot.txt","w")
uniprot_file.write(response)
uniprot_file.close()
uniprot_dict = pd.read_csv("uniprot.txt", index_col=0, sep = "\t")
print(uniprot_dict)

          To
From        
P0A8T7  rpoC
P0A8V2  rpoB
P36683  acnB
P15254  purL
P09831  gltB
...      ...
P0ACS2  soxR
P0AA97  yaeQ
P0AB83   nth
P23862  priC
P77433  ykgG

[2055 rows x 1 columns]


## 2. Isozyme occurrence

In [4]:
isozymes_in_model = 0
for reaction in model.reactions:
    if " or " in reaction.gene_reaction_rule:
        isozymes_in_model += 1
print("Number of reactions in the model with isozymes: " + str(isozymes_in_model))

Number of reactions in the model with isozymes: 743


In [5]:
# count isozymes in data:
isozymes_in_data = []
for gene_A in model.genes:
    try:
        protein_A = uniprot_dict[uniprot_dict["To"]==gene_A.name].index.tolist()[0]
        if protein_A in df.index:
            for gene_B in model.genes:
                if gene_A != gene_B:
                    try:
                        protein_B = uniprot_dict[uniprot_dict["To"]==gene_B.name].index.tolist()[0]
                        if protein_B in df.index:
                            for reaction_A in gene_A.reactions:
                                if gene_B.id in reaction_A.gene_reaction_rule and not " and " in reaction_A.gene_reaction_rule:
                                    isozymes_in_data.append([protein_A, protein_B])
                                    break
                    except:
                        pass
    except:
        pass
    print("done with gene " + gene_A.name)
print("Number of reactions with isozymes: " + str(len(isozymes_in_data)/2))  # Every occurrence is counted twice

done with gene glyA
done with gene ltaE
done with gene cysG
done with gene hemF
done with gene talB
done with gene gor
done with gene tktB
done with gene pyrD
done with gene glcF
done with gene garL
done with gene glcE
done with gene glcD
done with gene pfkA
done with gene fabF
done with gene lpxL
done with gene lpxM
done with gene trpA
done with gene lpxP
done with gene nadC
done with gene acpP
done with gene aas
done with gene dapE
done with gene tktA
done with gene trpB
done with gene glpD
done with gene glpB
done with gene glpC
done with gene glpA
done with gene tyrB
done with gene ilvE
done with gene aroE
done with gene ydiB
done with gene proA
done with gene ynfH
done with gene manA
done with gene ribD
done with gene dmsA
done with gene ynfF
done with gene ynfE
done with gene dmsC
done with gene ynfG
done with gene dmsB
done with gene ribB
done with gene ribF
done with gene ghrB
done with gene nagB
done with gene ybjI
done with gene cof
done with gene adhP
done with gene cobC
don

done with gene accB
done with gene accA
done with gene fsaB
done with gene mqo
done with gene astD
done with gene accC
done with gene pdxA
done with gene fsaA
done with gene pdxJ
done with gene hldD
done with gene nadK
done with gene hemB
done with gene idnD
done with gene purD
done with gene menF
done with gene purL
done with gene ghrA
done with gene eutC
done with gene argE
done with gene menC
done with gene eutB
done with gene entA
done with gene entB
done with gene cpsB
done with gene sgbE
done with gene add
done with gene cyaA
done with gene araD
done with gene adeD
done with gene suhB
done with gene ulaF
done with gene purA
done with gene prpC
done with gene yjjG
done with gene rsgA
done with gene umpH
done with gene nagA
done with gene selB
done with gene yfdR
done with gene argK
done with gene yfbR
done with gene ansA
done with gene hypB
done with gene iaaA
done with gene gloA
done with gene yeiR
done with gene ybhA
done with gene asnA
done with gene yjiA
done with gene asnB
do

done with gene gloB
done with gene amyA
done with gene gpp
done with gene malS
done with gene xanP
done with gene xdhC
done with gene adeP
done with gene spoT
done with gene xdhB
done with gene fadL
done with gene adeQ
done with gene xdhA
done with gene cpdB
done with gene nanC
done with gene solA
done with gene alsB
done with gene cobT
done with gene alsA
done with gene arsB
done with gene alsC
done with gene ybbW
done with gene araG
done with gene yniC
done with gene lyxK
done with gene patD
done with gene wcaH
done with gene araH
done with gene araF
done with gene idnT
done with gene epd
done with gene hisH
done with gene yliI
done with gene hisF
done with gene acrF
done with gene dut
done with gene acrE
done with gene gcd
done with gene panE
done with gene rhaT
done with gene ilvA
done with gene mgtA
done with gene ghxP
done with gene pncB
done with gene ghxQ
done with gene selD
done with gene hyaC
done with gene nikD
done with gene mglB
done with gene nikB
done with gene nikA
done

done with gene avtA
done with gene fiu
done with gene lysU
done with gene psd
done with gene cirA
done with gene sdhA
done with gene sdhD
done with gene sdhB
done with gene sdhC
done with gene bglF
done with gene chiP
done with gene yddG
done with gene pheP
done with gene tesA
done with gene entE
done with gene acnA
done with gene yihU
done with gene ampH
done with gene mdtJ
done with gene acnB
done with gene ggt
done with gene mdtI
done with gene dacA
done with gene lhgO
done with gene ldtA
done with gene dacC
done with gene ldtC
done with gene nnr
done with gene dacD
done with gene alaE
done with gene ldtB
done with gene yfeW
done with gene mltA
done with gene dacB
done with gene mltD
done with gene yceG
done with gene yqjH
done with gene ubiE
done with gene emtA
done with gene glxK
done with gene mltB
done with gene yagF
done with gene yjhG
done with gene yjhH
done with gene yagE
done with gene yieH
done with gene allC
done with gene allE
done with gene uidA
done with gene ydiO
done