In [3]:
import pandas as pd
import numpy as np
from Bio import SeqIO
from Bio.SeqRecord import SeqRecord
from Bio.Seq import Seq
from Bio import Entrez

### Gene Table.

Fields:
- name
- description
- organism
- nucleotide sequence
- chromosome
- start and end position
- strand
- translated sequence

For eukaryotes, the nucleotide sequence should be the spliced mRNA and the coordinates should span the entire locus. 

### Pathway Table.

Fields:
- name
- description. 

### Enzyme  Table.

Fields:
- name
- function
- enzyme commission  (EC) number

Multiple  genes  encode  enzymes  that  perform  the  same function, so there ought to be fewer enzymes than genes.

### Associative Tables.

1. There are relationships between enzymes and pathways—some enzymes belong to certain pathways. Many to Many. Many enzymes belong to many pathways.
2. There is an order to enzymes within pathways. How can the order be represented in a table? Use the same table as in 1. but add a number which represents the order, 0 being the first and the largest number being the last.
3. Genes in the gene table encode enzymes in the enzyme table. How can this be represented? many-to-many from enzymes to genes if we were trying to generalize, because of alternative splicing which allows a gene to code for many enzymes, and because many genes can code for enzymes that perform the same function. However for this lab the TA said it would be okay to do one-to-one

### Commands to create tables

CREATE TABLE IF NOT EXISTS genes (id INT PRIMARY KEY ASC,  name TEXT, description TEXT, chromosome TEXT, start INT, end INT, strand VARCHAR(1)); 

CREATE TABLE IF NOT EXISTS pathways (id INT PRIMARY KEY ASC, name TEXT, description TEXT); 

CREATE TABLE IF NOT EXISTS enzymes (id INT PRIMARY KEY ASC, name TEXT, function TEXT, ecn TEXT);

CREATE TABLE IF NOT EXISTS enzymes_pathways (id INT PRIMARY KEY ASC, enzyme_id INT,pathway_id INT,FOREIGN KEY(enzyme_id) REFERENCES enzymes(id),FOREIGN KEY(pathway_id) REFERENCES pathways(id));

CREATE TABLE IF NOT EXISTS genes_enzymes (id INT PRIMARY KEY ASC,
                                         gene_id INT,
                                         enzyme_id INT,
                                         FOREIGN KEY(gene_id) REFERENCES genes(id),
                                         FOREIGN KEY(enzyme_id) REFERENCES enzymes(id)
                                         );
                            

## DATA COLLECTION

Mapping from EC number to GI (gene identifier)
ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_sprot.dat.gz  
The EC number could be found in the DE field, the GI (gene identifier) in one of the DR lines. 

To find enzymes in pathways:  
https://www.genome.jp/kegg-bin/show_pathway?map00010  
To look up the enzymes:  
https://enzyme.expasy.org/  
To get the info:
https://www.uniprot.org/  


### Glycolysis
EC 5.4.2.2, 5.3.1.9, 4.1.2.13, 4.2.1.11
Phosphoglucomutase (alpha-D-glucose-1,6-bisphosphate-dependent).

#### 5.4.2.2
organisms:  
HUMAN: PGM2  
        1 gggctctgca gcggtagcac aagctcagcg atggcggctc cagaaggcag cggtctaggc
       61 gaggacgccc ggctggacca ggagaccgcc cagtggctgc gctgggacaa gaattcctta
      121 actttggagg cagtgaaacg actaatagca gaaggtaata aagaagaact acgaaaatgt
      181 tttggggccc gaatggagtt tgggacagct ggcctccgag ctgctatggg acctggaatt
      241 tctcgtatga atgacttgac catcatccag actacacagg gattttgcag atacctggaa
      301 aaacaattca gtgacttaaa gcagaaaggc atcgtgatca gttttgacgc ccgagctcat
      361 ccatccagtg ggggtagcag cagaaggttt gcccgacttg ctgcaaccac atttatcagt
      421 caggggattc ctgtgtacct cttttctgat ataacgccaa ccccctttgt gcccttcaca
      481 gtatcacatt tgaaactttg tgctggaatc atgataactg catctcacaa tccaaagcag
      541 gataatggtt ataaggtcta ttgggataat ggagctcaga tcatttctcc tcacgataaa
      601 gggatttctc aagctattga agaaaatcta gaaccgtggc ctcaagcttg ggacgattct
      661 ttaattgata gcagtccact tctccacaat ccgagtgctt ccatcaataa tgactacttt
      721 gaagacctta aaaagtactg tttccacagg agcgtgaaca gggagacaaa ggtgaagttt
      781 gtgcacacct ctgtccatgg ggtgggtcat agctttgtgc agtcagcttt caaggctttt
      841 gaccttgttc ctcctgaggc tgttcctgaa cagagagatc cggatcctga gtttccaaca
      901 gtgaaatacc cgaatcccga agaggggaaa ggtgtcttga ctttgtcttt tgctttggct
      961 gacaaaacca aggccagaat tgttttagct aacgacccgg atgctgatag acttgctgtg
     1021 gcagaaaagc aagacagtgg tgaatggagg gtgttttcag gcaatgagtt gggggccctc
     1081 ctgggctggt ggctttttac atcttggaaa gagaagaacc aggatcgcag tgctctcaaa
     1141 gacacgtaca tgttgtccag caccgtctcc tccaaaatct tgcgggccat tgccttaaag
     1201 gaaggttttc attttgagga aacattaact ggctttaagt ggatgggaaa cagagccaaa
     1261 cagctaatag accaggggaa aactgtttta tttgcatttg aagaagctat tggatacatg
     1321 tgctgccctt ttgttctgga caaagatgga gtcagtgccg ctgtcataag tgcagagttg
     1381 gctagcttcc tagcaaccaa gaatttgtct ttgtctcagc aactaaaggc catttatgtg
     1441 gagtatggct accatattac taaagcttcc tattttatct gccatgatca agaaaccatt
     1501 aagaaattat ttgaaaacct cagaaactac gatggaaaaa ataattatcc aaaagcttgt
     1561 ggcaaatttg aaatttctgc cattagggac cttacaactg gctatgatga tagccaacct
     1621 gataaaaaag ctgttcttcc cactagtaaa agcagccaaa tgatcacctt cacctttgct
     1681 aatggaggcg tggccaccat gcgcaccagt gggacagagc ccaaaatcaa gtactatgca
     1741 gagctgtgtg ccccacctgg gaacagtgat cctgagcagc tgaagaagga actgaatgaa
     1801 ctggtcagtg ctattgaaga acattttttc cagccacaga agtacaatct gcagccaaaa
     1861 gcagactaaa atagtccagc cttgggtata cttgcattta cctacaatta agctgggttt
     1921 aacttgttaa gcaatatttt taagggccaa atgattcaaa acatcacagg tatttatgtg
     1981 ttttacaaag acctacattc ctcattgttt catgtttgac ctttaaggtg aaaaaagaaa
     2041 atggccaaac ccaacaaact aacattccta ctaaaaagtt gagcttggac atattttgaa
     2101 tttttgtaag tgaagatttt taaactgact aacttaaaaa aatagattgt aattgatgtg
     2161 ccttaatttg cataaatcat aaatgtaaaa aaaaaaaaaa aaaa
     MAAPEGSGLGEDARLDQETAQWLRWDKNSLTLEAVKRLIAEGNK
     EELRKCFGARMEFGTAGLRAAMGPGISRMNDLTIIQTTQGFCRYLEKQFSDLKQKGIV
     ISFDARAHPSSGGSSRRFARLAATTFISQGIPVYLFSDITPTPFVPFTVSHLKLCAGI
     MITASHNPKQDNGYKVYWDNGAQIISPHDKGISQAIEENLEPWPQAWDDSLIDSSPLL
     HNPSASINNDYFEDLKKYCFHRSVNRETKVKFVHTSVHGVGHSFVQSAFKAFDLVPPE
     AVPEQRDPDPEFPTVKYPNPEEGKGVLTLSFALADKTKARIVLANDPDADRLAVAEKQ
     DSGEWRVFSGNELGALLGWWLFTSWKEKNQDRSALKDTYMLSSTVSSKILRAIALKEG
     FHFEETLTGFKWMGNRAKQLIDQGKTVLFAFEEAIGYMCCPFVLDKDGVSAAVISAEL
     ASFLATKNLSLSQQLKAIYVEYGYHITKASYFICHDQETIKKLFENLRNYDGKNNYPK
     ACGKFEISAIRDLTTGYDDSQPDKKAVLPTSKSSQMITFTFANGGVATMRTSGTEPKI
     KYYAELCAPPGNSDPEQLKKELNELVSAIEEHFFQPQKYNLQPKAD
Chromosome 4
gene            1..2204
CDS             31..1869

Drosophilia: Pgm: phosphoglucomutase  
        1 atgtcgctaa cggtggaaat tgttgccaca aagccctatg agggtcagaa gccaggaacc
       61 agtggattgc gcaaaaaggt aaggtcttca ggtggcggaa aagctcgcac ttgcatttta
      121 taacttctga aatcgtttcc gaatctcagg ttaaggtttt cacccagccc aactacacgg
      181 agaactttgt ccaggccatc ttggaggcaa atggagctgc tctggttggt tccacccttg
      241 tagttggtgg agatggacgt ttctactgca aggaggctgc cgagctaatt gtgcggctat
      301 ccgctgccaa tggcgtttcc aagttgctgg tgggtcaaaa cggcatcctg tccacccctg
      361 ccgtatccag cctgatccgt cacaacaagg ctttgggtaa gttcaacgca ggcagccttc
      421 actgtgctcg taaagatttt aattgataag aagcatcttc acacaatcaa cgggtggcgg
      481 ctgttcgttg acagaggtcc ctggggtgca ataataacta tggattcaat cggttaacag
      541 agagttgctt actcgggcaa ccaaatttga atcgggtaaa attgatttag ggactcgtgc
      601 aatcgctaat cagactaacc tttaataaaa ttgtatggtg taattactta agcgaatttg
      661 atatacaaat ttgcttttaa tatctgtctt atactaacaa aagaccatct gtcaagctta
      721 cattattatt tcgcattata gaagcaatat tgcaaaatct ctattatctt aataatatga
      781 aatatttaaa tctaagcttt tgttgtactt actcaaacag tttattcaca ttaaaggtgg
      841 cctctttgga atataaaatt gttttagatg cctaggcaca cccaactaaa aaatatacac
      901 gatttaaaaa tgctttttta aaccttatag gcggcattgt tttgactgca tcccacaatc
      961 ccggtggtcc agagaatgat ttcggcatca agttcaactg cgagaacgga ggacctgccc
     1021 cggatgcgtt caccaaccac atctacaaga tcaccaccga gatcaaggag tacaagctgg
     1081 tgcgcaacct gcagatcgac atctcaaagg ttggtgtaac ctcgttcgac atcgccggaa
     1141 agccctttac cgtggaggtg atcgattcgg tggccaacta tgtgcgccac atggaggaaa
     1201 tcttcgactt cgccaagctg aaggacttcg taagtggcaa agccactgga aagcctctga
     1261 agatgcgcat cgatgcaatg aacggagtaa ctggctcata tgtgcgcgag atcttcctga
     1321 accggttggg tgccaccgaa tcatcggtgg tccacaccac tccactgccc gactttggtg
     1381 gtctgcatcc tgacccaaat ctcacatacg ccaaggacct ggttgacact gtcgcccagg
     1441 gagactatga cattggagct gccttcgatg gagatggtga ccgcaacatg atcattggca
     1501 gcaaggcgtt cttcgtaact cccagcgact cgctggcggt aattgcccac tacctggagg
     1561 ccataccgta cttccaaaag aatggtgttc aaggattcgc ccgcagtatg ccaactgcat
     1621 ccgctgtgga tttggtgggc agaaagttgg gcaaggaagt gtttgaggtt cccactggat
     1681 ggaagtactt cggtaatctc atggacgccg gaaggttgtg tctgtgcgga gaggagagct
     1741 tcggaactgg ctccaatcac atccgcgaaa aggatggcat ctgggcggtt ctcgcttgga
     1801 tctccgtgat gcagcacacg ggtaagggca tcgaagacat cctgaagcag cactggtctg
     1861 tgtatggacg caactatttc acccgctacg attatgagga gtgcgcttcc gatccttgca
     1921 acgagatggt ggccaccatg gagaagacca taactgctcc ggagttcgtc ggcaagagct
     1981 attccagcgg cggaaaaacc tacaaggtca aggaggccga caacttcagc tacacagatc
     2041 ctgtcgacaa gtcggtggcc acgaaacagg gtctgcgcat tgtgttcgag gatggcagcc
     2101 gcattgtggt gcgcctcagt ggaactggaa gctcgggagc aaccgttcgg tgagtcacga
     2161 tgagatttaa tatcaaataa ttcttttcaa taatcgatga attgttcctt ttcagcttgt
     2221 acattgattc ctatgagaag gagaatgttt tgggccaggc cagcgtgatg ctgaaaccct
     2281 tgatcgacat cgccctggag atctctcagc tgcccaagtt cactggacgc aacgctccaa
     2341 cggttatcac gtaa
     MSLTVEIVATKPYEGQKPGTSGLRKKVKVFTQPNYTENFVQAIL
     EANGAALVGSTLVVGGDGRFYCKEAAELIVRLSAANGVSKLLVGQNGILSTPAVSSLI
     RHNKALGGIVLTASHNPGGPENDFGIKFNCENGGPAPDAFTNHIYKITTEIKEYKLVR
     NLQIDISKVGVTSFDIAGKPFTVEVIDSVANYVRHMEEIFDFAKLKDFVSGKATGKPL
     KMRIDAMNGVTGSYVREIFLNRLGATESSVVHTTPLPDFGGLHPDPNLTYAKDLVDTV
     AQGDYDIGAAFDGDGDRNMIIGSKAFFVTPSDSLAVIAHYLEAIPYFQKNGVQGFARS
     MPTASAVDLVGRKLGKEVFEVPTGWKYFGNLMDAGRLCLCGEESFGTGSNHIREKDGI
     WAVLAWISVMQHTGKGIEDILKQHWSVYGRNYFTRYDYEECASDPCNEMVATMEKTIT
     APEFVGKSYSSGGKTYKVKEADNFSYTDPVDKSVATKQGLRIVFEDGSRIVVRLSGTG
     SSGATVRLYIDSYEKENVLGQASVMLKPLIDIALEISQLPKFTGRNAPTVIT
     gene            <1..>2354
     mRNA            join(<1..78,150..396,931..2149,2216..>2354)
     CDS             join(1..78,150..396,931..2149,2216..2354)

MOUSE: Pgm1  
1 gagagccgca gccactgtcg cctcgcagcc aaccgccacc atggtgaaga tcgtgacagt
       61 gaagacgcag gcatatccgg atcagaagcc gggcaccagc ggattgcgga agcgagtgaa
      121 ggttttccag agcaacgcca actatgcgga gaatttcatc cagagcatcg tctctaccgt
      181 ggagccggcg ctgaggcagg aggccacgct ggttgtgggc ggggacggcc gcttctacat
      241 gaccgaggcc atccagctca tcgtacgcat cgctgcagcc aacgggattg gtcgcctggt
      301 tattgggcag aatggaatac tctccacccc tgccgtatct tgcatcatcc gaaaaatcaa
      361 agctattggt gggatcattc tgacagccag ccataatcca ggagggccca atggagattt
      421 tggaattaaa ttcaatattt ctaatggggg tcctgctcca gaagcaatca ctgataaaat
      481 tttccaaatc agcaagacaa tcgaagaata tgccatttgc cctgacttga aggtagacct
      541 cggtgttctg ggaaagcagc agtttgactt ggaaaacaag ttcaagccct tcacagtgga
      601 gattgtggac tcagtggagg cctatgccac aatgctgaga aacatcttcg atttcaacgc
      661 actgaaggag ctactctctg gtccaaacag actgaagatc cgcatagacg ccatgcacgg
      721 agttgtggga ccgtacgtaa agaagatcct ctgtgaagaa cttggtgccc ctgcaaactc
      781 agctgtgaac tgtgttcccc tggaggattt tggaggccac catcccgacc ccaatctcac
      841 ctatgctgct gacctagtgg agaccatgaa gtcaggagag catgatttcg gggctgcctt
      901 tgatggtgac ggggatcgaa acatgattct gggcaagcac gggttctttg tgaatccttc
      961 tgactctgtg gctgtcatcg ctgccaacat cttcagcatt ccgtacttcc agcagaccgg
     1021 ggtccgtggc tttgcacgca gcatgcccac aagtggtgct ctggaccggg tagcaaatgc
     1081 cacaaagatc gctttgtatg agaccccaac tggctggaag ttttttggga atttgatgga
     1141 tgcaagcaag ctgtccctct gtggagagga gagctttggg accggttcgg accatatccg
     1201 agagaaagat ggactgtggg ccgtcctggc ctggctctcc attctggcca cccgcaaaca
     1261 gagcgtggag gacatcctca aagaccactg gcagaagttt ggtcggaact tctttaccag
     1321 gtatgactac gaggaggtgg aagctgaggg tgcaaacaaa atgatgaagg acctggaggc
     1381 cctgatgctg gaccgctcct ttgtggggaa gcagttctca gcaaacgata aagtctacac
     1441 tgtggagaaa gcggataact ttgaatatag tgacccagta gatggaagca tttcaaaaaa
     1501 tcagggcttg cggcttattt ttgcagatgg ttctcgtatc atcttcagac tgagtggcac
     1561 cgggagtgca ggggctacca tccggctgta tattgatagc tacgagaagg acgttgccaa
     1621 gatcaaccag gacccccagg tgatgctggc gcccctgatc tccattgctc tgaaagtgtc
     1681 ccagctccag gagaggacgg gtcgcactgc gcccactgtc atcacctaga aagatggcca
     1741 gatgtggcac gtccctcccc caggactatc cacgccacct gattgaagag cacggacaga
     1801 aacagtgtat ttgcctgggc cttttaggac tcggtcttga ttttttactt cccactttga
     1861 taaacagcca tttgtgaggc actgccactg tgtgggggag agggaaagca gacccgaggg
     1921 cctgcacctg tgtctgttcc ttctcttgcc ctattaaatt gctgctgtgc g
     MVKIVTVKTQAYPDQKPGTSGLRKRVKVFQSNANYAENFIQSIV
     STVEPALRQEATLVVGGDGRFYMTEAIQLIVRIAAANGIGRLVIGQNGILSTPAVSCI
     IRKIKAIGGIILTASHNPGGPNGDFGIKFNISNGGPAPEAITDKIFQISKTIEEYAIC
     PDLKVDLGVLGKQQFDLENKFKPFTVEIVDSVEAYATMLRNIFDFNALKELLSGPNRL
     KIRIDAMHGVVGPYVKKILCEELGAPANSAVNCVPLEDFGGHHPDPNLTYAADLVETM
     KSGEHDFGAAFDGDGDRNMILGKHGFFVNPSDSVAVIAANIFSIPYFQQTGVRGFARS
     MPTSGALDRVANATKIALYETPTGWKFFGNLMDASKLSLCGEESFGTGSDHIREKDGL
     WAVLAWLSILATRKQSVEDILKDHWQKFGRNFFTRYDYEEVEAEGANKMMKDLEALML
     DRSFVGKQFSANDKVYTVEKADNFEYSDPVDGSISKNQGLRLIFADGSRIIFRLSGTG
     SAGATIRLYIDSYEKDVAKINQDPQVMLAPLISIALKVSQLQERTGRTAPTVIT
CDS             41..1729
source          1..1971

Other organisms:
PSEAB, PSEAE, PSEPK, PSESM, BACSU, STAA3, STAA8, STAAB, STAAC, STAAM, STAAN, STAAR, STAAS, STAAW, STAEQ, STAES, STAHJ, STAS1, BOVIN, DICDI, MACFA, MOUSE, PARTE, RABIT,   RAT, YEAST, DICDI, MOUSE, PARTE, PONAB, YEAST, ARATH, MAIZE, ARATH, MAIZE, BROIN, MESCR, C_PEA, POPTN, SOLTU, THEKO, ARATH, BRANA, P_PEA, SOLTU, ASPFU, ASPOR, DROME, DROSI, ECOLI, EMENI, ENTDI, ENTHI, KOMXY, NEIGO, NEIMA, NEIMB, RHIRD, SCHPO, XANCB, XANCP

#### 5.3.1.9

ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: GPI
        1 ctcgagagct ccgccatggc cgctctcacc cgggaccccc agttccagaa gctgcagcaa
       61 tggtaccgcg agcaccgctc cgagctgaac ctgcgccgcc tcttcgatgc caacaaggac
      121 cgcttcaacc acttcagctt gaccctcaac accaaccatg ggcatatcct ggtggattac
      181 tccaagaacc tggtgacgga ggacgtgatg cggatgctgg tggacttggc caagtccagg
      241 ggcgtggagg ccgcccggga gcggatgttc aatggtgaga agatcaacta caccgagggt
      301 cgagccgtgc tgcacgtggc tctgcggaac cggtcaaaca cacccatcct ggtagacggc
      361 aaggatgtga tgccagaggt caacaaggtt ctggacaaga tgaagtcttt ctgccagcgt
      421 gtccggagcg gtgactggaa ggggtacaca ggcaagacca tcacggacgt catcaacatt
      481 ggcattgtcg gctccgacct gggacccctc atggtgactg aagcccttaa gccatactct
      541 tcaggaggtc cccgcgtctg gtatgtctcc aacattgatg gaactcacat tgccaaaacc
      601 ctggcccagc tgaacccgga gtcctccctg ttcatcattg cctccaagac ctttactacc
      661 caggagacca tcacgaatgc agagacggcg aaggagtggt ttctccaggc ggccaaggat
      721 ccttctgcag tggcgaagca ctttgttgcc ctgtctacta acacaaccaa agtgaaggag
      781 tttggaattg accctcaaaa catgttcgag ttctgggatt gggtgggagg acgctactcg
      841 ctgtggtcgg ccatcggact ctccattgcc ctgcacgtgg gttttgacaa cttcgagcag
      901 ctgctctcgg gggctcactg gatggaccag cacttccgca cgacgcccct ggagaagaac
      961 gcccccgtct tgctggccct gctgggtatc tggtacatca actgctttgg gtgtgagaca
     1021 cacgccatgc tgccctatga ccagtacctg caccgctttg ctgcgtactt ccagcagggc
     1081 gacatggagt ccaatgggaa atacatcacc aaatctggaa cccgtgtgga ccaccagaca
     1141 ggccccattg tgtgggggga gccagggacc aatggccagc atgcttttta ccagctcatc
     1201 caccaaggca ccaagatgat accctgtgac ttcctcatcc cggtccagac ccagcacccc
     1261 atacggaagg gtctgcatca caagatcctc ctggccaact tcttggccca gacagaggcc
     1321 ctgatgaggg gaaaatcgac ggaggaggcc cgaaaggagc tccaggctgc gggcaagagt
     1381 ccagaggacc ttgagaggct gctgccacat aaggtctttg aaggaaatcg cccaaccaac
     1441 tctattgtgt tcaccaagct cacaccattc atgcttggag ccttggtcgc catgtatgag
     1501 cacaagatct tcgttcaggg catcatctgg gacatcaaca gctttgacca gtggggagtg
     1561 gagctgggaa agcagctggc taagaaaata gagcctgagc ttgatggcag tgctcaagtg
     1621 acctctcacg acgcttctac caatgggctc atcaacttca tcaagcagca gcgcgaggcc
     1681 agagtccaat aaactcgtgc tcatctgcag cctcctctgt gactcccctt tctcttctcg
     1741 tccctcctcc ccggagccgg cactgcatgt tcctggacac cacccagagc accctctggt
     1801 tgtgggcttg gaccacgagc ccttagcagg gaaggctggt ctcccccagc ctaaccccca
     1861 gcccctccat gtctatgctc cctctgtgtt agaattggct gaagtgtttt tgtgcagctg
     1921 acttttctga cccatgttca cgttgttcac atcccatgta gaaaaacaaa gatgccacgg
     1981 aggaggt
     MAALTRDPQFQKLQQWYREHRSELNLRRLFDANKDRFNHFSLTL
     NTNHGHILVDYSKNLVTEDVMRMLVDLAKSRGVEAARERMFNGEKINYTEGRAVLHVA
     LRNRSNTPILVDGKDVMPEVNKVLDKMKSFCQRVRSGDWKGYTGKTITDVINIGIVGS
     DLGPLMVTEALKPYSSGGPRVWYVSNIDGTHIAKTLAQLNPESSLFIIASKTFTTQET
     ITNAETAKEWFLQAAKDPSAVAKHFVALSTNTTKVKEFGIDPQNMFEFWDWVGGRYSL
     WSAIGLSIALHVGFDNFEQLLSGAHWMDQHFRTTPLEKNAPVLLALLGIWYINCFGCE
     THAMLPYDQYLHRFAAYFQQGDMESNGKYITKSGTRVDHQTGPIVWGEPGTNGQHAFY
     QLIHQGTKMIPCDFLIPVQTQHPIRKGLHHKILLANFLAQTEALMRGKSTEEARKELQ
     AAGKSPEDLERLLPHKVFEGNRPTNSIVFTKLTPFMLGALVAMYEHKIFVQGIIWDIN
     SFDQWGVELGKQLAKKIEPELDGSAQVTSHDASTNGLINFIKQQREARVQ
     mRNA            <1..1987
     CDS             16..1692

MOUSE: GPI
        1 caattccgct tccgagcacg tcctgctccg tgtacctctc gggtccctcg ccatggctgc
       61 gctcacccgg aacccgcagt tccagaagct cctggagtgg caccgcgcga actctgccaa
      121 cctcaagctg cgcgaacttt ttgaggcgga tccggagcgc ttcaacaact tcagcttgaa
      181 cctcaacacc aaccatgggc atattctggt ggactactcc aagaaccttg tgaacaagga
      241 ggtgatgcag atgctggtgg agctggccaa gtccagaggc gtggaggctg cacgggacaa
      301 catgttcagt ggttccaaga tcaactacac cgaggatcgg gcggtgctgc atgtggccct
      361 tcggaaccgg tccaacacac ccatcaaggt ggacggcaaa gatgtgatgc cggaggtgaa
      421 cagggttctg gacaagatga agtctttctg ccagcgggtc cggagtggtg actggaaagg
      481 gtacactggc aaatccatca cggacatcat caacatcggc atcgggggct ctgacctggg
      541 acccctcatg gtgactgaag ctctcaagcc ttactcgaaa ggaggtcccc gtgtctggtt
      601 tgtctctaac attgatggga cccacattgc caaaacactg gccagcttgt cccctgagac
      661 ttccctcttt ataatcgcct ccaagacctt caccacccag gagaccatca ccaatgcaga
      721 gacagcaaag gagtggtttc tcgaagcggc caaggatcca tctgcagttg caaagcactt
      781 tgtcgccctg tctacgaaca cggccaaagt gaaagagttt ggaattgacc ctcaaaacat
      841 gttcgagttc tgggattggg taggtggccg ctattcgctg tggtcagcca ttggactttc
      901 cattgctctg catgtaggtt ttgaccactt cgagcagctg ctgtccgggg ctcactggat
      961 ggaccagcac ttcctcaaga cgcccctgga gaagaatgcc cccgtcctgc tggctctact
     1021 gggcatctgg tacatcaact gctacggctg tgagacccac gccttgctgc cctatgacca
     1081 gtacatgcac cgctttgctg cctatttcca gcagggtgac atggagtcca acggaaagta
     1141 catcaccaag tccggggccc gtgtggacca ccagacaggc cccatcgtgt ggggggaacc
     1201 agggaccaat ggtcaacatg cattctacca gctcatccac caaggcacca agatgatacc
     1261 ctgtgacttt ctcatccctg tccagaccca gcaccccata cggaaaggtc tgcatcacaa
     1321 gatcctcctg gctaacttct tggcccagac tgaggccctg atgaagggga agttgcctga
     1381 agaggccagg aaggagctcc aggctgccgg aaagagccca gaagacttgg agaaactctt
     1441 gccacacaag gtctttgaag gaaaccgccc gaccaactct attgtgttta ccaagctgac
     1501 acccttcatt ctgggggcct tgattgccat gtatgagcac aagatctttg ttcagggcat
     1561 catgtgggac atcaacagct tcgaccagtg gggagtggag ctggggaagc agctggccaa
     1621 gaaaattgag ccggagctgg agggcagctc tgctgtgacc tcccatgatt cctccactaa
     1681 cggactgatc agcttcatca agcaacagcg ggacaccaaa ctagaataac tccagccgcg
     1741 gccctactga ctggtcctcc gtgtcccttc tcaccatatg cactgcatgg tcctgcccct
     1801 ccctgcccag agcgcaccac cggtagttgg cctggactac aaggctgttg ggagaagctg
     1861 gtctggaact gccatccacc cactacgcac cctccctgtt gaagctgatg gaagggcttt
     1921 gacgtgtcat gttgttctga cctgtatttc acaccccagc tagaataaag acacctagag
     1981 gaggc
     MAALTRNPQFQKLLEWHRANSANLKLRELFEADPERFNNFSLNL
     NTNHGHILVDYSKNLVNKEVMQMLVELAKSRGVEAARDNMFSGSKINYTEDRAVLHVA
     LRNRSNTPIKVDGKDVMPEVNRVLDKMKSFCQRVRSGDWKGYTGKSITDIINIGIGGS
     DLGPLMVTEALKPYSKGGPRVWFVSNIDGTHIAKTLASLSPETSLFIIASKTFTTQET
     ITNAETAKEWFLEAAKDPSAVAKHFVALSTNTAKVKEFGIDPQNMFEFWDWVGGRYSL
     WSAIGLSIALHVGFDHFEQLLSGAHWMDQHFLKTPLEKNAPVLLALLGIWYINCYGCE
     THALLPYDQYMHRFAAYFQQGDMESNGKYITKSGARVDHQTGPIVWGEPGTNGQHAFY
     QLIHQGTKMIPCDFLIPVQTQHPIRKGLHHKILLANFLAQTEALMKGKLPEEARKELQ
     AAGKSPEDLEKLLPHKVFEGNRPTNSIVFTKLTPFILGALIAMYEHKIFVQGIMWDIN
     SFDQWGVELGKQLAKKIEPELEGSSAVTSHDSSTNGLISFIKQQRDTKLE
     gene            1..1985
     mRNA            1..1985
     CDS             53..1729

Drosophilia: PGI
        1 taagcagccg gatccgctat tataagtgaa gtgtcgcgag cggtcgaagc agttcgcctg
       61 tgctctcttc tccgtgtgct actaatttgc atcgagtgct aaatagtcct cccttgccct
      121 tctactccgc atccgcctgc tgttcctgct tgggataact gaagtaagat ggccggccca
      181 cttcctccgc ttaaccagga ggcagcgttc cagaagctgc aggagtacta cgactccaag
      241 ggcaaggacc tgaacatcaa ggacctgttc gtgaaggatt ccaagagatt ctcaaaatac
      301 aggtgggttt ttgtgtcgat ttcgcctcag agggtggaag ttacgtatct agttcccgca
      361 tacatacact cattcgtgta tcccccatcg gcaatcgttt attcatcgag ttgcgctttg
      421 cccactttca ctttcaccat cggctgtcga gtgtcgccgc cactcgattt gtccttgcgt
      481 aaggtcacag caacgacctc cgaatcgtac ttgctctgag gtcaaatgtt tttcgtttgt
      541 ttatcagcct gcgcctgcac acccagaacg atggcgagat actgctggac tactcgaaga
      601 accgtatcaa tgacgaggtc tgggatctgc tcctcaccct ggccaaggtg cgccgcgtta
      661 acgccgcgcg ggacgccatg ttctccggcc agcacattaa catcacggag aaccgcgccg
      721 tcctccacac ggccctgcgc aaccgcggca cggatcccgt cctggtggac gacaaggacg
      781 tgatgcccga tgtgcgcgcc gaactggccc acatgaagga gttcaccaac atggtcatct
      841 ccggcgtgtg gcgcggctgc accggcaaac agatcaccga cgtggtcaac atcggcatcg
      901 gtggctccga tctgggcccg ctgatggtca ccgaagcgct gaagccctac ggcaagggcc
      961 ttcactccca ctttgtgtcg aacatcgatg gcactcatct ggccgaggtc ctcaagaagg
     1021 tcaactacga gaccaccctc ttcattgtcg cctcaaaaac tttcaccacc caggagacca
     1081 ttacgaacgc cacctccgcc aagacctggc tcctggagca ttccaaggag gtaagtacag
     1141 cgaaaggtcg aacattaaat gaccttcatt gatagcgctt taagcaaaga taaccaaact
     1201 aatacaatga accatcaatg gaccctagtg atttttctta tcattctata agaaccattt
     1261 tgacgtgttc aagctatcaa atcaatttaa tgtgcttatc aaatgcagcc tatggactta
     1321 atcaaaggct aaatcggatt tcaaattcga ataaaatgtt tccaatatga aattccactt
     1381 gccttaaatg taaaatagat aacgcagcca aagcaaatag ttacatcaca acattttagt
     1441 ctgacctata tttgcaaact atttttgttt tgttttagcc tgagtccgtg gccaagcatt
     1501 ttgtggccct gtcgaccaac aaggaaaagg tcaccgaatt cggcattgac agcaccaaca
     1561 tgttcggttt ttgggattgg gtgggcggtc gctactccct gtggtcggcc attggactgt
     1621 caatctgtct gtccattggc tttgagaact ttgagcaact gctggatgga gctcacttca
     1681 tggacaacca tttcaagacg acaccattcg agaagaatgt aagactcaac tgagagttaa
     1741 gtaaaatgat tatagttaac cattttattg gctttcctag gctcctgtta tcctggcgtt
     1801 gctaggcatt tggtactcca acttcttcaa ggcggaaaca catgccctcc ttccctacga
     1861 tcagtacttg caccggttcg ccgcctactt ccagcagggc gatatggaga gcaacggcaa
     1921 gttcgtcagc aagtcgggca aacccgtcaa gtacagcact ggtccgatcg tgtggggcga
     1981 gcctggcacc aatggccagc acgccttcta ccagctcatc caccagggca cccgcctgat
     2041 cccctgcgat ttcatcgctc ccgcccagac acacaatccc attgccggcg gcaagcacca
     2101 caagattctg ctatcgaatt tccttgccca gacggaggct ttaatggccg gaaagacggt
     2161 cgacgaggcc aggaccgagc tgtccaaggc tggcctgtgc ggcaacgagc tggataactt
     2221 gttgccccac aaggtgttcg tcggcaaccg gcccacaaac tcgattgtgg tgaagaaggt
     2281 ttcacctttc accctaggcg cgttgattgg tacgtctcac tgtttcagct cacgagcacc
     2341 tattaatgtc aattgatttt gcagcgctgt acgagcacaa gatcttcgtt cagggcatca
     2401 tttgggacat caactcgttc gaccaatggg gtgtggagct gggcaagcag ctggccaagg
     2461 ccatcgagcc ggagctggat cactgcaacg aggtctccac gcacgacagt tccacgaacg
     2521 gtctaattaa cttcatcaaa gccaattgga agtaatcatg tc
     MAGPLPPLNQEAAFQKLQEYYDSKGKDLNIKDLFVKDSKRFSKY
     SLRLHTQNDGEILLDYSKNRINDEVWDLLLTLAKVRRVNAARDAMFSGQHINITENRA
     VLHTALRNRGTDPVLVDDKDVMPDVRAELAHMKEFTNMVISGVWRGCTGKQITDVVNI
     GIGGSDLGPLMVTEALKPYGKGLHSHFVSNIDGTHLAEVLKKVNYETTLFIVASKTFT
     TQETITNATSAKTWLLEHSKEPESVAKHFVALSTNKEKVTEFGIDSTNMFGFWDWVGG
     RYSLWSAIGLSICLSIGFENFEQLLDGAHFMDNHFKTTPFEKNAPVILALLGIWYSNF
     FKAETHALLPYDQYLHRFAAYFQQGDMESNGKFVSKSGKPVKYSTGPIVWGEPGTNGQ
     HAFYQLIHQGTRLIPCDFIAPAQTHNPIAGGKHHKILLSNFLAQTEALMAGKTVDEAR
     TELSKAGLCGNELDNLLPHKVFVGNRPTNSIVVKKVSPFTLGALIALYEHKIFVQGII
     WDINSFDQWGVELGKQLAKAIEPELDHCNEVSTHDSSTNGLINFIKANWK
     gene            join(169..302,548..1130,1479..1718,1781..2309,2365..2555)
     CDS             join(169..302,548..1130,1479..1718,1781..2309,2365..2555)

Other organisms:
CHRSD, CHRVO, CLAAR, CLACO, CLAFR, CLALE, CLAMI, CLARO, CLAWI, CLAXA, COLP3, CUPNJ, NEIG1, NEIMA, NEIMB, PSEPK, RHIME, RHOJR, STRAW, STRCO, THIDA, CHRSD, CHRVO, CLACO, CLALE, CLAXA, COLP3, CUPNJ, NEIG1, NEIMA, NEIMB, PSEPK, RHIME, RHOJR, STRAW, STRCO, THIDA, CLALE, RHOJR, RHOJR, GEOSE, ORYSJ, GEOSE, ORYSJ, ARATH, ACAM1, ACHLI, ACIAD, ACIB3, ACIB5, ACIBC, ACIBS, ACIBT, ACIBY, ACILW, ACTP2, ACTP7, ACTPJ, AERHH, AERS4, AGABI, AGRFC, AGRRK, AGRVS, ALCBS, ALIF1, ALIFM, ALISL, ALKMQ, ALTMD, ANAD2, ANADE, ANASK, ANAVT, ARAHG, ARALP, ARATH, AROAE, ASHGO, ASPOR, AYWBP, BACAH, BACAN, BACC0, BACC1, BACC2, BACC4, BACC7, BACCN, BACCR, BACCZ, BACFN, BACFR, BACHD, BACHK, BACLD, BACP2, BACSK, BACSU, BACTN, BACV8, BACVZ, BACWK, BARBK, BARHE, BARQU, BAUCH, BEII9, BIFLO, BLOFL, BLOPB, BORA1, BORAP, BORBP, BORBR, BORBU, BORBZ, BORPA, BORPD, BORPE, BOVIN, BRUA1, BRUA2, BRUAB, BRUC2, BRUMB, BRUME, BRUO2, BRUSI, BRUSU, BUCA5, BUCAI, BUCAP, BUCAT, BUCBP, BUCCC, BURA4, BURCA, BURCC, BURCJ, BURL3, BURM1, BURM7, BURM9, BURMA, BURMS, BURP0, BURP1, BURP6, BURPS, BURTA, CALFI, CALS4, CAMJD, CAMJE, CANAL, CANGA, CARHZ, CAUSK, CAUVC, CAUVN, CHESB, CHLAB, CHLCH, CHLCV, CHLFF, CHLL7, CHLMU, CHLPD, CHLPN, CHLT2, CHLTA, CHLTB, CHLTE, CHLTR, CITK8, CLOAB, CLOB1, CLOB8, CLOBA, CLOBB, CLOBH, CLOBK, CLOBL, CLOBM, CLONN, CLOP1, CLOPE, CLOPS, CLOTE, CLOTH, CORDI, COREF, CORGB, CORGL, CORJK, CORK4, COXB1, COXB2, COXBN, COXBR, COXBU, CRIGR, CROS8, CUPMC, CUPTR, CUTAK, CYAP4, CYAP7, DECAR, DEIDV, DEIGD, DEIRA, DESAH, DESAL, DESHD, DESHY, DESMR, DESOH, DESPS, DICDI, DROME, DROSI, DROYA, ECO24, ECO27, ECO45, ECO55, ECO57, ECO5E, ECO7I, ECO81, ECO8A, ECOBW, ECODH, ECOHS, ECOK1, ECOL5, ECOL6, ECOLC, ECOLI, ECOLU, ECOSE, ECOSM, ECOUT, EDWI9, ENCCU, ENT38, ENTFA, ERWT9, ERYLH, ESCF3, EXIS2, FRACC, FRAP2, FRAT1, FRATF, FRATH, FRATM, FRATN, FRATO, FRATT, FRATW, FUSNN, GEOBB, GEODF, GEOKA, GEOMG, GEOSL, GEOSM, GEOTN, GEOUR, GLOVI, GRAFK, HAEDU, HAEI8, HAEIE, HAEIG, HAEIN, HAEPS, HAES1, HAHCH, HALMA, HALSA, HALWD, HAMD5, HELAH, HELMI, HELP2, HELPG, HELPH, HELPJ, HELPS, HELPY, HISS2, HUMAN, HYDCU, IDILO, JANSC, KLEOX, KLEP3, KLEP7, KLULA, LACAC, LACBA, LACCB, LACDA, LACFE, LACGA, LACH4, LACJO, LACLA, LACLM, LACLS, LACP3, LACP7, LACPL, LACRD, LACRJ, LACS1, LACSS, LARHH, LEGPA, LEGPH, LEGPL, LEGPN, LEIME, LEPBA, LEPBJ, LEPBL, LEPBP, LEPCP, LEPIC, LEPIN, LEUCK, LEUMM, LISIN, LISMF, LISMO, LISW6, MACFA, MAGMM, MAGSA, MAIZE, MANSM, MARMS, MESFL, METCA, METFK, METJA, METMP, METPP, METSB, MICAN, MOUSE, MYCA1, MYCBO, MYCBP, MYCBT, MYCCT, MYCGA, MYCGE, MYCGI, MYCH2, MYCH7, MYCHJ, MYCLB, MYCLE, MYCMM, MYCMO, MYCMS, MYCPA, MYCPE, MYCPN, MYCPU, MYCS2, MYCS5, MYCSM, MYCTA, MYCTO, MYCTU, MYCUA, MYCVP, MYXXD, NATPD, NEUCR, NITEU, NITMU, NITOC, NOCFA, NOSP7, NOSS1, NOVAD, OCEIH, OCHA4, OENOB, OENSH, ONYPE, PARD8, PARP8, PARPJ, PARUW, PARXL, PASMU, PECAS, PECCP, PEDPA, PELCD, PEPD6, PHOLL, PHOPR, I_PIG, PLAFA, POLNA, PONAB, PORGI, PROM0, PROM1, PROM2, PROM4, PROM5, PROM9, PROMA, PROMH, PROMM, PROMP, PROMS, PROMT, PSE14, PSEA6, PSEA7, PSEA8, PSEAB, PSEAE, PSEE4, PSEF5, PSEFL, PSEFS, PSEHT, PSEMY, PSEP1, PSEPF, PSEPG, PSEPW, PSESM, PSEU2, PSEU5, PSYA2, PSYCK, PSYIN, PYRAB, PYRFU, PYRHO, RABIT, RALPJ, RALSO, I_RAT, RHIE6, RHIEC, RHIL3, RHILO, RHILW, RHIME, RHOFT, RHOOB, RHORT, RHOS1, RHOS4, RHOS5, RHOSK, RIPO1, ROSCS, ROSDO, ROSS1, RUBXD, RUEPO, RUEST, SACD2, SALA4, SALAR, SALCH, SALDC, SALEP, SALG2, SALHS, SALNS, SALPA, SALPB, SALPC, SALPK, SALSV, SALTI, SALTY, SCHPO, SERP5, SHEAM, SHEB2, SHEB5, SHEB8, SHEB9, SHEDO, SHEFN, SHEHH, SHELP, SHEON, SHEPA, SHEPC, SHEPW, SHESA, SHESH, SHESM, SHESR, SHESW, SHEWM, SHIB3, SHIBS, SHIDS, SHIF8, SHIFL, SHISS, SINMW, SODGM, SPHAL, SPHWW, SPIOL, STAA1, STAA3, STAA8, STAAB, STAAC, STAAE, STAAM, STAAN, STAAR, STAAS, STAAW, STAEQ, STAES, STAHJ, STAS1, STRA1, STRA3, STRA5, STREM, STRGC, STRGG, STRM5, STRMK, STRMU, STRP1, STRP2, STRP3, STRP4, STRP6, STRP8, STRPB, STRPC, STRPD, STRPF, STRPG, STRPI, STRPM, STRPN, STRPQ, STRPS, STRPZ, STRR6, STRT1, STRT2, STRTD, SYMTH, SYNAS, SYNE7, SYNFM, SYNJA, SYNJB, SYNP6, SYNPX, SYNS9, SYNSC, SYNY3, THEEB, THELI, THEMA, THEP3, THEPX, THET2, THET8, TOLAT, TREDE, TREPA, TREPS, TRYBB, UNCTG, VIBC3, VIBCB, VIBCH, VIBCM, VIBPA, VIBTL, VIBVU, VIBVY, WIGBR, XANAC, XANC5, XANC8, XANCB, XANCI, XANCP, XANOM, XANOP, XANOR, XANP2, XYLF2, XYLFA, XYLFM, XYLFT, YEAST, YERE8, YERP3, YERPA, YERPB, YERPE, YERPG, YERPN, YERPP, YERPS, YERPY, ZYMMO, SINMW, THEGJ, THEKO, THEON, AERPE, AQUAE, CALBD, PYRAE, SACS2, SULAC, SULTO, THEAC, THEVO, 

#### 2.7.2.3

ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: PGK1
        1 aagcctccgg agcgcacgtc ggcagtcggc tccctcgttg accgaatcac cgacctctct
       61 ccccagctgt atttccaaaa tgtcgctttc taacaagctg acgctggaca agctggacgt
      121 taaagggaag cgggtcgtta tgagagtcga cttcaatgtt cctatgaaga acaaccagat
      181 aacaaacaac cagaggatta aggctgctgt cccaagcatc aaattctgct tggacaatgg
      241 agccaagtcg gtagtcctta tgagccacct aggccggcct gatggtgtgc ccatgcctga
      301 caagtactcc ttagagccag ttgctgtaga actcaaatct ctgctgggca aggatgttct
      361 gttcttgaag gactgtgtag gcccagaagt ggagaaagcc tgtgccaacc cagctgctgg
      421 gtctgtcatc ctgctggaga acctccgctt tcatgtggag gaagaaggga agggaaaaga
      481 tgcttctggg aacaaggtta aagccgagcc agccaaaata gaagctttcc gagcttcact
      541 ttccaagcta ggggatgtct atgtcaatga tgcttttggc actgctcaca gagcccacag
      601 ctccatggta ggagtcaatc tgccacagaa ggctggtggg tttttgatga agaaggagct
      661 gaactacttt gcaaaggcct tggagagccc agagcgaccc ttcctggcca tcctgggcgg
      721 agctaaagtt gcagacaaga tccagctcat caataatatg ctggacaaag tcaatgagat
      781 gattattggt ggtggaatgg cttttacctt ccttaaggtg ctcaacaaca tggagattgg
      841 cacttctctg tttgatgaag agggagccaa gattgtcaaa gacctaatgt ccaaagctga
      901 gaagaatggt gtgaagatta ccttgcctgt tgactttgtc actgctgaca agtttgatga
      961 gaatgccaag actggccaag ccactgtggc ttctggcata cctgctggct ggatgggctt
     1021 ggactgtggt cctgaaagca gcaagaagta tgctgaggct gtcactcggg ctaagcagat
     1081 tgtgtggaat ggtcctgtgg gggtatttga atgggaagct tttgcccggg gaaccaaagc
     1141 tctcatggat gaggtggtga aagccacttc taggggctgc atcaccatca taggtggtgg
     1201 agacactgcc acttgctgtg ccaaatggaa cacggaggat aaagtcagcc atgtgagcac
     1261 tgggggtggt gccagtttgg agctcctgga aggtaaagtc cttcctgggg tggatgctct
     1321 cagcaatatt tagtactttc ctgcctttta gttcctgtgc acagccccta agtcaactta
     1381 gcattttctg catctccact tggcattagc taaaaccttc catgtcaaga ttcagctagt
     1441 ggccaagaga tgcagtgcca ggaaccctta aacagttgca cagcatctca gctcatcttc
     1501 actgcaccct ggatttgcat acattcttca agatcccatt tgaatttttt agtgactaaa
     1561 ccattgtgca ttctagagtg catatattta tattttgcct gttaaaaaga aagtgagcag
     1621 tgttagctta gttctctttt gatgtaggtt attatgatta gctttgtcac tgtttcacta
     1681 ctcagcatgg aaacaagatg aaattccatt tgtaggtagt gagacaaaat tgatgatcca
     1741 ttaagtaaac aataaaagtg tccattg
     MSLSNKLTLDKLDVKGKRVVMRVDFNVPMKNNQITNNQRIKAAV
     PSIKFCLDNGAKSVVLMSHLGRPDGVPMPDKYSLEPVAVELKSLLGKDVLFLKDCVGP
     EVEKACANPAAGSVILLENLRFHVEEEGKGKDASGNKVKAEPAKIEAFRASLSKLGDV
     YVNDAFGTAHRAHSSMVGVNLPQKAGGFLMKKELNYFAKALESPERPFLAILGGAKVA
     DKIQLINNMLDKVNEMIIGGGMAFTFLKVLNNMEIGTSLFDEEGAKIVKDLMSKAEKN
     GVKITLPVDFVTADKFDENAKTGQATVASGIPAGWMGLDCGPESSKKYAEAVTRAKQI
     VWNGPVGVFEWEAFARGTKALMDEVVKATSRGCITIIGGGDTATCCAKWNTEDKVSHV
     STGGGASLELLEGKVLPGVDALSNI
     CDS             80..1333

MOUSE: Pgk1
        1 tcgacctcac ggtcttgcca aaatgtcgct ttccaacaag ctgactttgg acaagctgga
       61 cgtgaagggg aagcgggtcg tgatgagggt ggacttcaac gttcctatga agaacaacca
      121 gataacaaac aaccaaagga tcaaggctgc tgttccaagc atcaaattct gcttggacaa
      181 tggagccaac tccgttgtcc ttatgagcca cctgggccgg cctgatggtg ttcccatgcc
      241 tgacaagtac tccttagagc cagttgctgc tgaactcaaa tctctgctgg gcaaggatgt
      301 tctgttcttg aaggattgtg tgggcccaga agtcgagaat gcctgtgcca acccagcggc
      361 tgggactgtc atcctgctgg aaaacctccg ctttcatgta gaggaagaag ggaagggaaa
      421 agatgcttct gggaacaagg ttaaagctga gccggccaaa attgatgctt tccgagcctc
      481 actgtccaaa ctaggagatg tctatgtcaa tgatgctttt gggactgcac accgagccca
      541 tagctccatg gtgggtgtga atctgccaca gaaggctggt ggatttttga tgaagaagga
      601 gctgaactac tttgccaagg ctttggagag tcctgagcga cccttcctgg ctatcttggg
      661 aggcgctaaa gttgcagaca agatccagct gatcaataat atgctagaca aagtcaatga
      721 gatgatcatt ggtggtggaa tggcctttac cttccttaag gtcctcaaca acatggagat
      781 tggcacatct ctgtatgatg aagaaggagc caagattgtc aaagatctca tgtccaaagc
      841 tgagaaaaat ggtgtgaaga ttaccttgcc tgttgacttt gtcactgctg acaaatttga
      901 tgagaatgcc aagactggcc aagctactgt ggcctctggt atacctgctg gctggatggg
      961 cttggactgt ggtactgaga gcagcaagaa atatgccgag gctgtgggtc gagctaagca
     1021 gattgtttgg aatggtcctg ttggggtatt tgaatgggaa gcctttgcca ggggaaccaa
     1081 gtcactcatg gatgaggtgg tgaaagccac ttctaggggt tgcatcacta tcataggtgg
     1141 tggagacact gccacttgct gtgccaaatg gaacacagag gataaagtca gccatgtgag
     1201 cactgggggc ggtgccagtc tagagctcct ggaaggtaaa gtccttcctg gggtggatgc
     1261 tctcagcaat gtttagtatt ttctttcctg cctttggttc ctgtgctcct aagctaacct
     1321 gctgttttcc acatctccat ttggtgttag cgcaagattc agctagtggc tgagatgtgg
     1381 cacagacctt aacagtgcaa gcatctcagc tcgtcttact gcatcagatg ctggttcttc
     1441 aagatcccat ttaaattcct tagtgactaa aaccattgtg cattgtagag ggcgtctatt
     1501 tatattctgc ctgagaaagg aagtgagctg taaaggctga gctctctctc tgacgtatgt
     1561 agcctctggt tagcttcgtc actcactgtt cttgactcag catggcaatc tgatgaaatt
     1621 cccagctgta agtctgcaga aatttccgaa ttc
     MSLSNKLTLDKLDVKGKRVVMRVDFNVPMKNNQITNNQRIKAAV
     PSIKFCLDNGANSVVLMSHLGRPDGVPMPDKYSLEPVAAELKSLLGKDVLFLKDCVGP
     EVENACANPAAGTVILLENLRFHVEEEGKGKDASGNKVKAEPAKIDAFRASLSKLGDV
     YVNDAFGTAHRAHSSMVGVNLPQKAGGFLMKKELNYFAKALESPERPFLAILGGAKVA
     DKIQLINNMLDKVNEMIIGGGMAFTFLKVLNNMEIGTSLYDEEGAKIVKDLMSKAEKN
     GVKITLPVDFVTADKFDENAKTGQATVASGIPAGWMGLDCGTESSKKYAEAVGRAKQI
     VWNGPVGVFEWEAFARGTKSLMDEVVKATSRGCITIIGGGDTATCCAKWNTEDKVSHV
     STGGGASLELLEGKVLPGVDALSNV
     gene            1..1653
     CDS             23..1276

Drosophilia Melanogaster: Pgk
        1 gagaagatgt gtgattgact tggttggccc tcaacagaat catttattca ataattacat
       61 attgacatac aacatcaagg ggcggctgtt acatacggta tgtacatatg tatgtactgt
      121 cgtagattat tatttattaa acattttttt ttattatttt tataaattaa ttataaattt
      181 ttataaaaaa tcactaattc ggactttcag ttaaaattta acagacattc aagggtgtgg
      241 aagaaaaaag ttctaagggg ttaaaattta ttataaaaaa tttattaaaa aaaataattt
      301 ttatatgtat ttaagtgaaa atttatatga acggtttcta tttaagttaa tataaaaaaa
      361 atgtatactg taaatagcaa atgatcaatt aaatgatcta gtcagatatg gcagacattt
      421 attttgttaa tttttaggca tatgattatc tatggacaat atttaaatat tatgaaaata
      481 atgatatttt aaataataga tttttaaatt ttagaattgt gtggcccctt ttcgacaccc
      541 ttggaacgga tgcttcacag cactgtgctg acagcactta ccaacactgc ttgggcgcca
      601 aatacagagt tgcatttgga gagtacaact tttatccaac tttcgaacga gaatacaatc
      661 cgataccaac ttcggactcc aaaataggag tatacccagc tggatcctgc gcatggcacc
      721 taccaatcgg cggaaaaccg cttgccacgg attgacgccc tggaagtgga gatgcaaccc
      781 tagcagctca ccgacaaaat gaccttgcgc tgacattgcc gcacagcagt tgaggacgaa
      841 gaagattcgc ggaatcagtg gtatcgcaat ccggagtttg ctagcacgca caggaagtat
      901 ccagaaaatc cagaaaaatc caaagatggc cttcaataag ctgagcatcg aaaacctgga
      961 cttggcgggc aagcgggtgt tgatgcggta atccaaagcc aatcctcgcg tgaaattcag
     1021 ttgcataaac attgcccgtg cttctttgca gcgtcgactt caatgtgccc atcaaggagg
     1081 gcaagatcac cagcaaccag agaattgtcg ctgccttgga tagtatcaag ttggcccttt
     1141 ccaagaaagc caagtcggtg gtgctgatgt cccacttggg tcgtcccgat ggcaacaaga
     1201 acatcaagta caccctggca cccgtggccg ctgagctgaa gaccctgctt ggccaggatg
     1261 tgatcttcct aagtgactgc gtcggcagcg aagtggaggc cgcttgcaag gatcccgcac
     1321 cgggatccgt cattctgctg gagaacgtcc gcttctacgt ggaggaggag ggcaagggct
     1381 tggatgccag cggcggcaag gtcaaggccg atcctgccaa ggtcaaggag ttccgtgcca
     1441 gcctggccaa gctgggcgat gtctatgtca acgacgcctt cggcactgcc catcgcgccc
     1501 acagttccat gatgggcgat ggcttcgagc agcgcgcagc tggtctgttg ctgaacaagg
     1561 agctgaagta cttctcgcag gccctggaca agccaccaaa tcccttcctg gcaattctcg
     1621 gtggcgccaa ggtggccgac aagatccagc tgattgagaa ccttctggac aaggtcaacg
     1681 agatgatcat cggtggcggc atggccttca ccttcctgaa ggtcctcaac aacatgaaga
     1741 tcggcggttc cctgttcgac gaggagggct ccaagatcgt cgagaaactg gtggagaagg
     1801 ccaagaagaa taacgtgcag ttgcatctgc cagtggactt tgtctgcggc gacaagttcg
     1861 ccgagaacgc tgccgtcagc gaggccaccg tggaggccgg aattcccgat ggacacatgg
     1921 gtctggatgt gggtcccaag acccgtgagc tcttcgcggc acccatcgca cgcgccaagc
     1981 tcatcgtgtg gaacgggtag gtgtcacact gaagctactt ctccaaatgt cctataatgg
     2041 ttttcccatt ttagaccccc cggtgtcttt gagttcccca acttcgccaa cggcaccaag
     2101 tccatcatgg acggcgtggt ggccgccacc aagaacggca ccgtctccat catcggcggc
     2161 ggcgacactg cctcttgctg cgccaagtgg aacacggagg cactcgtctc gcacgtctcc
     2221 accggaggcg gcgcttcgct ggagctcctg gagggcaaga cactgccagg cgtgcgtgca
     2281 ttgaccagcg cctaagcgta catatatacg gtatattaat gttaatcgca tcgtttacct
     2341 tgtaagcaca aaccacgacg ttaaaaagtg ttgaatctat ttgttgcgga accatataat
     2401 gcatacgaaa taaaggaatc ctagtttatt tgcgggcaaa gttgctgtcc attgaggagg
     2461 cggtgcgctg tatgttgttg agattggccc ggatgcgatc gccaattgag ttatggttgg
     2521 caatggcctt cttcacctcc ttgttaatga acctccttgt cgaagtctcg ttcacgattt
     2581 ggcctct
     MAFNKLSIENLDLAGKRVLMRVDFNVPIKEGKITSNQRIVAALD
     SIKLALSKKAKSVVLMSHLGRPDGNKNIKYTLAPVAAELKTLLGQDVIFLSDCVGSEV
     EAACKDPAPGSVILLENVRFYVEEEGKGLDASGGKVKADPAKVKEFRASLAKLGDVYV
     NDAFGTAHRAHSSMMGDGFEQRAAGLLLNKELKYFSQALDKPPNPFLAILGGAKVADK
     IQLIENLLDKVNEMIIGGGMAFTFLKVLNNMKIGGSLFDEEGSKIVEKLVEKAKKNNV
     QLHLPVDFVCGDKFAENAAVSEATVEAGIPDGHMGLDVGPKTRELFAAPIARAKLIVW
     NGPPGVFEFPNFANGTKSIMDGVVAATKNGTVSIIGGGDTASCCAKWNTEALVSHVST
     GGGASLELLEGKTLPGVRALTSA
     gene            order(926..987,1052..1996,2055..2295)
     CDS             join(926..987,1052..1996,2055..2295)

Other animals:
BOVIN, CRIGR, HORSE, HUMAN, MACEU, MACFA, METAC, MOUSE, PANTR, 1_PIG, PONAB,   RAT, RHINI, TRYCO, HORSE, HUMAN, MACFA, METAC, MOUSE, 2_PIG, RHINI, CRIFA, TRYBB, CRIFA, LEIMA, LEIME, TRYBB, CRIFA, CUPNH, LEIMA, LEIME, TRYBB, TRYBB, TRYBB, TRYCO, ARATH, ARATH, CHLRE, PHYPA, SCEFU, SPIOL, TOBAC, VOLCA, WHEAT, CUPNH, THEMA, ARATH, TOBAC, WHEAT, ACAM1, ACHLI, ACIAC, ACIAD, ACIB3, ACIB5, ACIBC, ACIBS, ACIBT, ACIBY, ACIC5, ACIET, ACIF2, ACIF5, ACISJ, ACTP2, ACTP7, ACTPJ, ACTSZ, AERHH, AERPE, AERS4, AGABI, AGRFC, AGRVS, AKKM8, ALCBS, ALIF1, ALIFM, ALISL, ALKEH, ANAD2, ANADE, ANADF, ANASK, ANAVT, ANOFW, APLCA, AQUAE, ARCB4, ARCFU, AROAE, ARTS2, ASHGO, ASPOR, AZOC5, AZOSB, AZOVD, BACAA, BACAC, BACAH, BACAN, BACC0, BACC1, BACC2, BACC3, BACC4, BACC7, BACCE, BACCN, BACCQ, BACCZ, BACHD, BACHK, BACLD, BACMD, BACP2, BACSK, BACSU, BACTN, BACWK, BARBK, BARHE, BARQU, BART1, BAUCH, BDEBA, BEUC1, BIFAA, BIFLD, BIFLO, BIFLS, BLOFL, BLOPB, BORAP, BORBP, BORBR, BORBU, BORBZ, BORDL, BORHD, BORPA, BORPE, BORRA, BORT9, BRADU, BREBN, BRUAB, BRUME, BRUSU, BUCA5, BUCAI, BUCAP, BUCAT, BUCBP, CAEEL, CALS4, CAMC1, CAMC5, CAMFF, CAMHC, CAMJ8, CAMJD, CAMJE, CAMJJ, CAMJR, CAMLR, CANAL, CANGA, CANMA, CARHZ, CAUSK, CAUVC, CAUVN, CELJU, CHESB, CHICK, CHLAA, CHLAB, CHLAD, CHLCH, CHLCV, CHLFF, CHLL2, CHLL7, CHLMU, CHLP8, CHLPB, CHLPD, CHLPM, CHLPN, CHLSY, CHLT2, CHLT3, CHLTA, CHLTB, CHLTE, CHLTR, CHRVO, CLAM3, CLAMS, CLOAB, CLOB1, CLOB6, CLOB8, CLOBA, CLOBB, CLOBH, CLOBJ, CLOBK, CLOBL, CLOBM, CLOK1, CLOK5, CLONN, CLOP1, CLOPA, CLOPE, CLOPS, CLOTE, COLP3, CONMG, COPPD, CORA7, CORDI, COREF, CORGB, CORGL, CORJK, CORK4, CORU7, COXBU, CROS8, CUTAK, CYAP4, CYAP7, DEBHA, DECAR, DEIDV, DEIGD, DEIRA, DESAD, DESAH, DESAL, DESAP, DESDA, DESOH, DESPS, DESVH, DESVM, DESVV, DICDI, DICT6, DICTD, DINSH, DROME, ECO24, ECO57, ECOHS, ECOK1, ECOL5, ECOL6, ECOLC, ECOLI, ELUMP, EMENI, ENT38, ENTFA, ERWT9, EUPCR, EXIS2, EXISA, FERNB, FINM2, FRAAA, FRACC, FRAP2, FRASN, FRAT1, FRATF, FRATH, FRATM, FRATN, FRATO, FRATT, FRATW, FUNMO, FUSNN, GEOBB, GEODF, GEOKA, GEOLS, GEOMG, GEOSE, GEOSM, GEOSW, GEOUR, GLACH, GLOVI, GLUOX, GRABC, HAEDU, HAEI8, HAEIE, HAEIG, HAEIN, HAHCH, HALHL, HALLT, HALMA, HALS3, HALSA, HALVA, HELHP, HELPJ, HELPY, HERA2, HERAR, HISS2, HYDS0, HYPJE, HYPRU, JANMA, JANSC, KINRD, KLEP3, KLULA, KORVE, LACAC, LACBA, LACCB, LACDA, LACDB, LACDE, LACDL, LACF3, LACGA, LACH4, LACJO, LACLA, LACLM, LACLS, LACP3, LACPL, LACRJ, LACS1, LACSS, LARHH, LEGPA, LEGPC, LEGPH, LEGPL, LEIXX, LEPBA, LEPBJ, LEPBL, LEPBP, LEPCP, LEPIC, LEPIN, LEUCK, LEUMM, LISIN, LISMC, LISMF, LISMH, LISMO, LISW6, MACCJ, MANSM, MARHV, MARMM, MARMS, METBR, METC4, METCA, METEP, METFK, METFV, METJA, METKA, METLZ, METMA, METMP, METPB, METRJ, METS5, METTH, MICAN, MICLC, MOOTA, MYCA1, MYCA9, MYCAV, MYCBO, MYCBP, MYCBT, MYCGA, MYCGE, MYCGI, MYCH2, MYCLB, MYCLE, MYCMM, MYCMS, MYCPA, MYCPE, MYCPN, MYCPU, MYCS2, MYCSJ, MYCSK, MYCSS, MYCTA, MYCTO, MYCTU, MYCUA, MYCVP, NATPD, NAUPA, NEIG1, NEIG2, NEIM0, NEIMA, NEIMB, NEIMF, NEUCR, NITEC, NITEU, NITMU, NITOC, NITSB, NOCFA, NOSP7, NOSS1, NOVAD, OCEIH, OENOB, ONYPE, OPISI, ORITB, ORITI, PAEAT, PARPR, PASMU, PECAS, PECCP, PEDPA, PELPB, PELPD, PELTS, PENCH, PENCI, PEPD6, PHOLL, PHOLU, PHOPR, PICPA, PICTO, PINST, PLAF7, PORGI, PROA2, PROM0, PROM1, PROM2, PROM3, PROM4, PROM5, PROM9, PROMA, PROMH, PROMM, PROMP, PROMS, PROMT, PSE14, PSEA6, PSEA7, PSEA8, PSEAB, PSEAE, PSECP, PSEE4, PSEF5, PSEFS, PSEHT, PSELT, PSEMY, PSEMZ, PSEP1, PSEPF, PSEPG, PSEPK, PSEPW, PSESM, PSEU2, PSYCK, PSYWF, PYRAB, PYRAE, PYRFU, PYRHO, PYRWO, RALSO, RENSM, RHIL3, RHILO, RHILW, RHIME, RHOBA, RHOCS, RHOE4, RHOFT, RHOJR, RHOOB, RHOPA, RHOS1, RHOS4, RHOS5, RHOSK, RIPO1, ROSCS, ROSDO, ROSS1, RUBXD, RUEPO, RUEST, RUTMC, SACEN, SACS2, SALA4, SALAI, SALAR, SALCH, SALDC, SALEP, SALG2, SALHS, SALNS, SALPA, SALPB, SALPK, SALRD, SALSV, SALTI, SALTO, SALTY, SCHMA, SCHPO, SERP5, SHEB2, SHEB5, SHEB8, SHEB9, SHEDO, SHEFN, SHEHH, SHELP, SHEON, SHEPA, SHEPC, SHEPW, SHESA, SHESH, SHESM, SHESR, SHESW, SHEWM, SHIBS, SHIDS, SHIF8, SHIFL, SHISS, SINFN, SINMW, SODGM, SOLUE, SPHAL, SPHWW, SPICI, STAA1, STAA2, STAA3, STAA8, STAA9, STAAB, STAAC, STAAE, STAAM, STAAN, STAAR, STAAS, STAAT, STAAU, STAAW, STACT, STAEQ, STAES, STAHJ, STAS1, STENO, STRA1, STRA3, STRA5, STRAW, STRCO, STRE4, STREM, STRGC, STRGG, STRM5, STRMK, STRMU, STRP1, STRP2, STRP3, STRP4, STRP6, STRP7, STRP8, STRPB, STRPC, STRPF, STRPG, STRPI, STRPJ, STRPM, STRPN, STRPQ, STRPS, STRPZ, STRR6, STRS2, STRS7, STRSV, STRSY, STRT1, STRT2, STRTD, STRU0, STRZJ, STRZP, STRZT, SULAC, SULDN, SULTO, SYMTH, SYNE7, SYNFM, SYNJA, SYNJB, SYNP2, SYNP6, SYNPW, SYNPX, SYNR3, SYNS3, SYNS9, SYNSC, SYNY3, TERTT, TETPY, TETTH, THEAB, THEAC, THEEB, THEKO, THEM4, THEON, THEP1, THERP, THESM, THESQ, THET2, THET8, THEVO, THIDA, THISH, TOLAT, TREDE, TREPA, TREPS, TRIEI, TROW8, TROWT, UREPA, VESOH, VIBC3, VIBCB, VIBCH, VIBPA, VIBVU, VIBVY, WIGBR, WOLPM, WOLPP, WOLSU, WOLTR, WOLWR, XANAC, XANC5, XANC8, XANCB, XANCP, XANFL, XANOM, XANOP, XANOR, XANP2, XYLFA, XYLFT, YARLI, YEAST, YERE8, YERP3, YERPA, YERPB, YERPE, YERPG, YERPN, YERPP, YERPS, YERPY, 

#### 4.2.1.11

ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: MINPP1
        1 ctccactgac cgtcccgacg atgctacgcg cgcccggctg cctcctccgg acctccgtag
       61 cgcctgccgc ggccctggct gcggcgctgc tctcgtcgct tgcgcgctgc tctcttctag
      121 agccgaggga cccggtggcc tcgtcgctca gcccctattt cggcaccaag actcgctacg
      181 aggatgtcaa ccccgtgcta ttgtcgggcc ccgaggctcc gtggcgggac cctgagctgc
      241 tggaggggac ctgcaccccg gtgcagctgg tcgccctcat tcgccacggc acccgctacc
      301 ccacggtcaa acagatccgc aagctgaggc agctgcacgg gttgctgcag gcccgcgggt
      361 ccagggatgg cggggctagt agtaccggca gccgcgacct gggtgcagcg ctggccgact
      421 ggcctttgtg gtacgcggac tggatggacg ggcagctagt agaaaaggga cggcaggata
      481 tgcgacagct ggcgctgcgt ctggcctcgc tcttcccggc ccttttcagc cgtgagaact
      541 acggccgcct gcggctcatc accagttcca agcaccgctg catggatagc agcgccgcct
      601 tcctgcaggg gctgtggcag cactaccacc ctggcttgcc gccgccggac gtcgcagata
      661 tggagtttgg acctccaaca gttaatgata aactaatgag attttttgat cactgtgaga
      721 agtttttaac tgaagtagaa aaaaatgcta cagctcttta tcacgtggaa gccttcaaaa
      781 ctggaccaga aatgcagaac attttaaaaa aagttgcagc tactttgcaa gtgccagtaa
      841 atgatttaaa tgcagattta attcaagtag cctttttcac ctgttcattt gacctggcaa
      901 ttaaaggtgt taaatctcct tggtgtgatg tttttgacat agatgatgca aaggtattag
      961 aatatttaaa tgatctgaaa caatattgga aaagaggata tgggtatact attaacagtc
     1021 gatccagctg caccttgttt caggatatct ttcagcactt ggacaaagca gttgaacaga
     1081 aacaaaggtc tcagccaatt tcttctccag tcatcctcca gtttggtcat gcagagactc
     1141 ttcttccact gctttctctc atgggctact tcaaagacaa ggaaccccta acagcgtaca
     1201 attacaaaaa acaaatgcat cggaagttcc gaagtggtct cattgtacct tatgcctcga
     1261 acctgatatt tgtgctttac cactgtgaaa atgctaagac tcctaaagaa caattccgag
     1321 tgcagatgtt attaaatgaa aaggtgttac ctttggctta ctcacaagaa actgtttcat
     1381 tttatgaaga tctgaagaac cactacaagg acatccttca gagttgtcaa accagtgaag
     1441 aatgtgaatt agcaagggct aacagtacat ctgatgaact atgagtaact gaagaacatt
     1501 tttaattctt taggaatctg caatgagtga ttacatgctt gtaataggta ggcaattcct
     1561 tgattacagg aagcttttat attacttgag tatttctgtc ttttcacaga aaaacattgg
     1621 gtttctctct gggtttggac atgaaatgta agaaaagatt tttcactgga gcagctctct
     1681 taaggagaaa caaatctatt tagagaaaca gctggccctg caaatgttta cagaaatgaa
     1741 attcttccta cttatataag aaatctcaca ctgagataga attgtgattt cataataaca
     1801 cttgaaaagt gctggagtaa caaaatatct cagttggacc atccttaact tgattgaact
     1861 gtctaggaac tttacagatt gttctgcagt tctctcttct tttcctcagg taggacagct
     1921 ctagcatttt cttaatcagg aatattgtgg taagctggga gtatcactct ggaagaaagt
     1981 aacatctcca gatgagaatt tgaaacaaga aacagagtgt tgtaaaagga caccttcact
     2041 gaagcaagtc ggaaagtaca atgaaaataa atatttttgg tatttattta tgaaatattt
     2101 gaacattttt tcaataattc ctttttactt ctaggaagtc tcaaaagacc atcttaaatt
     2161 attatatgtt tggacaatta gcaacaagtc agatagttag aatcgaagtt tttcaaatcc
     2221 attgcttagc taactttttc attctgtcac ttggcttcga tttttatatt ttcctattat
     2281 atgaaatgta tcttttggtt gtttgatttt tctttctttc tttgtaaata gttctgagtt
     2341 ctgtcaaatg ccgtgaaagt atttgctata ataaagaaaa ttcttgtgac tttaaaaaaa
     2401 aaaaaaaaaa aa
     MLRAPGCLLRTSVAPAAALAAALLSSLARCSLLEPRDPVASSLS
     PYFGTKTRYEDVNPVLLSGPEAPWRDPELLEGTCTPVQLVALIRHGTRYPTVKQIRKL
     RQLHGLLQARGSRDGGASSTGSRDLGAALADWPLWYADWMDGQLVEKGRQDMRQLALR
     LASLFPALFSRENYGRLRLITSSKHRCMDSSAAFLQGLWQHYHPGLPPPDVADMEFGP
     PTVNDKLMRFFDHCEKFLTEVEKNATALYHVEAFKTGPEMQNILKKVAATLQVPVNDL
     NADLIQVAFFTCSFDLAIKGVKSPWCDVFDIDDAKVLEYLNDLKQYWKRGYGYTINSR
     SSCTLFQDIFQHLDKAVEQKQRSQPISSPVILQFGHAETLLPLLSLMGYFKDKEPLTA
     YNYKKQMHRKFRSGLIVPYASNLIFVLYHCENAKTPKEQFRVQMLLNEKVLPLAYSQE
     TVSFYEDLKNHYKDILQSCQTSEECELARANSTSDEL
     CDS             21..1484

MOUSE: Minpp1
        1 acaccgaagc tccgagacga tcggccacac tcgctcggtg acagcaccgg agaccacgct
       61 tgccttctga ggttcccggg ccggaagtgc gctctgctcc cgcccccgcc ggcggatccg
      121 gaagtggggg tcggcaagcg gcgcgccgcc ctccgcgggg cccccgggca cgatgcttcg
      181 cggcgcgcgc agccacctcc cggcctcggt agcgcccgcc gcggtcctgg ctgcggcgct
      241 gctctcgtcg ttcgcgcgct gctctctccc ggggcgcggc gacccggtgg cttcggtgct
      301 cagcccctac ttcggcacga agacacgcta cgaagatgcc aacccctggc tgctggtcga
      361 tccggtggcg ccgcggcggg acccggagct gctggcgggg acctgcaccc cggtgcagct
      421 ggtcgccctc atccgtcacg gcacccgcta ccctacgacc aagcagatcc gcaagctgaa
      481 gcagctgcag gggctgctgc agacccgcga gtcccgggat ggcgggagcc aagtggccgc
      541 cgcgctggcc gagtggccgc tgtggtacgg tgactggatg gacgggcagc tggtggagaa
      601 ggggcggcag gacatgcgac agctggccct gcgtctggct gccctcttcc cagacctctt
      661 cagccgggag aactacgacc gcctgcggct gatcaccagc tccaagcacc gctgtgtgga
      721 cagcagcgcc gccttcctcc aggggttgtg gcagcattac cacccaggac tgccacctcc
      781 cgacgtctca gatatggagt gtggccctcc aagaattaat gataaactaa tgaggttctt
      841 cgatcattgt gagaagttct taactgatgt ggaaagaaac gagacggctc tttatcatgt
      901 ggaagctttc aaaactggac cagaaatgca gaaggtctta aagaaagttg cagctactct
      961 gcaagtgcca atgaacagtt taaatgcaga cttaattcag gtagcttttt tcacctgttc
     1021 atttgacctg gcaattaaag gtgtccattc tccctggtgt gatgtgtttg acgtagatga
     1081 tgcaagggtt ctggaatact taaacgacct gaaacagtac tggaaacgaa gctatggcta
     1141 caccattaac agccggtcca gctgcaacct atttcaggac atttttctac acctggacaa
     1201 agcagtggag cagaagcaaa ggtctcagcc agtctcctct ccagtcatcc tccagtttgg
     1261 acacgcggag acgctcctgc cgctcctctc cctcatgggc tacttcaagg acaaggagcc
     1321 tctgaccgct tacaatttcg aggagcaagt taatcgcaag ttccgaagtg gtcacatcgt
     1381 accttatgcc tcaaacctaa tcttcgtgct ttaccactgt gacaacgcgc agagccccga
     1441 agaacaattc cagatacagc tgctgctgaa tgagaaggtg ctgcccctgg ctcactcgca
     1501 gagacccgtc gggttgtatg aggagctcaa gacccactac cgggacattc ttcagagctg
     1561 ccaaaccagt aaggagtgca gcccgcccaa agcgaacatc acgtccgatg agctctgagg
     1621 accttcggct gtgcatactg aggggtggtt gtgtttgcag gaggtagcca ctctagaggc
     1681 cgcggcagaa ggagctctgt gagtccaagg ccagcctgtt ctacatagtg agttccaggc
     1741 cagccaagac tacatagagc aataaagcct ggtctttctg tcttttcaca gaaaataata
     1801 gttcctttta ggatctagac atacgggtaa gacatgactc tccctggagc agctctctgc
     1861 agaacaaaaa ctaattcaat gaagcagctg tccctcccag tgtttgcaga gctgagattt
     1921 tcctaatgac ctaagaagat actgacgtag aacggtatta gaaaatgaca cttcaaaaat
     1981 gttggatacc aaagcacggt agctgccggg tgagcggcag tgattggcag agatggggac
     2041 ttgagtgacc atgttgggtt cccttcttct ccttcttgca ggacacaaat gatatcgctt
     2101 agtcataagt gtggtagact ggatcctgac cagaaggagg tctgatataa tatccatcca
     2161 gacaagaaat caacatgcta tcaagaacca ggttgaagca aaactgaaag tgtgtgatat
     2221 ttttgttgac gttatttata aaaatatttc aacgctgtca ataattgtct ttaacctcca
     2281 agtaggtctt gcagaatcgt cttcatttca tcagacctat tgggggtgaa cagtaattaa
     2341 taggaggccc agcctggcag acgcttgctg acgctccttg gctcttgcct gcttgtcttt
     2401 ttcattccat catggcttcc cttttcatag ctggatcttc cgtgaagtgt tccttttggt
     2461 ggtttggatt tttttttttt ttaaataaag accttatctg ccgaatttaa ttgtagagat
     2521 ttgaacccga tcaaagaaat tttgagttct ctcaaatacc ataaaagtgt ttgctacaat
     2581 aaataaaatt cttgtgactt taaaaaaaaa a
     MLRGARSHLPASVAPAAVLAAALLSSFARCSLPGRGDPVASVLS
     PYFGTKTRYEDANPWLLVDPVAPRRDPELLAGTCTPVQLVALIRHGTRYPTTKQIRKL
     KQLQGLLQTRESRDGGSQVAAALAEWPLWYGDWMDGQLVEKGRQDMRQLALRLAALFP
     DLFSRENYDRLRLITSSKHRCVDSSAAFLQGLWQHYHPGLPPPDVSDMECGPPRINDK
     LMRFFDHCEKFLTDVERNETALYHVEAFKTGPEMQKVLKKVAATLQVPMNSLNADLIQ
     VAFFTCSFDLAIKGVHSPWCDVFDVDDARVLEYLNDLKQYWKRSYGYTINSRSSCNLF
     QDIFLHLDKAVEQKQRSQPVSSPVILQFGHAETLLPLLSLMGYFKDKEPLTAYNFEEQ
     VNRKFRSGHIVPYASNLIFVLYHCDNAQSPEEQFQIQLLLNEKVLPLAHSQRPVGLYE
     ELKTHYRDILQSCQTSKECSPPKANITSDEL
     gene            1..2611
     CDS             173..1618
     
DROME: Mipp1
        1 cgcgacgtcg tgagcggtca agtcgcttga aacggctaag ggaaaactac tgcccaactt
       61 caattgttta ccaagtgcat ttaaattacc aactactaga gctatgcgcc tgctgatatt
      121 gctactgctg ccactggtgg ccatcgccca agatgactac tgcttcagca aggacacctc
      181 ccgcctccag acccgccagt tctcctcgaa gaccgcctat cagatcgtca agggcacgga
      241 cattgacaag cagtacctgg tgcccggctg tcagccccag aagatgtgga tctttcacag
      301 gcacggcaca cgactgccca agaagagcat gatcaacaag gcgtccaggg tggctgagct
      361 gcgcgatctc atcattaaca actaccaagt ggccaggacc aagcccgaaa cggatgctct
      421 ctgccagacg gatctgattg ccatcaagtt gtggaagtgg aacagcagca taacgcccga
      481 catggaggag tatctgaccg cccagggcta cgaggatctc aggggcacgg ccaagctgta
      541 ccagcggtac tatcccactg tgctgaccgc taactataat gacacttact accagttccg
      601 ccatacggac acccagcgca ccacggaaag tttcaaggct ttcgccgagg gtctgtttgg
      661 atcccaaaac gctgctcatc ccgtcgagat tcccaagcag gatctgctgc tgcgtcccta
      721 tgactattgc tcctctttca agaatgtgaa ctacaaggat gagggctctg agtactacaa
      781 gtttcatcag tcgaagctgt acaacgacac gttggcggat atctccactc gattgggttt
      841 cctttacacc ctggaggagg cggacatcaa gctaatgtac gatatgtgtc gctatgagca
      901 ggcgtggaat gtggaccgca atagcgtctg gtgcggcgcc ttcttgccgg agcaaataac
      961 ggtctttgag tacctggaag atctaaagta ctactatggc tcgggctatg gtttcccgga
     1021 aaacgcacat ctcaactgcc gactggtgca ggacctgctc acccacctga gcaatccggt
     1081 gtcgccgcat gtggtanctc atttcggtca ctcgactggt ctcctaactc tcctaactgc
     1141 gctgggaatc canaaggacg acatcaagtt gcgggcagac aattacgata gtttgacgag
     1201 ccgccgttgg aagagcagcc tgatcgatcc gtttgccgcc aatttcgtgg cggtgaaata
     1261 cgacttgccg gcggacttgg atcgcgagaa ggtggtcttc ttcctcaacc agcaggccgt
     1321 gcagctggac tggtgcagcg tcggtctgtg caagtggtca gatgtcctcg agaagtacaa
     1381 gaccattgcg gatgcggatt gtggagaata ctactgccgg acgggaggtg ctccatcgct
     1441 gggatccgga gttggcggac ttctggccac cacgctcgcc gccatgctgg tctacttaat
     1501 gcactaactt tcgattagat tagtttttaa ttcgtaatgt acaaatttcg taccaaatgg
     1561 agggacgcca
     MRLLILLLLPLVAIAQDDYCFSKDTSRLQTRQFSSKTAYQIVKG
     TDIDKQYLVPGCQPQKMWIFHRHGTRLPKKSMINKASRVAELRDLIINNYQVARTKPE
     TDALCQTDLIAIKLWKWNSSITPDMEEYLTAQGYEDLRGTAKLYQRYYPTVLTANYND
     TYYQFRHTDTQRTTESFKAFAEGLFGSQNAAHPVEIPKQDLLLRPYDYCSSFKNVNYK
     DEGSEYYKFHQSKLYNDTLADISTRLGFLYTLEEADIKLMYDMCRYEQAWNVDRNSVW
     CGAFLPEQITVFEYLEDLKYYYGSGYGFPENAHLNCRLVQDLLTHLSNPVSPHVVXHF
     GHSTGLLTLLTALGIXKDDIKLRADNYDSLTSRRWKSSLIDPFAANFVAVKYDLPADL
     DREKVVFFLNQQAVQLDWCSVGLCKWSDVLEKYKTIADADCGEYYCRTGGAPSLGSGV
     GGLLATTLAAMLVYLMH
     gene            1..1570
     CDS             104..1507

Other Animals:
CHICK, DICDI, DROME, HUMAN, MOUSE, PONAB, RAT, 


### Pentose Phosphate

#### 2.2.1.2
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: TALDO1
        1 cgcgcccgtc ccgtcgccgc cgccgccgcc gcagacccct cggtcttgct atgtcgagct
       61 cacccgtgaa gcgtcagagg atggagtccg cgctggacca gctcaagcag ttcaccaccg
      121 tggtggccga cacgggcgac ttccacgcca tcgacgagta caagccccag gatgctacca
      181 ccaacccgtc cctgatcctg gccgcagcac agatgcccgc ttaccaggag ctggtggagg
      241 aggcgattgc ctatggccgg aagctgggcg ggtcacaaga ggaccagatt aaaaatgcta
      301 ttgataaact ttttgtgttg tttggagcag aaatactaaa gaagattccg ggccgagtat
      361 ccacagaagt agacgcaagg ctctcctttg ataaagatgc gatggtggcc agagccaggc
      421 ggctcatcga gctctacaag gaagctggga tcagcaagga ccgaattctt ataaagctgt
      481 catcaacctg ggaaggaatt caggctggaa aggagctcga ggagcagcac ggcatccact
      541 gcaacatgac gttactcttc tccttcgccc aggctgtggc ctgtgccgag gcgggtgtga
      601 ccctcatctc cccatttgtt gggcgcatcc ttgattggca tgtggcaaac accgacaaga
      661 aatcctatga gcccctggaa gaccctgggg taaagagtgt cactaaaatc tacaactact
      721 acaagaagtt tagctacaaa accattgtca tgggcgcctc cttccgcaac acgggcgaga
      781 tcaaagcact ggccggctgt gacttcctca ccatctcacc caagctcctg ggagagctgc
      841 tgcaggacaa cgccaagctg gtgcctgtgc tctcagccaa ggcggcccaa gccagtgacc
      901 tggaaaaaat ccacctggat gagaagtctt tccgttggtt gcacaacgag gaccagatgg
      961 ctgtggagaa gctctctgac gggatccgca agtttgccgc tgatgcagtg aagctggagc
     1021 ggatgctgac agaacgaatg ttcaatgcag agaatggaaa gtagcgcatc cctgaggctg
     1081 gactccagat ctgcaccgcc ggccagctgg gatctgactg cacgtggctt ctgatgaatc
     1141 ttgcgttttt tacaaattgg agcagggaca gatcatagat ttctgatttt atgtaaaatt
     1201 ttgcctaata cattaaagca gtcacttttc ctgtgctgtt tcaaaaaaaa aaaaaaaaaa
     1261 aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa aaaaaaaaa
     MSSSPVKRQRMESALDQLKQFTTVVADTGDFHAIDEYKPQDATT
     NPSLILAAAQMPAYQELVEEAIAYGRKLGGSQEDQIKNAIDKLFVLFGAEILKKIPGR
     VSTEVDARLSFDKDAMVARARRLIELYKEAGISKDRILIKLSSTWEGIQAGKELEEQH
     GIHCNMTLLFSFAQAVACAEAGVTLISPFVGRILDWHVANTDKKSYEPLEDPGVKSVT
     KIYNYYKKFSYKTIVMGASFRNTGEIKALAGCDFLTISPKLLGELLQDNAKLVPVLSA
     KAAQASDLEKIHLDEKSFRWLHNEDQMAVEKLSDGIRKFAADAVKLERMLTERMFNAE
     NGK
     source          1..1319
     repeat_region   1..464
     5'UTR           1..50
     CDS             51..1064
     
MOUSE: Taldo1
        1 tcgccatgtc ggggtccccg gtaaagcgcc agaggatgga gtccgccttg gaccagctca
       61 agcagttcac caccgtggtg gccgacacgg gtgatttcaa tgccatcgat gaatacaagc
      121 cccaagatgc caccaccaac ccatccctga tcctggctgc agcccagatg cctgcctacc
      181 aagagctggt agaggaggcc attgcctacg gcaagaagct gggtgggcct caagaggagc
      241 agattaaaaa tgccattgac aaactttttg tgctgtttgg agcagaaata ttaaagaaga
      301 ttccaggccg tgtatccaca gaagttgatg caaggctttc ctttgataag gatgccatgg
      361 tggcccgagc caggcgcctc atcgagcttt acaaagaagc tggggtcggc aaggacagaa
      421 ttctcatcaa gttatcatca acctgggagg ggattcaggc tggaaaggag ctggaggaac
      481 agcatggcat ccactgcaac atgacactgc ttttctcctt cgcccaggct gtggcctgtg
      541 ctgaggcggg cgtgacgctc atctctccct ttgtggggcg catccttgat tggcatgtgg
      601 caaacacaga caagaaatcc tatgaacccc aggaggaccc tggggtcaag agtgtcacca
      661 aaatctacaa ctactacaag aagttcggct acaagaccat tgtcatgggc gcctccttcc
      721 gcaacacggg cgagatcaaa gcactggcgg gctgtgactt cctcaccatc tccccgaagc
      781 tcctggggga gctgctcaag gataacagca agctggcgcc tgcgctctct gtcaaggcgg
      841 cccagaccag tgactcggag aagatacatc tggacgagaa ggccttccgt tggctgcaca
      901 acgaagacca aatggccgtg gagaagctct ccgacggcat ccgcaaattt gctgctgatg
      961 ccataaagtt ggagcggatg ctcacggaac gaatgttcag cgctgagaac gggaagtagt
     1021 gcaacacccg aggccccagt cctgcaccga ggctgacccc agacctgcac tgcctttgag
     1081 ctgggtccta attgcacatg gcttgtgacg aatgaatctt gcatttttta gtgatcggag
     1141 aagggatgga tcata
     MSGSPVKRQRMESALDQLKQFTTVVADTGDFNAIDEYKPQDATT
     NPSLILAAAQMPAYQELVEEAIAYGKKLGGPQEEQIKNAIDKLFVLFGAEILKKIPGR
     VSTEVDARLSFDKDAMVARARRLIELYKEAGVGKDRILIKLSSTWEGIQAGKELEEQH
     GIHCNMTLLFSFAQAVACAEAGVTLISPFVGRILDWHVANTDKKSYEPQEDPGVKSVT
     KIYNYYKKFGYKTIVMGASFRNTGEIKALAGCDFLTISPKLLGELLKDNSKLAPALSV
     KAAQTSDSEKIHLDEKAFRWLHNEDQMAVEKLSDGIRKFAADAIKLERMLTERMFSAE
     NGK
     source          1..1155
     CDS             6..1019

DROME: Taldo
        1 ggaagtgatc gcacgttaaa aaagcaaaag atgtcggtat tacaggaact caagaaaatc
       61 accacaattg tggctgacac cggcgacttt gaagccatca acatctataa gcccacggat
      121 gccaccacta atccctccct catcttgtcc gcttcgtcca tggagcggta ccagccgctg
      181 gtccaaaagg cggtggaata cgccaagggc aagaagggct ccgtgagtga gcaggtggcc
      241 gaggccatgg actacctgtg cgtgctgttc ggaacggaaa tcctgaaggt tgtgcccggt
      301 cgcgtttcca ccgagatcga tgcccgcttg tccttcgaca ccaagaagag cgtggagaag
      361 gccctgaagc tgatcgccct gtacaaatcc ctgggcgtcg acaaggagcg aattctgatc
      421 aagctggcgt ccacctggga gggcatcaag gcggccgaga tcctggagaa cgagcacggt
      481 gtgcactgca acctgacgct ccttttctcg ttcgcacagg ccgtggcttg cgccgaggcc
      541 ggcgtgaccc tcatctcccc gttcgtgggc cgcatcctgg actggtacgt ggccaacacg
      601 gataccaaga agttcgaggc gctcaaggac ccgggcgtga tctccgtgac gaacatctac
      661 aactactaca agaagttcgg ctacaagacc ctggtcatgg gcgcctcctt ccgtaacgtg
      721 ggcgaaatca aggccctggc tggctgcgat ctgcttacca tcagcccagc gctgcttaag
      781 gagctggaga acgagaccga gtcggtggtc acctacctgt ccgtaagcaa cgccaagctg
      841 caggacatcg agaagatcac cgtcgatgag agccggttcc gctggctgct caacgaggac
      901 gccatggcca ccgacaaact ttccgagggc atcaggaagt tcgccgtgga tactgttaag
      961 ctggagaatt tgattaagac ctatcttaag tagatgttcc tctgggtccg ctagcaggtg
     1021 gaggatgaat acattcgttt ttgaaaaaga caatgatttt atactttaat aaacactaca
     1081 attaaaagag atgaaaaaaa aaaaaaaaaa a
     MSVLQELKKITTIVADTGDFEAINIYKPTDATTNPSLILSASSM
     ERYQPLVQKAVEYAKGKKGSVSEQVAEAMDYLCVLFGTEILKVVPGRVSTEIDARLSF
     DTKKSVEKALKLIALYKSLGVDKERILIKLASTWEGIKAAEILENEHGVHCNLTLLFS
     FAQAVACAEAGVTLISPFVGRILDWYVANTDTKKFEALKDPGVISVTNIYNYYKKFGY
     KTLVMGASFRNVGEIKALAGCDLLTISPALLKELENETESVVTYLSVSNAKLQDIEKI
     TVDESRFRWLLNEDAMATDKLSEGIRKFAVDTVKLENLIKTYLK

Other Animals:
BACAN, BACCR, CYBJA, FUSO4, GIBIN, KLULA, LISIN, LISMF, LISMO, PECAS, SALCH, SALPA, SCHPO, SHISS, STRAW, STRCO, YEAST, BACAN, BACCR, LISIN, LISMF, LISMO, NOSP7, NOSS1, PECAS, SALCH, SALPA, SHISS, STRAW, STRCO, YEAST, CYBJA, ECO57, ECOL6, ECOLI, PASMU, SALTI, SALTY, SHIFL, ECO57, ECOL6, ECOLI, PASMU, SALTI, SALTY, SHIFL, BOVIN, CAPAA, CARMA, CRIGR, DICDI, DROME, HUMAN, MOUSE, O_PIG, O_RAT, ACIAC, ACIC1, ACIC5, ACIET, ACISJ, ACTP2, ACTP7, ACTPJ, ACTSZ, AERS4, AGARV, AGRFC, AGRRK, AGRVS, ALIF1, ALIFM, ALISL, ALKMQ, ALKOO, ALTMD, ANAD2, ANADE, ANADF, ANASK, ANAVT, AQUAE, ARTS2, BACC1, BACCN, BACCZ, BACFN, BACFR, BACHD, BACHK, BACP2, BACSK, BACSU, BACTN, BACV8, BACVZ, BARBK, BARHE, BARQU, BART1, BAUCH, BDEBA, BLOFL, BORA1, BORBR, BORPA, BORPD, BORPE, BRAHW, BREBN, BRUA1, BRUA2, BRUAB, BRUC2, BRUMB, BRUME, BRUO2, BRUSI, BRUSU, BUCA5, BUCAI, BUCAP, BUCAT, BUCBP, BUCCC, BURA4, BURCA, BURCC, BURCH, BURCJ, BURCM, BURL3, BURM1, BURM7, BURMA, BURMS, BURP0, BURP1, BURP6, BURPS, BURTA, BURVG, CALBD, CALS4, CALS8, CAMJ8, CAMJD, CAMJE, CAMJJ, CAMJR, CARHZ, CAUSK, CAUVC, CAUVN, CELJU, CHESB, CHLAB, CHLCH, CHLCV, CHLFF, CHLL2, CHLL7, CHLMU, CHLP8, CHLPB, CHLPD, CHLPM, CHLPN, CHLT3, CHLTA, CHLTE, CHLTR, CHRSD, CLOAB, CLOB1, CLOB6, CLOBA, CLOBB, CLOBH, CLOBJ, CLOBK, CLOBL, CLOBM, CLOK1, CLOK5, CLONN, CLOP1, CLOPE, CLOPS, CLOTE, COLP3, COPPD, CUPMC, CUPNH, CUPNJ, CUPTR, CYTH3, DEHM1, DEIRA, DELAS, DESAD, DESAH, DESAL, DESAP, DESHD, DESHY, DESOH, DESPS, DESRM, DICTD, DINSH, ECO1E, EDWI9, ERYLH, EXIS2, EXISA, FERNB, FLAPJ, FRAAA, FRACC, FRASN, GEOBB, GEODF, GEOKA, GEOLS, GEOMG, GEOSL, GEOSM, GEOSW, GEOTN, GEOUR, GLOVI, HAEDU, HAEI8, HAEIE, HAEIG, HAEIN, HAEPS, HAES1, HAMD5, HELMI, HELP2, HELPH, HELPJ, HELPS, HELPY, HERA2, HISS2, HYDS0, HYPNA, JANSC, KOCRD, KOSOT, LACP7, LACPL, LEIXX, LEPBA, LEPBJ, LEPBL, LEPBP, LEPCP, LEPIC, LEPIN, LYSSC, MANSM, MARHV, MARMM, MARMS, META3, METAM, METCA, METFK, METJA, METM5, METM6, METM7, METMP, METPP, METVS, MOOTA, MYCBO, MYCBP, MYCBT, MYCLB, MYCLE, MYCMM, MYCPA, MYCS2, MYCTA, MYCTO, MYCTU, MYCUA, MYXXD, NATTJ, NEIG1, NEIG2, NEIM0, NEIMA, NEIMB, NEIMF, NITMS, NOSP7, NOSS1, NOVAD, OCEIH, OCHA4, OPITP, PARD8, PARDP, PARL1, PARP8, PARPJ, PARUW, PARXL, PELCD, PELPB, PELPD, PELTS, PEPD6, PERMH, PETMO, PHEZH, PHOLL, PHOPR, PICTO, POLNA, POLSJ, PORG3, PORGI, PROA2, PROM0, PROM1, PROM4, PROM5, PROM9, PROMA, PROMH, PROMM, PROMP, PROMT, PSE14, PSEA6, PSEA7, PSEA8, PSEAB, PSEAE, PSECP, PSEE4, PSEF5, PSELT, PSEMY, PSEPF, PSEPG, PSEPK, PSEPW, PSESM, PSEU2, PSEU5, RALPJ, RALSO, RENSM, RHIE6, RHIEC, RHILO, RHILW, RHIME, RHOCS, RHOFT, RHORT, RHOS1, RHOS4, RHOS5, RHOSK, ROSCS, ROSDO, ROSS1, RUEPO, RUEST, SACEN, SHEAM, SHEB2, SHEB5, SHEB8, SHEB9, SHEDO, SHEFN, SHEHH, SHELP, SHEON, SHEPA, SHEPC, SHEPW, SHESA, SHESH, SHESM, SHESR, SHESW, SHEWM, SHIBS, SHIDS, SINFN, SINMW, SODGM, SORC5, SPHAL, SPHWW, STRA3, STRA5, STRE4, STREM, STRP1, STRP3, STRP6, STRP8, STRPB, STRPC, STRPD, STRPF, STRPG, STRPM, STRPQ, STRPZ, STRS7, SULSY, SYMTH, SYNFM, SYNP6, SYNPX, SYNWW, SYNY3, TERTT, THEAB, THEAC, THEEB, THEFY, THEM4, THEMA, THEP1, THEPX, THESQ, THET2, THET8, THEVO, THEYD, THIDA, THISH, TRIEI, VARPS, VEREI, VIBC3, VIBCB, VIBCH, VIBCM, VIBPA, VIBVU, VIBVY, WIGBR, XANAC, XANC5, XANC8, XANCB, XANCP, XANOM, XANOP, XANOR, YERE8, YERP3, YERPB, YERPE, YERPG, YERPS, 

#### 2.7.1.11
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: PFKL
        1 gcgacgcggc gcaggcggcg ggagtgcgag ctgggcccgt gtttcggccg ccgccatggc
       61 cgcggtggac ctggagaagc tgcgggcgtc gggcgcgggc aaggccatcg gcgtcctgac
      121 cagcggcggc gaccggcaag gcatgaacgc tgctgtccgg gctgtgacgc gcatgggcat
      181 ttatgtgggt gccaaagtct tcctcatcta cgagggctat gagggcctcg tggagggagg
      241 tgagaacatc aagcaggcca actggctgag cgtctccaac atcatccagc tgggcggcac
      301 tatcattggc agcgctcgct cgaaggcctt taccaccagg gaggggcgcc gggcagcggc
      361 ctacaacctg gtccagcacg gcatcaccaa cctgtgcgtc atcggcgggg atggcagcct
      421 cacaggtgcc aacatcttcc gcagcgagtg gggcagcctg ctggaggagc tggtggcgga
      481 aggtaagatc tcagagacta cagcctggac ctactcgcac ctgaacatcg cgggcctagt
      541 gggctccatc gataacgact tctgcggcac cgacatgacc atcggcacgg actcggccct
      601 ccaccgcatc atggaggtca tcgatgccat caccaccact gcccagagcc accagaggac
      661 cttcgtgctg gaagtgatgg gccggcactg cgggtacctg gcgctggtat ctgcactggc
      721 ctcaggggcc gactggctgt tcatccccga ggctccaccc gaggacggct gggagaactt
      781 catgtgtgag aggctgggtg agactcggag ccgtgggtcc cgactgaaca tcatcatcat
      841 cgctgagggt gccattgacc gcaacgggaa gcccatctcg tccagctacg tgaaggacct
      901 ggtggttcag aggctgggct tcgacacccg tgtaactgtg ctgggccacg tgcagcgggg
      961 agggacgccc tctgccttcg accggatcct gagcagcaag atgggcatgg aggcggtgat
     1021 ggcgctgctg gaagccacgc ctgacacgcc ggcctgcgtg gtcaccctct cggggaacca
     1081 gtcagtgcgg ctgcccctca tggagtgcgt gcagatgacc aaggaagtgc agaaagccat
     1141 ggatgacaag aggtttgacg aggccaccca gctccgtggt gggagcttcg agaacaactg
     1201 gaacatttac aagctcctca cccaccagaa gccccccaag gagaagtcta acttctccct
     1261 ggccatcctg aatgtggggg ccccggcggc tggcatgaat gcggccgtgc gctcggcggt
     1321 gcggaccggc atctcccatg gacacacagt atacgtggtg cacgatggct tcgaaggcct
     1381 agccaagggt caggtgcaag aagtaggctg gcacgacgtg gccggctggt tggggcgtgg
     1441 tggctccatg ctggggacca agaggaccct gcccaagggc cagctggagt ccattgtgga
     1501 gaacatccgc atctatggta ttcacgccct gctggtggtc ggtgggtttg aggcctatga
     1561 aggggtgctg cagctggtgg aggctcgcgg gcgctacgag gagctctgca tcgtcatgtg
     1621 tgtcatccca gccaccatca gcaacaacgt ccctggcacc gacttcagcc tgggctccga
     1681 cactgctgta aatgccgcca tggagagctg tgaccgcatc aaacagtctg cctcggggac
     1741 caagcgccgt gtgttcatcg tggagaccat ggggggttac tgtggctacc tggccaccgt
     1801 gactggcatt gctgtggggg ccgacgccgc ctacgtcttc gaggaccctt tcaacatcca
     1861 cgacttaaag gtcaacgtgg agcacatgac ggagaagatg aagacagaca ttcagagggg
     1921 cctggtgctg cggaacgaga agtgccatga ctactacacc acggagttcc tgtacaacct
     1981 gtactcatca gagggcaagg gcgtcttcga ctgcaggacc aatgtcctgg gccacctgca
     2041 gcagggtggc gctccaaccc cctttgaccg gaactatggg accaagctgg gggtgaaggc
     2101 catgctgtgg ttgtcggaga agctgcgcga ggtttaccgc aagggacggg tgttcgccaa
     2161 tgccccagac tcggcctgcg tgatcggcct gaagaagaag gcggtggcct tcagccccgt
     2221 cactgagctc aagaaagaca ctgatttcga gcaccgcatg ccacgggagc agtggtggct
     2281 gagcctgcgg ctcatgctga agatgctggc acaataccgc atcagtatgg ccgcctacgt
     2341 gtcaggggag ctggagcacg tgacccgccg caccctgagc atggacaagg gcttctgagg
     2401 ccagccatgc ccgagctgcc cctccccagc ccccacccat gccagcgcac gcgccagggc
     2461 tcagatgggg cctgggctgt tgtgtctgga gcctgcaggc aggtgggggc tgcgtccctg
     2521 ctcagcccat cccctgcctc tactccctgg ccacctgcca ggcctccctc cggctggtgt
     2581 cttgagacca gcctgccagg cctccagcag gaggacagag tgccctgggg catccacctt
     2641 cctgcccagg ggacgtggcg ctgtcggtgt ttggaggctg ctgccccctg gctttggcgc
     2701 cccatgggcc ctcagcgtct ccccatgctg ggctcactac atgggccagc ccttgctcta
     2761 cctggccggt aggctgctgg cgcctaggtt gtgttgagag ggggatgccc ctggccctgc
     2821 ctcactgtga cctgctcctg cccacgtgca gcacctgtca ccttttctag aaataaaatc
     2881 accctgactg tggggtgcca tcggtctccg gaga
     MAAVDLEKLRASGAGKAIGVLTSGGDRQGMNAAVRAVTRMGIYV
     GAKVFLIYEGYEGLVEGGENIKQANWLSVSNIIQLGGTIIGSARSKAFTTREGRRAAA
     YNLVQHGITNLCVIGGDGSLTGANIFRSEWGSLLEELVAEGKISETTAWTYSHLNIAG
     LVGSIDNDFCGTDMTIGTDSALHRIMEVIDAITTTAQSHQRTFVLEVMGRHCGYLALV
     SALASGADWLFIPEAPPEDGWENFMCERLGETRSRGSRLNIIIIAEGAIDRNGKPISS
     SYVKDLVVQRLGFDTRVTVLGHVQRGGTPSAFDRILSSKMGMEAVMALLEATPDTPAC
     VVTLSGNQSVRLPLMECVQMTKEVQKAMDDKRFDEATQLRGGSFENNWNIYKLLTHQK
     PPKEKSNFSLAILNVGAPAAGMNAAVRSAVRTGISHGHTVYVVHDGFEGLAKGQVQEV
     GWHDVAGWLGRGGSMLGTKRTLPKGQLESIVENIRIYGIHALLVVGGFEAYEGVLQLV
     EARGRYEELCIVMCVIPATISNNVPGTDFSLGSDTAVNAAMESCDRIKQSASGTKRRV
     FIVETMGGYCGYLATVTGIAVGADAAYVFEDPFNIHDLKVNVEHMTEKMKTDIQRGLV
     LRNEKCHDYYTTEFLYNLYSSEGKGVFDCRTNVLGHLQQGGAPTPFDRNYGTKLGVKA
     MLWLSEKLREVYRKGRVFANAPDSACVIGLKKKAVAFSPVTELKKDTDFEHRMPREQW
     WLSLRLMLKMLAQYRISMAAYVSGELEHVTRRTLSMDKGF
     source          1..2914
     CDS             56..2398

MOUSE: Pfkl
        1 gcggcgggag aggagcttgg gctcctggtc tccgctgccg ccatggctac cgtggacctg
       61 gagaaactgc ggatgtcggg ggctggcaag gccattggag tgctgaccag cggcggtgat
      121 gcgcaaggta tgaatgctgc tgtcagggct gtgacccgta tgggcatata tgtgggggcc
      181 aaagtcttcc tcatctatga gggctacgag ggccttgtgg aaggaggcga gaacatcaag
      241 ccagccaact ggctcagcgt ttccaatatc atccagctgg gtggcaccat tattggcagt
      301 gcccgctgta aggccttcac tacgagggaa ggccgcctgg ctgcagccta caatctgctc
      361 caacacggca tcaccaacct gtgtgtcatc ggtggcgacg gcagcctcac gggggccaac
      421 atcttccgca acgagtgggg cagcttgctg gaggagctgg tgaaggaagg caagatctca
      481 gagtccacag ctcagaacta cgcacacttg accatcgccg gtctggtggg ctccatcgat
      541 aacgacttct gtggcactga catgaccatt ggcacagact cagccctgca ccgcattatg
      601 gaggtcattg acgccatcac taccactgcc caaagtcacc agaggacctt tgttttggag
      661 gtgatgggac ggcactgcgg gtacctggcg ctggtgtctg ccctggcttc cggggctgat
      721 tggctattca ttcctgaagc gccccctgag gatggctggg agaacttcat gtgtgagagg
      781 ctgggcgaga ctcggagccg aggctctcgg ctgaacatca tcatcatcgc agagggtgcc
      841 attgaccggc atggaaagcc tatctcatcc agctacgtga aggatctggt ggttcagagg
      901 ctgggcttcg atacacgagt gactgtgctg ggtcatgtac agcgaggagg gacgccttca
      961 gccttcgacc gaatcctgag tagcaagatg ggtatggagg ccgtgatggc gctgctagag
     1021 gccacgcctg acacgccggc ctgtgtggtc agcctctccg ggaaccagtc tgtgaggctg
     1081 cctctcatgg agtgtgtgca agtgacaaag gacgtgcaga aggccatgga cgaggagagg
     1141 tttgacgagg ccatccagct ccgtggcagg agctttgaga acaactggaa aatttacaag
     1201 ctccttgccc accagaaggt gtctaaagag aagtccaact tctccctggc catcctgaat
     1261 gtgggggctc cagctgctgg catgaatgca gctgtgccgt ccgcagtgcg cactggtatc
     1321 tccgagggac acacggtata catcgtgcat gatggctttg agggtctggc caagggtcag
     1381 gtgcaagaag tgggctggca tgatgtggca ggctggctgg gacgtggtgg ctcgatgctg
     1441 gggaccaaga ggacactgcc caagccccac ctggaggcca ttgtggagaa tctccgcacc
     1501 tacaacatcc acgccctgct ggtgattggt ggctttgagg cctacgaggg tgtgctgcag
     1561 ctggtggagg cccgggggcg ctacgaggaa ctctgcattg tcatgtgtgt catcccagcc
     1621 accatcagca acaatgtgcc tggcactgac ttcagcctgg gctcagacac ggctgtcaac
     1681 gctgcaatgg agagttgtga tcgcatcaag cagtcagcct cagggacaaa gcggcgtgtg
     1741 ttcattgtag agaccatggg gggctactgt ggctacctgg ctactgtgac cggcattgct
     1801 gtgggtgccg atgctgccta cgtctttgag gaccctttca acatccatga cttaaaggcc
     1861 aatgtggagc atatgacaga gaagatgaag acagacatcc agaggggact ggtgctccgg
     1921 aacgagaagt gtcacgaaca ctacaccaca gagttcctat acaacctgta ctcctcagaa
     1981 ggcaggggcg tgtttgactg caggaccaat gtgctgggcc acttgcagca gggtggtgct
     2041 ccaacccctt tcgaccggaa ctatgggacc aaactggggg tgaaggccat gttgtgggtg
     2101 tctgagaagc tacgtgatgt ctaccgtaaa gggcgggtgt ttgccaatgc tccagactca
     2161 gcctgtgtga tcggcctgcg gaagaaggta gtggccttca gtccggtcac agaactcaag
     2221 aaagagactg attttgagca ccgcatgccc cgggagcagt ggtggctgaa tctgcggctg
     2281 atgctgaaga tgctggcaca ctaccgcatc agcatggcag actatgtgtc tggggagctg
     2341 gagcacgtca cacgccgcac cttgagcata gacaagggtt tctgagctta ctgtcactac
     2401 tgttcctgcg ttcccggact ctcaccctcc cagtgctagc cacagatccc agcaccgagg
     2461 ggaactcaag gggaactcgg agcccgtggc tggctgaggg atgtgggggt ctactgtgct
     2521 gctctggggc tcttcccttn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnncc
     2581 ctacctttca gtcagaccca cattgcctct ccctcactgg ccagctggct gcctcaccac
     2641 acggctgaaa agagcctcac ttttttagaa ataaagtcac ctgtctag
     MATVDLEKLRMSGAGKAIGVLTSGGDAQGMNAAVRAVTRMGIYV
     GAKVFLIYEGYEGLVEGGENIKPANWLSVSNIIQLGGTIIGSARCKAFTTREGRLAAA
     YNLLQHGITNLCVIGGDGSLTGANIFRNEWGSLLEELVKEGKISESTAQNYAHLTIAG
     LVGSIDNDFCGTDMTIGTDSALHRIMEVIDAITTTAQSHQRTFVLEVMGRHCGYLALV
     SALASGADWLFIPEAPPEDGWENFMCERLGETRSRGSRLNIIIIAEGAIDRHGKPISS
     SYVKDLVVQRLGFDTRVTVLGHVQRGGTPSAFDRILSSKMGMEAVMALLEATPDTPAC
     VVSLSGNQSVRLPLMECVQVTKDVQKAMDEERFDEAIQLRGRSFENNWKIYKLLAHQK
     VSKEKSNFSLAILNVGAPAAGMNAAVPSAVRTGISEGHTVYIVHDGFEGLAKGQVQEV
     GWHDVAGWLGRGGSMLGTKRTLPKPHLEAIVENLRTYNIHALLVIGGFEAYEGVLQLV
     EARGRYEELCIVMCVIPATISNNVPGTDFSLGSDTAVNAAMESCDRIKQSASGTKRRV
     FIVETMGGYCGYLATVTGIAVGADAAYVFEDPFNIHDLKANVEHMTEKMKTDIQRGLV
     LRNEKCHEHYTTEFLYNLYSSEGRGVFDCRTNVLGHLQQGGAPTPFDRNYGTKLGVKA
     MLWVSEKLRDVYRKGRVFANAPDSACVIGLRKKVVAFSPVTELKKETDFEHRMPREQW
     WLNLRLMLKMLAHYRISMADYVSGELEHVTRRTLSIDKGF
     source          1..2688
     gene            1..2688
     mRNA            <1..2688
     CDS             43..2385

DROME: Pfk
        1 agcttataga ttcagcttgt accatgccag gaataacatg aggattaacg cgcacgttca
       61 tttctgggtc tgtcaccggc gcggctaaat ttacaacttg ctgccagaat gtgccgccaa
      121 gaaccgcggt ttgtgccgga cgcacaacgc cttaacccaa ggcaaccaag ctgcagctgc
      181 ctcctccaag caccaccgga gtgcccgcct tagcagccag cagtttccgc cgctttgtga
      241 acttaccacg cccagcaatg tgccggtttc tttgacagga gaaagaatat cggtcatcgt
      301 aggccagcca tatccagcaa tgcaggtttc cagtcacggg tggttagatc aagaagtccc
      361 gtggtgccag cgttagaggg atcaacagct gaacgattgt gggtcgaacg taaacaaatt
      421 ggttaaacgc tattttccgc tcgttgctag tcgcgaaagt cgttcataac agacagaatc
      481 ctcagatttt cgacctaaat caaaccaagt tagggcaatc gcgttggagc gaactcttgg
      541 gcggatttag ccatccgaag tttgcattgc atcagtacgc acttacagaa agcccgtggc
      601 tgtgtgctgt gtccgtgtgt gttgtgtatg cgtctctggc ctgaaggtca ccttgaagct
      661 caaagcaaag cgaactgtga ataccgcctg cgagcggtat atattgctag taactgaaaa
      721 gccacggcaa ggagacgtag tagtagtatt tatagcccac ttgatataac ccagctccag
      781 cggcgctgct cgcatagttg caaaactccc taccgagtac aatagtggtt catagtgtgt
      841 gctttgtgcg atatccgtta cgaccccagt ttgatttaca tatagtgcaa aagattgaaa
      901 aatgaattcc gagattaatc aacgattcct ggcccgcggc tcgcagaagg acaaaggact
      961 ggcggtcttc accagcggcg gggattccca gggcatgaat gccgccgtgc gagcctgtgt
     1021 ccgtatggcc atctatttgg gctgcaaggt gagttggtga cctctgtcaa gtacttccgc
     1081 ccacgcagat cgcgtccggt gaccccgatc ccaggcacag gcaacaaacc catagtgaac
     1141 ccagaaattt cgtgaaacac ctggtaattt gcttatcagc agccgttaaa ccacgattat
     1201 tgggccgcaa agccagttag ataatctcca atcggtgcga aaagaaattc aagaatatat
     1261 gtgtacatgc acattgacat tgggtttatt ttcgggtcct cacatgcgat tttcgatttt
     1321 cggctaattt gtttcgtttt tttgttgtcg ctcttggttt ctattcggtt tatttaaatg
     1381 agttctttaa tttgttaggg aacttcttgc ccggccgttg gctccctcga aatatcgaaa
     1441 atgtgtcaat taacgtagcc aatttaaatt gataaactat tcatttgatt caatttctgg
     1501 ggcataaagt aaagtattgc tgccttgcat gaccagcgct tgaatatggt tcaataaatt
     1561 gacaaattaa taaatatatc atggtatgct aaacaaatgg ttcctaatca gttcaataat
     1621 ctaacctttg tttttaatct actagtgcct tggcatcatt attgtttatg ttattttttc
     1681 acttttcaaa ttaagagcgt tataaaattt gaattccctt ggttatctga gttgcttaaa
     1741 aagtatcgat ttaacatcga ttacattgta attacctgta acggtatttt gaatatgcaa
     1801 atgttttgtt gtttaaaact taaacttatc agtaaaagtt gagaaaagta tatgagataa
     1861 gtcatatcat attaatttct attgactgtt ctttactgac ttcctattaa atattacgac
     1921 tttggcagag tgaaatgaaa ttaaataatt tatactcgaa ttcggtgatt catttttaat
     1981 tgtgctaatg atgtcatgtg ccatgaagat accaaactct attctgtttt acaccatatc
     2041 tacaattgat tcgtgtttac ttcggcaagg tctacttcat tcgtgaaggc taccagggca
     2101 tggtggatgg tggcgactgc atcaggaagt ccaactgggc ctcagtctca tccattattc
     2161 cattcgttgg ttggcaccat ccattgctcc gccctttgcc agacttccgt gagcgtcagg
     2221 gtcgcttgaa agccgctaac aacctgattc agcgaggaat caccaatctg gtggtcattg
     2281 gaggcgatgg ctccctcacg ggcgccaatc tgttgcctca ggagtggtcc agcctgttgg
     2341 acgagctggt caagaacaag accattacca ccgagcagca ggaaaagttc aatgtcctgc
     2401 acatgcttgg attggtatgc tacacagagt attccttgga tatattttct tatggatgaa
     2461 tctttttgta ggttggctcc atcgacaacg atttctgtgg cactgacatg accatcggca
     2521 cggacacggc actgcatcgc atcatcgagc aatcgaaggc taaggtccaa tctccagtac
     2581 agcctaactc ccatcagcgc accttcatca tggaaggtca ggtgtctcat tgcgggtaag
     2641 ttgatctctg agcggatatt gcgaggaaaa gttggatgcc tctgtattag cctaagtgtc
     2701 agtgattaaa ttgggatttt agctaatgcc tggaacgact atctctagct atctttcggt
     2761 ggtagctggc attatctccg aaggcaagac tacgtctttc tgcccgagtc tcctccgcag
     2821 ccgattggcc cgatcgactt gtccttaaat tggaacaggc aagcccaaaa cggaaatctg
     2881 ttgaatgtcg tcgactcatt tcgcacattt ctgtttctat ggccgcagta ctatgtcgat
     2941 cgatccccat atcctccaaa atcccatccc ccttttgact aatattttgt aatatatatt
     3001 tttgcagcta tttagctctt gtgggtggac tggcgtgcga ggcgattcat attcatccga
     3061 atgcgccagg tcgattaggc cagacaggct ctgctctcag ctggacccag gtcaggaaga
     3121 tgagctccat ttccattcca tcaagtcact ggagaagtcc gaaaggcatc ggaaatatgt
     3181 tctcgagaga cttggtatag gatttaggat attcttatta atatagccag ttagctgtcg
     3241 aagataatat tcctgtttga gatagagttg tatacttcag tgcagttgtc gttgcttgat
     3301 gcttaagtag tacacctgta cacaattttt tgaaagacac attttaagag cgacacttgc
     3361 catacaaagc ttggttctta tttctgctta ctgcacacga atgtatcttt aaacacaaac
     3421 cggagatacg gaatgaatta cgcacagttt ttgatctgta ccagcataca aaatcatatg
     3481 taactaactt aagtttaccc agatactcca atcccggata atatctcccg acattgtgaa
     3541 ccatctttat tttgtaccta actcttgttt ttagttacta gccatatcgg cagccaatag
     3601 gccacagagg ctgatttatg ttcatacccg agagccggtg tcagtcaatt ggaaggacag
     3661 atctgtgtca agctccacca ggtcaggtcc agagtccttc gctatccaat taatttctag
     3721 ctactctttt gtcaaatttt tgaatttcta aattttattc tgcattgttt ttggactatt
     3781 cgatgtgccg aaatttccat ggtggcgata aacagcttta acagctattt gatttacttg
     3841 tttgggtttt cggtctctgt ttttgagtac cactatgatc tcactgagtt cccttactaa
     3901 cttttccaaa tccactaacg tccatcctcg ttaatcgatc gtaaatcttc atcaatgttt
     3961 ctattcatcg acttgactga tcggctaagg atcggctcaa gtcaacgtta atctaatcat
     4021 gaagcccgca ttatgatcga actgaatcat gaatatcata gaataacgtg agtactttag
     4081 aacgcatgca ctcatcgctt gctgatacac atttggtgac actattcaac attgtaagca
     4141 aagcatatgt aaactacatt attgtatgat gatgtctact catcatgccc tcttcataat
     4201 tcgtttgtgc ttttgtagtt tctgtatcat ccacgattag tatcttacat atatgcttaa
     4261 atgaatccct tcaccattga ccaacaggag cgatctgctg gccagcgtct gaacatcgtg
     4321 attgtggccg agggagccat ggatcgcgag ggtcatccca tcacagccga ggatgtaaag
     4381 aaggtgatcg acgagcgtct gaagcacgat gcccgcatca ctgtcttggg tcacgtgcag
     4441 cgcggtggca atcccagtgc cttcgatcgt tttttggtaa gtatttatac gaagatgacc
     4501 tcaataactg tatttttagt aatttacaat gctagctagt tttagattgt atcttttaaa
     4561 ggttaatatt aaaacactaa agttaccaaa ataaggatat acttattaag atatgattca
     4621 atctattttt gacttgagag ttaatgcttc taccccgcat aggcttgccg catgggagct
     4681 gagccacttt ggcccttgat ggaggccacc aaggactcgg tgccagtggt catctctctg
     4741 gacggcaacc aggcggttcg cgtgccgctg atggagtgcg tggagcgcac ccaggctggc
     4801 aaggccatgg cggagaaacg ctgggcggat gccgtcaacg tgcgcggacg ctccttcgag
     4861 cggaatctgg agacctacaa gatgctgacg cgcttgaagc cgcccaagga gaacttcgac
     4921 gccgatggca agggaatcga aggataccgc ctagctgtga tgcatattgg tgctccggct
     4981 tgcggtatga atgccgctgt gcgcagcttc gtgcgcaatg ccatctaccg cggtgatgtg
     5041 gtttatggaa tcaacgacgg tgtcgagggt ctgattgcgc gaaatgtccg cgagctgggc
     5101 tggtaagtaa tccgacaagg gatcactcta aatcgtgtct taatgcaatt caatttcagg
     5161 tcggatgtct caggatgggt tggtcagggt ggcgcctact tgggatccaa acgcacactg
     5221 cctgagggca agttcaagga gatcgccgct cgtctcaagg agtttaagat ccagggtctc
     5281 ctgatcattg gtggctttga gagttaccat gccgccggac agatcgccga tcagcggaca
     5341 actacccaca gcttctgcat ccccattgtg gttattccat cgacgatttc gaacaatgtg
     5401 cccggcacag aattttctct gggatgcgac accggtttaa atgagattac ggagatttgc
     5461 gaccgtatcc gtcagtcggc acagggaacc aagcgccgag tgttcgtcat tgagacgatg
     5521 ggtggctact gtggctattt gccaccgttg gccggtttgg ccggcggagc tgatgccgcc
     5581 tacatctacg aggagaagtt ctccatcaag gagctgcagc aggatgtcta ccacatgcct
     5641 ccaagatggc cgaggcgtct cccgcggtct aatcctgcga acgagaaggc tagcgagaac
     5701 tacagcacgg acttcattta ccgcctgtac tcggaggagg gcaagggcct cttcacctgc
     5761 cgtatgaaca tcctgggtca catgcagcag ggcggctcac ccactccctt cgaccgcaac
     5821 atgggcacca aaatggccgc caagtgtgtc gactgctggc cgcccagatc aaggcgaaca
     5881 tcgacggcca acggtgtggt caactgcaag tccccggaca ccgccacgct gctgggaatc
     5941 gtgtcgcggc agtaccgctt ctcaccgctg gtcgacctca ttgcagagac gaacttcgag
     6001 taagtttaac ccgatggtca ccacaaaggg gactatgaat tccctttaag ctcttggcat
     6061 aacccactcc tcttccagtc aacgcatccc gaagaagcag tggtggctgc gcctgcgtcc
     6121 cctgctgcgc atcctggcca agcacgattc cgcctacgag gaggagggta tgtacatcac
     6181 cgtcgaggag gagtgtgaca ctgacgccgt cgcctaagcg gactcggatc cggactctga
     6241 tccccacttc cgcttatcac caccatcgct gcatgcaagc atcaatgtcc acctatccgc
     6301 accctcgaat cagtctctgt gttcgctttt taagttgttt tggcaccgca tccgatccgt
     6361 tttatggttt ttaccaagat cagacgaaga ggcccatgac agcagcacat acgaaagtat
     6421 ttcataatct acagacgcat aaaaaagcac aaatacataa cttatttata ttgctcgcca
     6481 gtcgattctt tcttatgatt tttccaaata tcgtgtattc ttgaaatttg aatctcgaat
     6541 actgaataac gttaatagtt cattctacat tgcagccgtt ccgaagagtc tggcgaccta
     6601 ttagcggaaa acgtttcgta tattatcgta attgttggtt cttcagccca actaaattaa
     6661 atgttaaagt atttagacaa tttacccagt caaaggaaca aattctatct gcaaactgtt
     6721 tttcgagtat tgttatcgaa cgaagcaatg atctatttgt aacgacgtgc taaatacata
     6781 tcaaacacct gttggcacaa tttatcgtcg tttgttttct aattgttcag taggtatgtg
     6841 ggaattgagc ttgaatttca cttttggtta agaaaacatt tatttttgaa atggcttgct
     6901 gggcgcgatt ggaacagcaa tgtttcagtg gaatcagcct ataatacgat gtttctgcag
     6961 caacttcact gcttgcaagc tatcggctca atcgattgtg gtgccatcga tgcgcttcca
     7021 gcctagacac ttgacttttt gcacggatgt gtatgtagtt tattgtgctc gaaactgcgt
     7081 aagtgatgtc agcgtgactg a
     MNSEINQRFLARGSQKDKGLAVFTSGGDSQGMNAAVRACVRMAI
     YLGCKVYFIREGYQGMVDGGDCIRKSNWASVSSIIPFVGWHHPLLRPLPDFRERQGRL
     KAANNLIQRGITNLVVIGGDGSLTGANLLPQEWSSLLDELVKNKTITTEQQEKFNVLH
     MLGLVGSIDNDFCGTDMTIGTDTALHRIIEQSKAKVQSPVQPNSHQRTFIMEGQVSHC
     GYLALVGGLACEAIHIHPNAPGRLGQTGSALSWTQRSAGQRLNIVIVAEGAMDREGHP
     ITAEDVKKVIDERLKHDARITVLGHVQRGGNPSAFDRFLACRMGAEPLWPLMEATKDS
     VPVVISLDGNQAVRVPLMECVERTQAGKAMAEKRWADAVNVRGRSFERNLETYKMLTR
     LKPPKENFDADGKGIEGYRLAVMHIGAPACGMNAAVRSFVRNAIYRGDVVYGINDGVE
     GLIARNVRELGWSDVSGWVGQGGAYLGSKRTLPEGKFKEIAARLKEFKIQGLLIIGGF
     ESYHAAGQIADQRTTTHSFCIPIVVIPSTISNNVPGTEFSLGCDTGLNEITEICDRIR
     QSAQGTKRRVFVIETMGGYCGYLPPLAGLAGGADAAYIYEEKFSIKELQQDVYHMPPR
     WPRRLPRSNPANEKASENYSTDFIYRLYSEEGKGLFTCRMNILGHMQQGGSPTPFDRN
     MGTKMAAKCVDCWPPRSRRTSTANGVVNCKSPDTATLLGIVSRQYRFSPLVDLIAETN
     FDQRIPKKQWWLRLRPLLRILAKHDSAYEEEGMYITVEEECDTDAVA
     source          1..7101
     regulatory      698..704
     exon            719..1048
     5'UTR           719..901
     gene            join(902..1048,2070..2414,2472..2635,3008..3110,
                     4291..4476,4663..5102,5160..5999,6079..6217)
     CDS             join(902..1048,2070..2414,2472..2635,3008..3110,
                     4291..4476,4663..5102,5160..5999,6079..6217)
ARATH, ASPOR, BACTN, CAEEL, CANAX, CLOPE, KLULA, KOMPG, LACLL, NOSS1, PICPA, SYNY3, THET8, YEAST, ARATH, ASPOR, BACTN, CAEEL, CANAX, CLOPE, KLULA, KOMPG, LACLL, NOSS1, PICPA, STRCO, SYNY3, THET8, YEAST, ARATH, BACTN, STRCO, ARATH, ARATH, ARATH, ARATH, BOVIN, HUMAN, MOUSE, PONAB, L_RAT, BOVIN, CANLF, HORSE, HUMAN, MACFA, MOUSE, M_PIG, PONAB, RABIT, M_RAT, HUMAN, MOUSE, PONAB, RABIT, P_RAT, ACTP2, ACTP7, ACTPJ, ACTSZ, ALIF1, ALIFM, ALISL, ALKMQ, ALKOO, AMYME, ANAVT, ANOFW, AQUAE, ASPFU, ASPNG, BACAA, BACAC, BACAH, BACAN, BACC0, BACC1, BACC2, BACC3, BACC4, BACC7, BACCE, BACCN, BACCQ, BACCR, BACCZ, BACHD, BACHK, BACLD, BACP2, BACSK, BACSU, BACVZ, BACWK, BAUCH, BLOFL, BORBU, BREBN, BUCA5, BUCAI, BUCAP, BUCAT, BUCBP, BUCCC, CALFI, CALS4, CHLAA, CHLAD, CHLSY, CITK8, CLOAB, CLOB1, CLOB6, CLOBA, CLOBB, CLOBH, CLOBJ, CLOBK, CLOBL, CLOBM, CLONN, CLOTE, COREF, CORGL, COXBU, CROS8, CYTH3, DEIRA, DICDI, DROME, ECO24, ECO27, ECO45, ECO55, ECO57, ECO5E, ECO7I, ECO81, ECO8A, ECOBW, ECODH, ECOHS, ECOL5, ECOL6, ECOLC, ECOLI, ECOLU, ECOSE, ECOSM, EDWI9, ENT38, ENTCL, ENTFA, ENTHI, ERWT9, ESCF3, FINM2, FUSNN, GEOKA, GEOSE, GEOSW, HAECO, HAEDU, HAEI8, HAEIE, HAEIN, HAEPS, HAES1, HALOH, HAMD5, HISS2, KLEP3, KLEP7, LACAC, LACCB, LACDE, LACGA, LACH4, LACJO, LACLA, LACLM, LACLS, LACP3, LACPL, LACS1, LEIDO, LISIN, LISMC, LISMF, LISMH, LISMO, LISW6, LYSSH, MACCJ, MANSM, MYCBO, MYCCT, MYCGE, MYCH2, MYCH7, MYCHJ, MYCLE, MYCMO, MYCPE, MYCPN, MYCPU, MYCTO, MYCTU, NATTJ, OCEIH, PAEMC, PASMU, PECAS, PECCP, PEDPA, PEPD6, PERMH, PHOPR, PROFC, SALA4, SALAR, SALCH, SALDC, SALEP, SALG2, SALHS, SALNS, SALPA, SALPB, SALPC, SALPK, SALSV, SALTI, SALTY, SCHMA, SCHPO, SERP5, SHIB3, SHIBS, SHIDS, SHIFL, SHISS, SODGM, SPICI, SPITD, STAA2, STAA8, STAA9, STAAB, STAAC, STAAE, STAAM, STAAN, STAAR, STAAS, STAAT, STAAW, STACT, STAEQ, STAES, STRA1, STRA3, STRA5, STRE4, STREM, STRGC, STRMU, STRP1, STRP2, STRP3, STRP4, STRP6, STRP7, STRP8, STRPB, STRPC, STRPD, STRPF, STRPG, STRPI, STRPJ, STRPM, STRPN, STRPQ, STRPS, STRPZ, STRR6, STRS7, STRSV, STRSY, STRTD, STRTR, STRU0, STRZJ, STRZP, STRZT, SULDN, SULNB, SULSY, TERTT, THEEB, THEMA, THENN, THEP1, THEP3, THEPX, THESQ, THET2, TOLAT, TREPA, TRYBB, TRYBO, TRYCC, UREPA, VIBCB, VIBCH, VIBPA, VIBVU, VIBVY, WHEAT, WOLSU, YARLI, YERE8, YERP3, YERPA, YERPB, YERPE, YERPG, YERPN, YERPP, YERPS, YERPY, ECOLI, MYCTO, MYCTU, THETC, 

#### 3.1.1.31
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: PGLS
        1 ccgccgccgc cctcgccatg gccgcgccgg ccccgggcct catctcggtg ttctcgagtt
       61 cccaggagct gggtgcggcg ctagcgcagc tggtggccca gcgcgcagca tgctgcctgg
      121 caggggcccg cgcccgtttc gcgctcggcc tgtcgggcgg gagcctcgtc tcgatgctag
      181 cccgcgagct acccgccgcc gtcgcccctg ccgggccagc tagcttagcg cgctggacgc
      241 tgggcttctg cgacgagcgc ctcgtgccct tcgatcacgc cgagagcacg tacggcctct
      301 accggacgca tcttctctcc agactgccga tcccagaaag ccaggtgatc accattaacc
      361 ccgagctgcc tgtggaggag gcggctgagg actacgccaa gaagctgaga caggcattcc
      421 aaggggactc catcccggtt ttcgacctgc tgatcctggg ggtgggcccc gatggtcaca
      481 cctgctcact cttcccagac caccccctcc tacaggagcg ggagaagatt gtggctccca
      541 tcagtgactc cccgaagcca ccgccacagc gtgtgaccct cacactacct gtcctgaatg
      601 cagcacgaac tgtcatcttt gtggcaactg gagaaggcaa ggcagctgtt ctgaagcgca
      661 ttttggagga ccaggaggaa aacccgctgc ccgccgccct ggtccagccc cacaccggga
      721 aactgtgctg gttcttggac gaggcggccg cccgcctcct gaccgtgccc ttcgagaagc
      781 attccacttt gtagctggcc agagggacgc cgcagctggg accaggcacg cggcccatgg
      841 ggctgggccc ctgctggccg ccactctccg ggctctcctt tcaaaaagcc acgtcgtgct
      901 gctgctggaa gccaacagcc tccggccagc agccctaccc ggggctcaac acacaggctg
      961 tggctctgga catccggata ttaaaaggag cgttgctgga aaaaaaaaaa
      MAAPAPGLISVFSSSQELGAALAQLVAQRAACCLAGARARFALG
     LSGGSLVSMLARELPAAVAPAGPASLARWTLGFCDERLVPFDHAESTYGLYRTHLLSR
     LPIPESQVITINPELPVEEAAEDYAKKLRQAFQGDSIPVFDLLILGVGPDGHTCSLFP
     DHPLLQEREKIVAPISDSPKPPPQRVTLTLPVLNAARTVIFVATGEGKAAVLKRILED
     QEENPLPAALVQPHTGKLCWFLDEAAARLLTVPFEKHSTL
     source          1..1010
     gene            1..1010
     CDS             18..794

MOUSE: Pgls
        1 ggccgggaac accgccgcct ccccaccgcc atggcagcac ccgcgcccag tctcatctcg
       61 gtcttctcca gcccgcaaga gctgggcgcg tcgctggcgc agctggtggc gcagcgggcc
      121 gcgagctgcc tggaagggga ccgtggccgc ttcgcgcttg gtctgtcagg cggcagcctg
      181 gtctccatgc tagcccgaga cctgcccgcc gccgccgctc ccgctggacc agccagcttt
      241 gcgcgctgga cgctcggctt ctgcgacgag cgcctcgtgc ccttcgacca cgccgagagc
      301 acgtacggcc tctaccggac acacctgctc tcaaagctgc ccatcccaga cagccaggtc
      361 cttaccatca atcctgccct acctgtggag gatgctgcag aggactatgc caggaaactg
      421 agacaggcct tgcaaggaga cgctgtccct gtgtttgacc tgctgatcct gggagtgggc
      481 cctgacggcc atacctgttc gctcttccct gaccatcccc tcctacagga gcgggagaag
      541 atcgtggctc ccatcagtga ctccccaaag ccaccaccgc agagggtgac cctaacgctt
      601 cctgtgctga acgcagccca aagtatcatc tttgtggcca cgggggaagg caaggcagct
      661 gtgctgaagc gcatcctgga ggacaaggag ggcacgttgc ccgccgcctt ggtgcagccg
      721 cgcacgggcg ccctctgctg gttcctggac gaggcagctg cccggctgct gtctgtgccc
      781 ttcgagaagc attccacatt gtagggggtg cgccatgcac gccgtgggca cttcgggtgt
      841 tgtgggagcg gactagctgc ggattaaaca gctttgctgg
      MAAPAPSLISVFSSPQELGASLAQLVAQRAASCLEGDRGRFALG
     LSGGSLVSMLARDLPAAAAPAGPASFARWTLGFCDERLVPFDHAESTYGLYRTHLLSK
     LPIPDSQVLTINPALPVEDAAEDYARKLRQALQGDAVPVFDLLILGVGPDGHTCSLFP
     DHPLLQEREKIVAPISDSPKPPPQRVTLTLPVLNAAQSIIFVATGEGKAAVLKRILED
     KEGTLPAALVQPRTGALCWFLDEAAARLLSVPFEKHSTL
     source          1..880
     CDS             31..804
     regulatory      863..868
     polyA_site      880

DROME: CG17333
        1 caatatgtcg gagaaaaagg gtgcgctaaa agtaatcccg tccgcttcgg aggagcaact
       61 tgtccaggcc ctgggcgatc ttctccagcg ctgctcccag gaggcgctgg ccaaacatga
      121 taagttcagc gtgggacttt cgggtggttc cctcgtccag ttgctaacga aagccctgaa
      181 atcgtgcaac ttaaaaacgg ccaaatgggt gtttttcttc tgtgacgagc ggtatgttcg
      241 cctggatgac agcgattcca cctatggtgc ctacagggcc gagtggctaa cccaattgcc
      301 ctgcatccag gaatcccagt tcgtccgcgc cgataccagc caaccgctgg acgcctgcgc
      361 cgcagattac gaggcgaagg tcaaaagtca agtcgatcgc ttcgatctgc tgctgcttgg
      421 catgggaccc gatggccaca cctgctccct ctttcccgag cagccagcca ccctgcagga
      481 gaccaagcgc ctggttatcc ccatccggaa ctcgcccaag ccgcctcccg agcggatcac
      541 tttcaccctg ccgctgatca ataaggcacg gaatgtcgcc ttcgtggtta cgggcgccgc
      601 aaaagccagt gtcgtcaaga gtgtgtttgt cgatctggac aagaagtttc ccgctgcgtg
      661 ggtgaatccg accaaagggc agttgacatt gattgtggac gcgggtgctg gaaaagaaat
      721 tgaaacctta aaatgacatt ccttagttaa ctatcgcatc ttgtaaataa taattacctt
      781 gataatctta aaaaaaaaaa aaaaaaa
      MSEKKGALKVIPSASEEQLVQALGDLLQRCSQEALAKHDKFSVG
     LSGGSLVQLLTKALKSCNLKTAKWVFFFCDERYVRLDDSDSTYGAYRAEWLTQLPCIQ
     ESQFVRADTSQPLDACAADYEAKVKSQVDRFDLLLLGMGPDGHTCSLFPEQPATLQET
     KRLVIPIRNSPKPPPERITFTLPLINKARNVAFVVTGAAKASVVKSVFVDLDKKFPAA
     WVNPTKGQLTLIVDAGAGKEIETLK
     source          1..807
     gene            1..807
     misc_feature    1..789
     CDS             5..736

Other animals
ARATH, ORYSI, ORYSJ, ARATH, ORYSI, ORYSJ, ARATH, ORYSI, ORYSJ, ARATH, ORYSI, ORYSJ, ARATH, AGGAC, ARTBC, BACSU, BLOFL, BLOPB, BORBU, BOVIN, BUCA5, BUCAI, BUCAP, BUCAT, BUCBP, CAEEL, CAUVC, CHLMU, CHLPN, CHLTR, CITK8, CROS8, DICDI, DROME, ECO24, ECO27, ECO45, ECO55, ECO57, ECO5E, ECO7I, ECO81, ECO8A, ECOBW, ECODH, ECOHS, ECOK1, ECOL5, ECOL6, ECOLC, ECOLI, ECOLU, ECOSE, ECOSM, ECOUT, ENT38, ERWT9, ESCF3, HAEIN, HELPJ, HELPY, HUMAN, KLEP3, KLEP7, MOUSE, MYCBO, MYCLE, MYCTO, MYCTU, NEIMA, NEIMB, NOSS1, PECAS, PECCP, PHOLL, PSEAE, PSEPU, L_RAT, RHILO, RHIME, SALA4, SALAR, SALCH, SALDC, SALEP, SALG2, SALHS, SALNS, SALPA, SALPB, SALPC, SALPK, SALSV, SALTI, SALTY, SCHPO, SERP5, SHIB3, SHIBS, SHIDS, SHIF8, SHIFL, SHISS, SODGM, STRCO, SYNY3, THEMA, TREPA, XENNA, XYLFA, XYLFT, YERE8, YERP3, YERPA, YERPB, YERPE, YERPN, YERPP, YERPS, YERPY, HUMAN, MOUSE, RABIT, PLAF7, YEAS1, YEAS6, YEAS7, YEAST, YEAST, 

#### 4.1.2.13
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: ALDOA
        1 agtaccgggt acgcaggggt gcctcaacca cactccgtcc acggactctc cgttatttta
       61 ggaggtccct ggccaaagat ttatttctct tgacaaccaa gggcctccgt ctggatttcc
      121 aaggaagaat ttcctctgaa gcaccggaac ttgctactac cagcaccatg ccctaccaat
      181 atccagcact gaccccggag cagaagaagg agctgtctga catcgctcac cgcatcgtgg
      241 cacctggcaa gggcatcctg gctgcagatg agtccactgg gagcattgcc aagcggctgc
      301 agtccattgg caccgagaac accgaggaga accggcgctt ctaccgccag ctgctgctga
      361 cagctgacga ccgcgtgaac ccctgcattg ggggtgtcat cctcttccat gagacactct
      421 accagaaggc ggatgatggg cgtcccttcc cccaagttat caaatccaag ggcggtgttg
      481 tgggcatcaa ggtagacaag ggcgtggtcc ccctggcagg gacaaatggc gagactacca
      541 cccaagggtt ggatgggctg tctgagcgct gtgcccagta caagaaggac ggagctgact
      601 tcgccaagtg gcgttgtgtg ctgaagattg gggaacacac cccctcagcc ctcgccatca
      661 tggaaaatgc caatgttctg gcccgttatg ccagtatctg ccagcagaat ggcattgtgc
      721 ccatcgtgga gcctgagatc ctccctgatg gggaccatga cttgaagcgc tgccagtatg
      781 tgaccgagaa ggtgctggct gctgtctaca aggctctgag tgaccaccac atctacctgg
      841 aaggcacctt gctgaagccc aacatggtca ccccaggcca tgcttgcact cagaagtttt
      901 ctcatgagga gattgccatg gcgaccgtca cagcgctgcg ccgcacagtg ccccccgctg
      961 tcactgggat caccttcctg tctggaggcc agagtgagga ggaggcgtcc atcaacctca
     1021 atgccattaa caagtgcccc ctgctgaagc cctgggccct gaccttctcc tacggccgag
     1081 ccctgcaggc ctctgccctg aaggcctggg gcgggaagaa ggagaacctg aaggctgcgc
     1141 aggaggagta tgtcaagcga gccctggcca acagccttgc ctgtcaagga aagtacactc
     1201 cgagcggtca ggctggggct gctgccagcg agtccctctt cgtctctaac cacgcctatt
     1261 aagcggaggt gttcccaggc tgcccccaac aactccaggc cctgccccct cccactcttg
     1321 aagaggaggc cgcctcctcg gggctccagg ctggcttgcc cgcgctcttt cttccctcgt
     1381 gacagtggtg tgtggtgtcg tctgtgaatg ctaagtccat caccctttcc ggcacactgc
     1441 caaataaaca gctatttaag gggg
     MPYQYPALTPEQKKELSDIAHRIVAPGKGILAADESTGSIAKRL
     QSIGTENTEENRRFYRQLLLTADDRVNPCIGGVILFHETLYQKADDGRPFPQVIKSKG
     GVVGIKVDKGVVPLAGTNGETTTQGLDGLSERCAQYKKDGADFAKWRCVLKIGEHTPS
     ALAIMENANVLARYASICQQNGIVPIVEPEILPDGDHDLKRCQYVTEKVLAAVYKALS
     DHHIYLEGTLLKPNMVTPGHACTQKFSHEEIAMATVTALRRTVPPAVTGITFLSGGQS
     EEEASINLNAINKCPLLKPWALTFSYGRALQASALKAWGGKKENLKAAQEEYVKRALA
     NSLACQGKYTPSGQAGAAASESLFVSNHAY
     source          1..1464
     gene            1..1464
     CDS             168..1262

MOUSE: Aldoa
        1 aagtccaagg gtggtgttgt gggcattaag gtagataagg gtgtggtgcc cctggcagga
       61 accaatggcg agacaactac ccaggggctg gatgggctgt ctgaacgctg tgcccagtat
      121 aagaaggatg gagccgactt tgccaagtgg cgctgtgtgc taaagattgg ggaacatact
      181 ccctcggccc tggccatcat ggaaaatgcc aatgtgctgg cccgttatgc cagcatctgc
      241 cagcagaatg gcattgtacc cattgtggag cctgaaattc tccctgatgg ggaccatgac
      301 ttgaagcgct gccagtatgt tactgagaag gtcctggcgg ctgtctacaa ggctctgagc
      361 gaccaccatg tctatctgga aggcacattg ctgaagccca acatggtcac ccctggccat
      421 gcttgcaccc agaaattttc caatgaggag attgccatgg caacggtcac agcacttcgt
      481 cgcacagtgc cccctgctgt cactggggtc actttcctgt ctggagggca gagtgaggaa
      541 gaggcatgca tcaacctcaa tgctatcaac aagtgccccc tgctgaagcc atgggccttg
      601 actttctcct atggtcgagc cctgcaggcc tctgctctaa aggcctgggg tgggaagaag
      661 gagaacctga aggcagccca ggaggagtac atcaagcgcg ccctggccaa cagcctcgct
      721 tgtcaaggaa agtatacccc aagtggccag tctggagccg cagccagtga at
      KSKGGVVGIKVDKGVVPLAGTNGETTTQGLDGLSERCAQYKKDG
     ADFAKWRCVLKIGEHTPSALAIMENANVLARYASICQQNGIVPIVEPEILPDGDHDLK
     RCQYVTEKVLAAVYKALSDHHVYLEGTLLKPNMVTPGHACTQKFSNEEIAMATVTALR
     RTVPPAVTGVTFLSGGQSEEEACINLNAINKCPLLKPWALTFSYGRALQASALKAWGG
     KKENLKAAQEEYIKRALANSLACQGKYTPSGQSGAAASE
     source          1..772
     CDS             <1..>772

DROME: Ald
        1 gaattcgata gctaacttat taaaacacaa tgtccgctac tctttttcat ccaacaaaat
       61 aacaccacac caaatcaaac gtaaatggat cttcgtgctg cagaactaca ctcgaatctc
      121 aaaaatgacc acgtacttca actaccccag caaggagctg caggatgagc tgcgcgaaat
      181 tgcccagaaa atcgtggccc ccggcaaggg tatcctcgcc gccgatgagt ccggtcccac
      241 ccatgggaag cgtctgcagg acatcggcgt ggagaacacc gaggacaacc gccgtgccta
      301 ccgtcagctg ttgttcagca ctgaccccaa gctggccgag aacatctctg gagtgattct
      361 gttccacgag accctctacc agaaggccga tgatggcacc cccttcgccg agatcctgaa
      421 gaagaaggga atcattctgg gcatcaaggt cgacaagggt gttgtcccac tgttcggctc
      481 tgaggatgag gtcaccaccc agggtctgga tgacctggcc gcccgttgcg cccagtacaa
      541 gaaggacggt tgcgacttcg ccaagtggcg ttgcgtcctg aagatcggca agaacacccc
      601 atcctaccag tcgatcctgg agaacgccaa tgtcctggcc cgctacgcct ccatctgcca
      661 gtcggagcgc atcgtcccta ttgtggagcc cgaggttctg cccgatggcg atcacgatct
      721 ggaccgcgcc cagaaggtca ccgagaccgt cctggccgcc gtctacaagg ccctgagcga
      781 ccaccacgtc tacctggagg gtactctgct gaagcccaac atggtcaccg ccggtcagtc
      841 ggccaagaag aacaccccag aggagatcgc tctggccacc gtgcaggctc tgcgccgtac
      901 cgttcccgcc gccgttactg gtgagtcatc aaatccaact gtaatctctg gattggaatg
      961 cattcacctt ggttttttgc aatgaatcct atgtaatcga ttgtttgtcc tacaggcgtg
     1021 accttcctgt ctggaggtca gtctcgtagg aggaggccac cgtcaacctg gtgccatcaa
     1081 caacgtcctg atccgccatg ggcccttgag cgaccaccac gtctacctgg agggtaccct
     1141 tctgaagccc aacatggtca ccgccggtca gtcggccaag aagaacaccc cagaggagat
     1201 cgctctgtta ccgtgcaggc tctctcgcac cgttcccgcc gccgttactt gtgagtcatc
     1261 aaattccaac tgtaatctct ggattggaat gcattcacct tgttttttgc aatgaatcct
     1321 atctaatcga ttgtttgtct acaggcgtga ccttcctgtc tggaggtcag tccgaggagg
     1381 aggccaccgt caacctgagt gccatcaaca acgttccctt gatccgccca tgggccctca
     1441 ccttctcgta cggtcgtgcc ctgcaggcct ccgtcctgcg tgcctgggct ggcaagaagg
     1501 agaacatcgc tgccggccag aacgagctgc ttaagcgcgc caaggtgagt ccttggatag
     1561 ttgatctatg cacgattggt tgcagttagc aatttaagtg gtgaatgtat taagagtgtc
     1621 aggtatatgc ttcggaagta ttccttgggc taagaaatat tatacatgta taatataaca
     1681 tacagcatat tcccagccat tgattccatt tccaatccca aatgacccca atcttcttct
     1741 aatcctctaa tcttatccct tttatttccc taccattatt tgtaaccttt ttttgctttt
     1801 gtacgtgaga cattaattca tcatcaataa ccacacatat catgccaggc taacggagag
     1861 gcggcttgtg gtaactatac agctggatcg gttaaggggt tcgctggaaa agatactttg
     1921 catgtggatg accacaggta ttgatcaaag gattgaagaa ttgctgcctt aagatggcga
     1981 tgaacaagct ttcatggggt aacttaagaa tcatagccgc ctttcaccaa atccgactta
     2041 tcgcaaatgc ctttaacata ctgtcctcgt gccactcatg ctcgcttgct ctaaacctaa
     2101 tccacaaaag ccaaaaatct gattaatccc aaccaaaatc ccgctctcct cccgcttcca
     2161 caggccaatt cccaggcctg ccagggtatt tacgtgcccg gctcaattcc gtcgtttgcc
     2221 ggcaatgcca acctctttgt cgcccagcac aaatactaag tcctaaatgc cacgcactaa
     2281 tcccgagtca caatcgagcg aagtatatcc caagcgaatc cagataatcc gcaagagtta
     2341 ctgatcgagg cccagctgga gacgggcaac atttatattc ctccaacaat ggaactgcaa
     2401 atatattcct tttatacatt tttacatttt accgaataaa ctgactagac cttaaagaaa
     2461 atatttttgg cgaacagaaa taaattatat atttctaata ataccttgct tatgcatttt
     2521 gtttacttta gttagcttta aacaaaaatt cgattttatt ttacctttta atttaattta
     2581 aatacatttt aattaaaaat gtcttgtcta actttattca ttaaagccct ttgcaaactt
     2641 cctactgtta attagaataa taattcggaa tatctgcacc tgacagttaa gttgaaaaca
     2701 acgtaaaatt cgttcggaga gctgttactt atatataacg aatcataatt ttcctccaaa
     2761 gaacttgcaa gattaaattt tccaaaactt tccgcagtac gcagcatgta ttcgtgcgct
     2821 tggatgcgtg gaaagttttt agaaaattgc ccgacggtgg aaaaagtggc ggaagttctt
     2881 cgagcgcagg caaaaatcag tgtgaaaact tttttatgct gggggaaaaa cttttttgct
     2941 gcggctcgcc aagttacaac taagtaataa ttaggagtag gcatttctca caacgaaatt
     3001 aatcaatttt ccccgctttc tttaccctcc tccaggccaa cggtgatgct gctcagggca
     3061 agtacgttgc cggcagcgct ggtgccggat ctggatccct gttcgtggcc aaccacgcct
     3121 actaaggtct tggtgtgacc ttggctacac gttactacaa aaaaaaaaat acgaagcaga
     3181 ttgctggaaa agtttggcag atttgtttat ttttacctta gtttcgagag ctaagcaaag
     3241 caagcattac aaaaaataac caaaaaaaaa aaagatgaac gattacactt tcaaaacatg
     3301 ttatatatat gtagtacgtg acatttttgc aagtttatta tattataaca ttattttaga
     3361 gaacaactaa atgatgagtg cagaagaaag gattgaatat gttcgatgga gaaacaattc
     3421 aacaattcaa acaattttat ctttagtttt aagcacataa acctattatt gttgaagtta
     3481 ttacatttct attctattat tatgattatg caagatttca atgaaaacaa aaggatatgt
     3541 cgtaaatcgc tagctaaagc acattttatg gtgaaaacaa cagcaatcac tatcagcaac
     3601 acctaaatgt atgaggcttg taacattgaa gtcgccgcgt tttttaattt ttttaatgtt
     3661 ttataaaaag tccactatga aaatcgatgt tttaccatta ttattattat taaactttat
     3721 atttatgatt gataaggtat aaggtgaaac aaatgacgag gataaacaaa cacattaaaa
     3781 taaacccgaa aagcccccaa aacaacttta ttaaccttat atacatatat ttacattgtt
     3841 aaaagagaac ttgttgttgc aaaatactaa aagaaatata tgaatttata tattcaacat
     3901 ttgacttcag tgtccaatgg cttctaaact gtgctggggc acaatgcttg ttactagaat
     3961 gtttttgaaa ccaactctga ttctctatcc aaaacgcgat gggtagtaac aaaggcagca
     4021 acgacattat cacagtacat atttaaatac aaaaatattg taccaatgac taacccacat
     4081 atttatcaaa tcatgtttta atttacacgt tattcaagtt gcaaattctg catatcgttg
     4141 ttattcacac aattgtttga agtgcaatgt gaaaatataa cagacacgag tgaaggatat
     4201 acaataatac ctaccggaag ggttaagctt aaaatagttt attgtgaaat aaaaaccacc
     4261 acaaacggca acaacaacca gctgtacagt ccaatataca agaaataaaa aacaacaaat
     4321 aaacatcatc cgcatacaag taatggtgta aagtaacatc tttcaataaa aaaccttaag
     4381 agcaaagaaa cccgaattgg tttaatttta ttgtattgtt ttaaaaagcg ttgcataact
     4441 ccaggcctga gttacagttt aaaaggtact gtgggcttaa aaccaagtca tctttctcat
     4501 tgaggttaca tgtagcattc gaagttctta tatcactgaa agtcaattag taataacctt
     4561 gggcagttgc tattaacata gccaaaggta aagccgcaga ccttgcaggt caacgcagaa
     4621 tctgtaccca atttcgagag ttttgtgtta cttaaattta caatttcgct tatttgtaat
     4681 gcaaatggaa gcaaaagcac agcgcgaaca gggttcgtaa tctgcaccgt gatccctttt
     4741 caattgggtt tgtggtattc gcgaggtgca aacttcgctt aatcacaccc aaatcaaatg
     4801 cgcaacggcc cagacagagc aactcgatga taagatgaca cagggatttt tagcatgttg
     4861 aaggggaatg aaacctgcac ggaaagaata ttccagacta attcagcatt cagattcact
     4921 taaaaatcta aaacgagcat ttaatacaag cataattttt ctaagtgtga atttaatgtt
     4981 cgattatggt caatttactc acgattgttt tcgggttact tctgatttat agcgctgggc
     5041 tgaacgactt gctacaccat tgcgtcattg attgccttcg tccaaagata ataaggaaac
     5101 ttcaaagtgt tcgtggaaca gttcgaccgc aactgtgctc ctcgttgggg ttaacagcca
     5161 caaaggggaa cggtaggaaa atccaacaaa aggtgctggc atttggcatc ctgatccaca
     5221 atccctgtgg cagtgtcaac atttcctgtg tcacacttgc actcgccctc acagacctgc
     5281 tggcacaaag attgtcacaa aagtggaatt aattgtattt gcataggatg taaacatcat
     5341 cacgttgccg gcaggatctt gtcctgcaac gtttctaaac tggattcagt atggctcgca
     5401 gcctttcgcc accttcatgt cactctgccg ccaacaaaca caaggggaaa tgcagtttag
     5461 gttgaaagag ttaagattaa tggaagcaat tgatactttt aaaaaatctt aagattaatt
     5521 agggcagctg taatttatga ttatttattt tagtataaat acttattagt tagttattag
     5581 gttgaatatt ccattatttg cagtgcattg acatacattg tatccatcga cttctgcggt
     5641 gcaatagtga ttttacctta ccctggcacg ttgctgtacg ctccaaggag aagcgtcgct
     5701 gcgtcctgaa ttc
     MTTYFNYPSKELQDELREIAQKIVAPGKGILAADESGPTHGKRL
     QDIGVENTEDNRRAYRQLLFSTDPKLAENISGVILFHETLYQKADDGTPFAEILKKKG
     IILGIKVDKGVVPLFGSEDEVTTQGLDDLAARCAQYKKDGCDFAKWRCVLKIGKNTPS
     YQSILENANVLARYASICQSERIVPIVEPEVLPDGDHDLDRAQKVTETVLAAVYKALS
     DHHVYLEGTLLKPNMVTAGQSAKKNTPEEIALATVQALRRTVPAAVTGVTFLSGGQSE
     EEATVNLSAINNVPLIRPWALTFSYGRALQASVLRAWAGKKENIAAGQNELLKRAKAN
     GDAAQGKYVAGSAGAGSGSLFVANHAY
     source          1..5713
     mRNA            join(<1..920,1345..1544,2164..2336,3036..3785)


### Citrate

#### 4.1.1.32
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: PCK1
atgcctcctcagctgcaaaacggcctgaacctctcggccaaagttgtccagggaagcctg
gacagcctaccccaggcagtgagggagtttctcgagaataacgctgagctgtgtcagcct
gatcacatccacatctgtgacggctctgaggaggagaatgggcggcttctgggccagatg
gaggaagagggcatcctcaggcggctgaagaagtatgacaactgctggttggctctcact
gaccccagggatgtggccaggatcgaaagcaagacggttatcgtcacccaagagcaaaga
gacacagtgcccatccccaaaacaggcctcagccagctcggtcgctggatgtcagaggag
gattttgagaaagcgttcaatgccaggttcccagggtgcatgaaaggtcgcaccatgtac
gtcatcccattcagcatggggccgctgggctcgcctctgtcaaagatcggcatcgagctg
acggattcaccctacgtggtggccagcatgcggatcatgacgcggatgggcacgcccgtc
ctggaagcagtgggcgatggggagtttgtcaaatgcctccattctgtggggtgccctctg
cctttacaaaagcctttggtcaacaactggccctgcaacccggagctgacgctcatcgcc
cacctgcctgaccgcagagagatcatctcctttggcagtgggtacggcgggaactcgctg
ctcgggaagaagtgctttgctctcaggatggccagccggctggccaaggaggaagggtgg
ctggcagagcacatgctgattctgggtataaccaaccctgagggtgagaagaagtacctg
gcggccgcatttcccagcgcctgcgggaagaccaacctggccatgatgaaccccagcctc
cccgggtggaaggttgagtgcgtcggggatgacattgcctggatgaagtttgacgcacaa
ggtcatttaagggccatcaacccagaaaatggctttttcggtgtcgctcctgggacttca
gtgaagaccaaccccaatgccatcaagaccatccagaagaacacaatctttaccaatgtg
gccgagaccagcgacgggggcgtttactgggaaggcattgatgagccgctagcttcaggt
gtcaccatcacgtcctggaagaataaggagtggagctcagaggatggggaaccttgtgcc
caccccaactcgaggttctgcacccctgccagccagtgccccatcattgatgctgcctgg
gagtctccggaaggtgttcccattgaaggcattatctttggaggccgtagacctgctggt
gtccctctagtctatgaagctctcagctggcaacatggagtctttgtgggggcggccatg
agatcagaggccacagcggctgcagaacataaaggcaaaatcatcatgcatgaccccttt
gccatgcggcccttctttggctacaacttcggcaaatacctggcccactggcttagcatg
gcccagcacccagcagccaaactgcccaagatcttccatgtcaactggttccggaaggac
aaggaaggcaaattcctctggccaggctttggagagaactccagggtgctggagtggatg
ttcaaccggatcgatggaaaagccagcaccaagctcacgcccataggctacatccccaag
gaggatgccctgaacctgaaaggcctggggcacatcaacatgatggagcttttcagcatc
tccaaggaattctgggagaaggaggtggaagacatcgagaagtatctggaggatcaagtc
aatgccgacctcccctgtgaaatcgagagagagatccttgccttgaagcaaagaataagc
cagatgtaa
MPPQLQNGLNLSAKVVQGSLDSLPQAVREFLENNAELCQPDHIHICDGSEEENGRLLGQM
EEEGILRRLKKYDNCWLALTDPRDVARIESKTVIVTQEQRDTVPIPKTGLSQLGRWMSEE
DFEKAFNARFPGCMKGRTMYVIPFSMGPLGSPLSKIGIELTDSPYVVASMRIMTRMGTPV
LEAVGDGEFVKCLHSVGCPLPLQKPLVNNWPCNPELTLIAHLPDRREIISFGSGYGGNSL
LGKKCFALRMASRLAKEEGWLAEHMLILGITNPEGEKKYLAAAFPSACGKTNLAMMNPSL
PGWKVECVGDDIAWMKFDAQGHLRAINPENGFFGVAPGTSVKTNPNAIKTIQKNTIFTNV
AETSDGGVYWEGIDEPLASGVTITSWKNKEWSSEDGEPCAHPNSRFCTPASQCPIIDAAW
ESPEGVPIEGIIFGGRRPAGVPLVYEALSWQHGVFVGAAMRSEATAAAEHKGKIIMHDPF
AMRPFFGYNFGKYLAHWLSMAQHPAAKLPKIFHVNWFRKDKEGKFLWPGFGENSRVLEWM
FNRIDGKASTKLTPIGYIPKEDALNLKGLGHINMMELFSISKEFWEKEVEDIEKYLEDQV
NADLPCEIEREILALKQRISQM

MOUSE: Pck1
atgcctcctcagctgcataacggtctggacttctctgccaaggtcatccagggcagcctc
gacagcctgccccaggcagtgaggaagttcgtggaaggcaatgctcagctgtgccagccg
gagtatatccacatctgcgatggctccgaggaggagtacgggcagttgctggcccacatg
caggaggagggtgtcatccgcaagctgaagaaatatgacaactgttggctggctctcact
gaccctcgagatgtggccaggatcgaaagcaagacagtcatcatcacccaagagcagaga
gacacagtgcccatccccaaaactggcctcagccagctgggccgctggatgtcggaagag
gactttgagaaagcattcaacgccaggttcccagggtgcatgaaaggccgcaccatgtat
gtcatcccattcagcatggggccactgggctcgccgctggccaagattggtattgaactg
acagactcgccctatgtggtggccagcatgcggatcatgactcggatgggcatatctgtg
ctggaggccctgggagatggggagttcatcaagtgcctgcactctgtggggtgccctctc
cccttaaaaaagcctttggtcaacaactgggcctgcaaccctgagctgaccctgatcgcc
cacctcccggaccgcagagagatcatctcctttggaagcggatatggtgggaactcacta
ctcgggaagaaatgctttgcgttgcggatcgccagccgtctggctaaggaggaagggtgg
ctggcggagcatatgctgatcctgggcataactaaccccgaaggcaagaagaaatacctg
gccgcagccttccctagtgcctgtgggaagactaacttggccatgatgaaccccagcctg
cccgggtggaaggtcgaatgtgtgggcgatgacattgcctggatgaagtttgatgcccaa
ggcaacttaagggctatcaacccagaaaacgggttttttggagttgctcctggcacctca
gtgaagacaaatccaaatgccattaaaaccatccagaaaaacaccatcttcaccaacgtg
gccgagactagcgatgggggtgtttactgggaaggcatcgatgagccgctggccccggga
gtcaccatcacctcctggaagaacaaggagtggagaccgcaggacgcggaaccatgtgcc
catcccaactcgagattctgcacccctgccagccagtgccccattattgaccctgcctgg
gaatctccagaaggagtacccattgagggtatcatctttggtggccgtagacctgaaggt
gtcccccttgtctatgaagccctcagctggcagcatggggtgtttgtaggagcagccatg
agatctgaggccacagctgctgcagaacacaagggcaagatcatcatgcacgaccccttt
gccatgcgacccttcttcggctacaacttcggcaaatacctggcccactggctgagcatg
gcccaccgcccagcagccaagttgcccaagatcttccatgtcaactggttccggaaggac
aaagatggcaagttcctctggccaggctttggcgagaactcccgggtgctggagtggatg
ttcgggcggattgaaggggaagacagcgccaagctcacgcccatcggctacatccctaag
gaaaacgccttgaacctgaaaggcctggggggcgtcaacgtggaggagctgtttgggatc
tctaaggagttctgggagaaggaggtggaggagatcgacaggtatctggaggaccaggtc
aacaccgacctcccttacgaaattgagagggagctccgagccctgaaacagagaatcagc
cagatgtaa
MPPQLHNGLDFSAKVIQGSLDSLPQAVRKFVEGNAQLCQPEYIHICDGSEEEYGQLLAHM
QEEGVIRKLKKYDNCWLALTDPRDVARIESKTVIITQEQRDTVPIPKTGLSQLGRWMSEE
DFEKAFNARFPGCMKGRTMYVIPFSMGPLGSPLAKIGIELTDSPYVVASMRIMTRMGISV
LEALGDGEFIKCLHSVGCPLPLKKPLVNNWACNPELTLIAHLPDRREIISFGSGYGGNSL
LGKKCFALRIASRLAKEEGWLAEHMLILGITNPEGKKKYLAAAFPSACGKTNLAMMNPSL
PGWKVECVGDDIAWMKFDAQGNLRAINPENGFFGVAPGTSVKTNPNAIKTIQKNTIFTNV
AETSDGGVYWEGIDEPLAPGVTITSWKNKEWRPQDAEPCAHPNSRFCTPASQCPIIDPAW
ESPEGVPIEGIIFGGRRPEGVPLVYEALSWQHGVFVGAAMRSEATAAAEHKGKIIMHDPF
AMRPFFGYNFGKYLAHWLSMAHRPAAKLPKIFHVNWFRKDKDGKFLWPGFGENSRVLEWM
FGRIEGEDSAKLTPIGYIPKENALNLKGLGGVNVEELFGISKEFWEKEVEEIDRYLEDQV
NTDLPYEIERELRALKQRISQM

DROME: Pepck2
atgctgaagaagggaaccatcattcctctgccgaagtacgagaattgctggctggcaaga
accaatccggcggatgtggctagagtggagggaaaaacgttcatctcaacggattcgaag
gagcagacagtaccggttacggagaaggccacaccgggaatgctgggtaactggatagcc
gaaaaggacatgcaggcggcgatcaaggaaagattccccggctgcatgaaaggtcgcacc
atgtatgtcattccttttagcatgggtccagtgggctcacctctctccaaaatcggaatc
gagatcacagactcaccatacgtcgtcgagtccatgaagatcatgactagggcgggcaat
ccagtgcttaattatctgcaatctggggatggtcagtttgtcaagtgcctgcattccgtg
ggtacgcccaaaagtggtgtccaggcaatgccatcctggccctgcgatcccgaacgcact
attgtgctgcacaagccagcagaaaatgagattgtatcttatggatctgggtatggtggt
aactccctgctgggcaagaagtgcctcgctctgaggattggcagcaccattgccaaacga
gagggctggctggccgagcacatgttgatactgggcatcaccaatccgcaaggtaagaag
atctacatagctgccgcctttccatcagcttgcggtaagaccaacctggcgatgatgact
cctaccctgcctggctacaaagtggagtgcgtgggcgatgacatcgcctggatgaagttc
gataacaagggtgtgctgcgagcgattaatccggagaatggattctttggcgtggcgccc
ggaacgtcgagggccaccaatcccatagccatggatacgatcttccgaaactctgtcttt
acgaacgtggcctctacatccgatggaggtgtctactgggagggaatggaaaaggatcag
ctgaagggggtgactgtcacggactggttgggtaaactctggtcccaggaatccggaaag
ccagctgcccatcccaactccaggttctgtacacccgcctctcagtgtcccattattgat
cccgcctgggaggatagcgaaggagtgcccatctccgcaattcttttcggaggtcgtcgt
cccagtggagttcccttggtttacgaggctcgagactggaagcacggcgtatttattgga
gctgctatgaggagcgaggccacggcagccgctgagttcaagggcaaggtcatcatgcac
gatcccttcgccatgagaccctttttcggctacaacttcggcgactatctgggtcactgg
ctaagcatggagcagcgtggccaggtgcccaagatctttcacgtaaattggttccgaaag
agcagtgagggcaagttcctttggcccggattcggggagaactcacgagtcctggactgg
atcttccggcgggtggagggcgagcagtgcttcgaggactctcccattggccgcctgccc
agcaagaattcattgaacttggatagtttggaaaacattgatctcgaccagcttttcgat
ctgccaaaagatttctgggagcaggaggtggctgccatagagaggtacttcgaggagcag
gtgggccaccatctgccaggtgccgtggccgaggagctgagggagctgaaggcgcgtgtt
gctgacatgtga
MLKKGTIIPLPKYENCWLARTNPADVARVEGKTFISTDSKEQTVPVTEKATPGMLGNWIA
EKDMQAAIKERFPGCMKGRTMYVIPFSMGPVGSPLSKIGIEITDSPYVVESMKIMTRAGN
PVLNYLQSGDGQFVKCLHSVGTPKSGVQAMPSWPCDPERTIVLHKPAENEIVSYGSGYGG
NSLLGKKCLALRIGSTIAKREGWLAEHMLILGITNPQGKKIYIAAAFPSACGKTNLAMMT
PTLPGYKVECVGDDIAWMKFDNKGVLRAINPENGFFGVAPGTSRATNPIAMDTIFRNSVF
TNVASTSDGGVYWEGMEKDQLKGVTVTDWLGKLWSQESGKPAAHPNSRFCTPASQCPIID
PAWEDSEGVPISAILFGGRRPSGVPLVYEARDWKHGVFIGAAMRSEATAAAEFKGKVIMH
DPFAMRPFFGYNFGDYLGHWLSMEQRGQVPKIFHVNWFRKSSEGKFLWPGFGENSRVLDW
IFRRVEGEQCFEDSPIGRLPSKNSLNLDSLENIDLDQLFDLPKDFWEQEVAAIERYFEEQ
VGHHLPGAVAEELRELKARVADM

#### 2.3.1.12
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: DLAT
atgtggcgcgtctgtgcgcgacgggctcagaatgtagccccatgggcgggactcgaggct
cggtggacggccttgcaggaggtacccggaactccacgagtgacctcgcgatctggcccg
gctcccgctcgtcgcaacagcgtgactacagggtatggcggggtccgggcactgtgcggc
tggacccccagttctggggccacgccgcggaaccgcttactgctgcagcttttggggtcg
cccggccgccgctattacagtcttcccccgcatcagaaggttccattgccttctctttcc
cccacaatgcaggcaggcaccatagcccgttgggaaaaaaaagagggggacaaaatcaat
gaaggtgacctaattgcagaggttgaaactgataaagccactgttggatttgagagcctg
gaggagtgttatatggcaaagatacttgttgctgaaggtaccagggatgttcccatcgga
gcgatcatctgtatcacagttggcaagcctgaggatattgaggcctttaaaaattataca
ctggattcctcagcagcacctaccccacaagcggccccagcaccaacccctgctgccact
gcttcgccacctacaccttctgctcaggctcctggtagctcatatccccctcacatgcag
gtacttcttcctgccctctctcccaccatgaccatgggcacagttcagagatgggaaaaa
aaagtgggtgagaagctaagtgaaggagacttactggcagagatagaaactgacaaagcc
actataggttttgaagtacaggaagaaggttatctggcaaaaatcctggtccctgaaggc
acaagagatgtccctctaggaaccccactctgtatcattgtagaaaaagaggcagatata
tcagcatttgctgactataggccaaccgaagtaacagatttaaaaccacaagtgccacca
cctaccccacccccggtggccgctgttcctccaactccccagcctttagctcctacacct
tcagcaccctgcccagctactcctgctggaccaaagggaagggtgtttgttagccctctt
gcaaagaagttggcagtagagaaagggattgatcttacacaagtaaaagggacaggacca
gatggtagaatcaccaagaaggatatcgactcttttgtgcctagtaaagttgctcctgct
ccggcagctgttgtgcctcccacaggtcctggaatggcaccagttcctacaggtgtcttc
acagatatcccaatcagcaacattcgtcgggttattgcacagcgattaatgcaatcaaag
caaaccatacctcattattacctttctatcgatgtaaatatgggagaagttttgttggta
cggaaagaacttaataagatattagaagggagaagcaaaatttctgtcaatgacttcatc
ataaaagcttcagctttggcatgtttaaaagttcccgaagcaaattcttcttggatggac
acagttataagacaaaatcatgttgttgatgtcagtgttgcggtcagtactcctgcagga
ctcatcacacctattgtgtttaatgcacatataaaaggagtggaaaccattgctaatgat
gttgtttctttagcaaccaaagcaagagagggtaaactacagccacatgaattccagggt
ggcacttttacgatctccaatttaggaatgtttggaattaagaatttctctgctattatt
aacccacctcaagcatgtattttggcaattggtgcttcagaggataaactggtccctgca
gataatgaaaaagggtttgatgtggctagcatgatgtctgttacactcagttgtgatcac
cgggtggtggatggagcagttggagcccagtggcttgctgagtttagaaagtaccttgaa
aaacctatcactatgttgttgtaa
MWRVCARRAQNVAPWAGLEARWTALQEVPGTPRVTSRSGPAPARRNSVTTGYGGVRALCG
WTPSSGATPRNRLLLQLLGSPGRRYYSLPPHQKVPLPSLSPTMQAGTIARWEKKEGDKIN
EGDLIAEVETDKATVGFESLEECYMAKILVAEGTRDVPIGAIICITVGKPEDIEAFKNYT
LDSSAAPTPQAAPAPTPAATASPPTPSAQAPGSSYPPHMQVLLPALSPTMTMGTVQRWEK
KVGEKLSEGDLLAEIETDKATIGFEVQEEGYLAKILVPEGTRDVPLGTPLCIIVEKEADI
SAFADYRPTEVTDLKPQVPPPTPPPVAAVPPTPQPLAPTPSAPCPATPAGPKGRVFVSPL
AKKLAVEKGIDLTQVKGTGPDGRITKKDIDSFVPSKVAPAPAAVVPPTGPGMAPVPTGVF
TDIPISNIRRVIAQRLMQSKQTIPHYYLSIDVNMGEVLLVRKELNKILEGRSKISVNDFI
IKASALACLKVPEANSSWMDTVIRQNHVVDVSVAVSTPAGLITPIVFNAHIKGVETIAND
VVSLATKAREGKLQPHEFQGGTFTISNLGMFGIKNFSAIINPPQACILAIGASEDKLVPA
DNEKGFDVASMMSVTLSCDHRVVDGAVGAQWLAEFRKYLEKPITMLL
     source          1..2399
     CDS             <49..1992

MOUSE: Dlat
atgtggcgcgtctgtgcgcggagggcgcggagtgctgtgcccagggatgggttcagggct
cggtgggcggccttgaaggaaggccccggggccccatgcgggagcccgcggattggcccc
gctgcggtccgttgcggtagtgggatcccccgctatggggtccgctccttgtgcggctgg
agctccggctccggcactgtcccgcgtaaccgcttgctgcgacaactcctggggtcgccc
agccgccgctcttacagcctccctccgcatcagaaggttccattaccttccctttcccct
acaatgcaggcaggcaccatagcccgctgggaaaaaaaagaaggggaaaaaatcagtgag
ggtgatctaattgcagaggttgaaactgataaagccactgttgggtttgagagcctggag
gagtgctatatggccaagatccttgttcctgaagggaccagagatgttccagttgggtcc
atcatctgtatcacagttgaaaagcctcaggatattgaggcctttaaaaattatacattg
gatttggcggcggcagctgccccacaggcagccccagctgcagccccagctccagctgct
gccccagcggcaccttctgcaagcgctcccggtagctcctatcctactcatatgcagatt
gttcttcctgccctctccccaaccatgaccatgggcacggtccagaggtgggaaaagaaa
gtgggcgagaagctgagtgaaggagacttgctggcagagatagagaccgacaaggccacc
ataggctttgaagtacaagaagaaggttatctggcaaaaatcctggtccctgaaggcaca
agggatgttcctctgggagctccactatgtatcatagtagaaaaacaggaagatatagca
gcatttgcagactacaggccaacagaagtgaccagcttaaagccacaggcagcaccacct
gccccacccccggtggcagctgttcctcccactccccagcctgtagcacctaccccctca
gctgctcctgctggaccaaagggaagggtgttcgttagtcctcttgcgaagaagttggca
gcagagaaagggattgacctcacccaagttaaagggacgggaccagaaggcagaatcatc
aagaaggacattgactcttttgtgccttctaaggctgctcctgctgcagcagctgccatg
gctcccccgggtccaagagtggcaccagctcctgcaggtgtcttcacagacatccccatc
agcaacattcgtcgagtgattgcgcagaggctcatgcagtcgaagcagactatacctcat
tattacctttctgtcgatgtaaatatgggagaggtgctgttggtacggaaggaacttaat
aagatgcttgaagggaaagggaaaatctccgtcaacgacttcattataaaggcttcagct
ttggcctgtctgaaagttcccgaagcaaactcgtcttggatggacacagttataaggcaa
aatcatgtggttgacgtcagtgttgctgtcagtacccctgcaggacttatcacccctatt
gtgtttaatgcacacataaaaggactggaaaccattgctagtgatgttgtttctttagcc
tccaaagcgagagagggtaaacttcagcctcatgagttccagggtggaacatttacaatc
tccaacttagggatgtttggaattaagaatttctctgcaattattaatccacctcaggca
tgtattctggcaatcggtgcttcagaggataaactgatcccagcagataatgagaaaggc
tttgatgtggctagtgtgatgtccgttacactcagctgtgatcatcgagttgtggatgga
gcagttggagcccagtggcttgctgaattcaaaaagtaccttgaaaagcctataactatg
ttgttataa
MWRVCARRARSAVPRDGFRARWAALKEGPGAPCGSPRIGPAAVRCGSGIPRYGVRSLCGW
SSGSGTVPRNRLLRQLLGSPSRRSYSLPPHQKVPLPSLSPTMQAGTIARWEKKEGEKISE
GDLIAEVETDKATVGFESLEECYMAKILVPEGTRDVPVGSIICITVEKPQDIEAFKNYTL
DLAAAAAPQAAPAAAPAPAAAPAAPSASAPGSSYPTHMQIVLPALSPTMTMGTVQRWEKK
VGEKLSEGDLLAEIETDKATIGFEVQEEGYLAKILVPEGTRDVPLGAPLCIIVEKQEDIA
AFADYRPTEVTSLKPQAAPPAPPPVAAVPPTPQPVAPTPSAAPAGPKGRVFVSPLAKKLA
AEKGIDLTQVKGTGPEGRIIKKDIDSFVPSKAAPAAAAAMAPPGPRVAPAPAGVFTDIPI
SNIRRVIAQRLMQSKQTIPHYYLSVDVNMGEVLLVRKELNKMLEGKGKISVNDFIIKASA
LACLKVPEANSSWMDTVIRQNHVVDVSVAVSTPAGLITPIVFNAHIKGLETIASDVVSLA
SKAREGKLQPHEFQGGTFTISNLGMFGIKNFSAIINPPQACILAIGASEDKLIPADNEKG
FDVASVMSVTLSCDHRVVDGAVGAQWLAEFKKYLEKPITMLL
     source          1..4034
     CDS             316..2244
     regulatory      4006..4011
     polyA_site      4034

DROME: muc
atgctgcgctcccttgcaacaacacgaaacgaacttggggcccttcgctccgtgctcctg
cgatcgaataacgccacctatgtccgccgatcgacgggaaatgtggttgtgcgcgccctc
agcagccagctgatcaactcccggaaactccagagcatcaggtcgaaacttaacactagc
cagtcaccggtcacatggagctacaacttcgcccgtgcctatgccaaccttccggaacac
atcagggtgccactgcccgcactttccccgactatggagcgcggatcgattgtcagctgg
gagaagaaggagggcgataagctcaacgaaggtgacttgctgtgcgagattgagacggat
aaggccaccatgggctttgagacgcccgaggagggctttctggctaagattctcatccag
ggcggcaccaaggacgttcccgttggccagctgctgtgcattatcgtgccggaccaaggc
agcgtagctgctttcgcgaacttcaaggacgacggtgccgccgcagcaccagctgctccg
gcagcagctccagctccagcaccggcagcagcagcagctccgccaccaccaccaccaccc
gccgcagctccagcagccgctgcgcctccaccagctcccgccgctgctccagctgcagca
ggccagaaagcagcagccaagccagctgctgcggcacctgccaaggcccccagggcagct
ggagcgcgctacgaggacattccggtgaccaacatgcgcgcagtgattgccaaacgtctg
ctggagtccaagacacaactgcctcactactacgtcaccgtgcaatgccaagtggataag
ctgctgaagttccgcgcgaaggtgaacaagaagtacgagaagcagggtgcccgcgtctct
gtaaacgacttcattatcaaggccgtggccattgccagtcttaaggttcccgaagcgaac
tccgcctggatggacacagtaattcgcaagtacgacgacgtcgatgtttcggttgctgtc
tccacagacaagggtctgattaccccgattgttttcaatgccgaccgcaagggtgtcctg
gagatctctaaggatgtcaaggcgctggcagccaaggcgcgcgacaacaaacttcagccc
cacgaattccagggtggcaccatctcggtttctaatctgggcatgttcggtgtgaaccag
tttgccgctgtcatcaaccctcctcaatcgtgcatccttgccattggcaccacaacgaaa
cagttggttgctgatcccgacagtctcaagggcttcaaggaggtcaacatgctgacggtc
accctgagtgctgatcatcgtgttgtggatggtgctgttgctgccaggtggctgcagcac
ttccgcgactacatggaggatccttccaatatggtattgtaa
MLRSLATTRNELGALRSVLLRSNNATYVRRSTGNVVVRALSSQLINSRKLQSIRSKLNTS
QSPVTWSYNFARAYANLPEHIRVPLPALSPTMERGSIVSWEKKEGDKLNEGDLLCEIETD
KATMGFETPEEGFLAKILIQGGTKDVPVGQLLCIIVPDQGSVAAFANFKDDGAAAAPAAP
AAAPAPAPAAAAAPPPPPPPAAAPAAAAPPPAPAAAPAAAGQKAAAKPAAAAPAKAPRAA
GARYEDIPVTNMRAVIAKRLLESKTQLPHYYVTVQCQVDKLLKFRAKVNKKYEKQGARVS
VNDFIIKAVAIASLKVPEANSAWMDTVIRKYDDVDVSVAVSTDKGLITPIVFNADRKGVL
EISKDVKALAAKARDNKLQPHEFQGGTISVSNLGMFGVNQFAAVINPPQSCILAIGTTTK
QLVADPDSLKGFKEVNMLTVTLSADHRVVDGAVAARWLQHFRDYMEDPSNMVL

#### 1.1.1.37
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: MDH1
atgtctgaaccaatcagagtccttgtgactggagcagctggtcaaattgcatattcactg
ctgtacagtattggaaatggatctgtctttggtaaagatcagcctataattcttgtgctg
ttggatatcacccccatgatgggtgtcctggacggtgtcctaatggaactgcaagactgt
gcccttcccctcctgaaagatgtcatcgcaacagataaagaagacgttgccttcaaagac
ctggatgtggccattcttgtgggctccatgccaagaagggaaggcatggagagaaaagat
ttactgaaagcaaatgtgaaaatcttcaaatcccagggtgcagccttagataaatacgcc
aagaagtcagttaaggttattgttgtgggtaatccagccaataccaactgcctgactgct
tccaagtcagctccatccatccccaaggagaacttcagttgcttgactcgtttggatcac
aaccgagctaaagctcaaattgctcttaaacttggtgtgactgctaatgatgtaaagaat
gtcattatctggggaaaccattcctcgactcagtatccagatgtcaaccatgccaaggtg
aaattgcaaggaaaggaagttggtgtttatgaagctctgaaagatgacagctggctcaag
ggagaatttgtcacgactgtgcagcagcgtggcgctgctgtcatcaaggctcgaaaacta
tccagtgccatgtctgctgcaaaagccatctgtgaccacgtcagggacatctggtttgga
accccagagggagagtttgtgtccatgggtgttatctctgatggcaactcctatggtgtt
cctgatgatctgctctactcattccctgttgtaatcaagaataagacctggaagtttgtt
gaaggtctccctattaatgatttctcacgtgagaagatggatcttactgcaaaggaactg
acagaagaaaaagaaagtgcttttgaatttctttcctctgcctga
MSEPIRVLVTGAAGQIAYSLLYSIGNGSVFGKDQPIILVLLDITPMMGVLDGVLMELQDC
ALPLLKDVIATDKEDVAFKDLDVAILVGSMPRREGMERKDLLKANVKIFKSQGAALDKYA
KKSVKVIVVGNPANTNCLTASKSAPSIPKENFSCLTRLDHNRAKAQIALKLGVTANDVKN
VIIWGNHSSTQYPDVNHAKVKLQGKEVGVYEALKDDSWLKGEFVTTVQQRGAAVIKARKL
SSAMSAAKAICDHVRDIWFGTPEGEFVSMGVISDGNSYGVPDDLLYSFPVVIKNKTWKFV
EGLPINDFSREKMDLTAKELTEEKESAFEFLSSA
     source          1..1267
     CDS             56..1060
     regulatory      1248..1253

MOUSE: Mdh2
atgctgtccgctctcgcccgtcctgccggcgccgctctccgccgcagcttcagcacttcg
gcccagaacaatgctaaagtggctgtcctgggagcttctgggggcattgggcaacccctt
tcactcctgctgaagaacagccccctagtgagccgcctgaccctctacgatatcgctcac
acacctggtgtggcagcagatctgagtcacattgagaccagagcaaatgtgaaaggctac
cttggaccggagcagttgccagattgcctcaaaggttgtgatgtggtggtcatcccagcc
ggagtgcccaggaaaccaggaatgacacgggatgacctgttcaacaccaacgctaccatt
gtggccaccctgacggctgcctgtgcccagcactgtcctgaagccatggtttgcatcatt
gccaacccagtgaactccaccatccccatcacagcagaagttttcaagaagcacggtgtg
tacaaccctaacaagatcttcggtgtgacaacccttgacatcgtcagagcgaacacgttt
gtggcagagctaaagggtttggatccagctcgagtcaacgtgcctgtcattggcggccac
gccgggaagacgatcatccccctgatctctcagtgtaccccgaaggttgactttccccaa
gaccagctggccacactcaccgggaggatccaggaggctggcacagaagtcgtgaaggcc
aaggctggagcaggttctgccactctgtccatggcttatgctggagcccgctttgtcttc
tccctcgtggacgccatgaacgggaaggaaggagtcgttgagtgttcttttgttcagtcc
aaagagacggaatgcacttacttctctacgcccttgctcttggggaaaaagggcctggag
aagaacctgggcattggcaagatcactccttttgaggaaaaaatgattgccgaggctatc
cctgagctgaaagcctccatcaagaaaggcgaggactttgtcaagaacatgaagtga
MLSALARPAGAALRRSFSTSAQNNAKVAVLGASGGIGQPLSLLLKNSPLVSRLTLYDIAH
TPGVAADLSHIETRANVKGYLGPEQLPDCLKGCDVVVIPAGVPRKPGMTRDDLFNTNATI
VATLTAACAQHCPEAMVCIIANPVNSTIPITAEVFKKHGVYNPNKIFGVTTLDIVRANTF
VAELKGLDPARVNVPVIGGHAGKTIIPLISQCTPKVDFPQDQLATLTGRIQEAGTEVVKA
KAGAGSATLSMAYAGARFVFSLVDAMNGKEGVVECSFVQSKETECTYFSTPLLLGKKGLE
KNLGIGKITPFEEKMIAEAIPELKASIKKGEDFVKNMK
     source          1..1244
     mRNA            <1..1244
     CDS             47..1063

DROME: CG10748
MLLLTSLKSLAKPATWGVVVRTLKVAVVGAGGGIGQPLSLLLRRCPGIDELALHDLSEMK
GIATDLSHISQTGKVIGFTGEKELESAVSGADVVVVAAGMPRLPGMQRDHLMAANGNVAV
KVATAISNASPRAHLAFITNPVNMIVPAAAEVLMAHGTFDSRRLFGITTLDVVRSKKFIG
DSMNISPDDVNIPVIGGHAGITILPLISQCQPIYRCDLQEIQNLTHRIQEAGTEVVNAKA
GKGSATLSMAYAGATFVNSLLRGIAGQDGLIECAFVASKLTDAPFFASPLELGKDGIKRY
IPLPQMSDYEKEALEKLLPILRQNADEGVNFAKMILSGQSHSPIPAALP
atgttgttactgacaagtcttaaaagcctggcaaaaccagctacatggggagttgtggtc
cgcactttaaaggtcgccgttgtcggtgccggaggaggaattggacaaccgctatcgctt
ctgctccgtcgctgtcctggaatcgatgagctggctctacatgatctcagcgaaatgaag
ggaattgctacggatctatcccatataagccaaacgggaaaggtgataggttttaccggt
gaaaaggaactggagtcggcggtgagtggagctgatgtggtggttgtggcggcagggatg
ccacgtctgccaggaatgcaaagggatcacctgatggccgccaatggaaatgttgcagtg
aaagttgccactgccattagcaatgcctctccacgagctcatcttgcctttattaccaat
ccggtcaatatgattgtgcccgccgcagctgaggttcttatggcccatggaacttttgat
tctcgtcggctcttcggtattacgactttggatgtggtgcgatcgaaaaagttcattggt
gattctatgaacatatcaccggatgacgtaaacattccagttattggtggccatgcgggg
attacaattctaccgctcatttcgcagtgtcagccgatatatagatgtgatctccaggag
atccagaatctaactcatcgcattcaggaggcgggcacagaggtggtgaatgccaaagct
ggaaaaggatctgccaccctatcgatggcttatgctggcgcaactttcgtgaactccctg
ctgcgtggaattgctggacaggatggtctaatcgagtgcgcttttgtcgcctccaaacta
accgacgccccattctttgctagtccattggaattgggaaaggatggtatcaagcgctat
ataccacttccccagatgagtgactacgaaaaggaggctttggaaaagctactacctatt
ctacgacagaatgctgatgagggtgtcaattttgcaaaaatgattttgagtggacaatca
cattctcccattccagcggccttgccgtaa

#### 4.2.1.2
ANIMAL: GeneName
DNASeq
ProteinSeq
SequenceInfo

HUMAN: FH
atgtaccgagcacttcggctcctcgcgcgctcgcgtcccctcgtgcgggctccagccgca
gccttagcttcggctcccggcttgggtggcgcggccgtgccctcgttttggcctccgaac
gcggctcgaatggcaagccaaaattccttccggatagaatatgatacctttggtgaacta
aaggtgccaaatgataagtattatggcgcccagaccgtgagatctacgatgaactttaag
attggaggtgtgacagaacgcatgccaaccccagttattaaagcttttggcatcttgaag
cgagcggccgctgaagtaaaccaggattatggtcttgatccaaagattgctaatgcaata
atgaaggcagcagatgaggtagctgaaggtaaattaaatgatcattttcctctcgtggta
tggcagactggatcaggaactcagacaaatatgaatgtaaatgaagtcattagcaataga
gcaattgaaatgttaggaggtgaacttggcagcaagatacctgtgcatcccaacgatcat
gttaataaaagccagagctcaaatgatacttttcccacagcaatgcacattgctgctgca
atagaagttcatgaagtactgttaccaggactacagaagttacatgatgctcttgatgca
aaatccaaagagtttgcacagatcatcaagattggacgtactcatactcaggatgctgtt
ccacttactcttgggcaggaatttagtggttatgttcaacaagtaaaatatgcaatgaca
agaataaaagctgccatgccaagaatctatgagctcgcagctggaggcactgctgttggt
acaggtttaaatactagaattggctttgcagaaaaggttgctgcaaaagtggctgcactt
acaggcttgccttttgtcactgctccgaataaatttgaagctctggctgctcatgacgct
ctggttgagctcagtggagccatgaacactactgcctgcagtctgatgaagatagcaaat
gatattcgatttttgggttctggtcctcggtcaggtctgggagaattgatcttgcctgaa
aatgaaccaggaagcagtatcatgccaggcaaggtgaaccctactcagtgtgaagcaatg
accatggttgcagcccaagtcatggggaaccatgttgctgtcactgtcggaggcagcaat
ggacattttgagttgaatgttttcaagccaatgatgattaaaaatgtgttacactcagcc
aggctgctgggggatgcttcagtttcctttacagaaaactgcgtggtgggaatccaggcc
aatacagaaaggatcaacaagctgatgaatgagtctctaatgttggtgacagctctcaat
cctcatatagggtatgacaaggcagcaaagattgctaagacagcacacaaaaatggatca
accttaaaggaaactgctatcgaacttggctatctcacagcagagcagtttgacgaatgg
gtaaaacctaaggacatgctgggtccaaagtga
MYRALRLLARSRPLVRAPAAALASAPGLGGAAVPSFWPPNAARMASQNSFRIEYDTFGEL
KVPNDKYYGAQTVRSTMNFKIGGVTERMPTPVIKAFGILKRAAAEVNQDYGLDPKIANAI
MKAADEVAEGKLNDHFPLVVWQTGSGTQTNMNVNEVISNRAIEMLGGELGSKIPVHPNDH
VNKSQSSNDTFPTAMHIAAAIEVHEVLLPGLQKLHDALDAKSKEFAQIIKIGRTHTQDAV
PLTLGQEFSGYVQQVKYAMTRIKAAMPRIYELAAGGTAVGTGLNTRIGFAEKVAAKVAAL
TGLPFVTAPNKFEALAAHDALVELSGAMNTTACSLMKIANDIRFLGSGPRSGLGELILPE
NEPGSSIMPGKVNPTQCEAMTMVAAQVMGNHVAVTVGGSNGHFELNVFKPMMIKNVLHSA
RLLGDASVSFTENCVVGIQANTERINKLMNESLMLVTALNPHIGYDKAAKIAKTAHKNGS
TLKETAIELGYLTAEQFDEWVKPKDMLGPK
     source          1..1792
     gene            1..1792
     5'UTR           1..33
     CDS             34..1566
     sig_peptide     34..162
     mat_peptide     163..1563
     3'UTR           1567..1792
     regulatory      1768..1773

MOUSE: Fh1
MYRALRLLARSRRLLRVPSAGAAVSGEATTLPRCAPNVARMASQNSFRVEFDTFGELKVP
TDKYYGAQTVRSTMNFKIGGATERMPIPVIQAFGILKRAAAEVNQEYGLDPKIASAIMKA
ADEVAEGKLNDHFPLVVWQTGSGTQTNMNVNEVISNRAIEMLGGELGSKKPVHPNDHVNK
SQSSNDTFPTAMHIAAAVEVHKVLLPGLQKLHDALSAKSKEFAQVIKIGRTHTQDAVPLT
LGQEFSGYVQQVQYAMVRIKAAMPRIYELAAGGTAVGTGLNTRIGFAEKVAAKVAALTGL
PFVTAPNKFEALAAHDALVELSGAMNTAACSLMKIANDIRFLGSGPRSGLGELILPENEP
GSSIMPGKVNPTQCEAMTMVAAQVMGNHVAVTVGGSNGHFELNVFKPMMIKNVLHSARLL
GDASVSFTDNCVVGIQANTERINKLMNESLMLVTALNPHIGYDKAAKIAKTAHKNGSTLK
ETAIELGYLTAEQFDEWVKPKDMLGPK
atgtaccgcgcactccgtctcctcgcgcgctcgcgtcgcctcctgcgggttccgtccgcc
ggtgctgcagtgtctggggaagcgaccaccctcccgcggtgtgctccgaacgtcgcgcga
atggcaagccaaaattccttccgtgtagagttcgacacctttggtgaattgaaggttcca
accgataagtattatggtgctcagaccgtaagatctacgatgaactttaagattggaggt
gctacggaacgtatgccaatcccagtcattcaagctttcggcatcttgaagcgagctgct
gctgaagtaaaccaggagtatggtctcgatccaaagattgctagtgcaataatgaaggcc
gcagatgaggtagctgaaggtaaattaaatgatcactttcctctggtggtttggcagact
ggatcaggaacccagacaaacatgaatgtaaatgaagtcattagcaacagagcaattgaa
atgttaggaggtgaacttggcagcaagaagcctgtgcaccccaatgatcatgttaacaaa
agccagagctcgaatgacacctttcccacagcaatgcatattgctgctgcagtggaagtt
cacaaggtcctgttgccagggttacagaagctccatgatgctctcagtgcaaaatccaaa
gagtttgcgcaggtcatcaaaattgggcgaactcacacgcaggatgctgtccctcttact
cttggacaggaattcagtggttacgttcagcaagtccagtatgcgatggtgagaataaaa
gccgccatgccaagaatctacgagctcgctgctggaggcactgctgtggggacggggtta
aacaccaggatcggtttcgcagaaaaggtggccgcaaaagtagcagcactcacaggtttg
ccttttgtcactgccccgaataagtttgaagctctggctgctcatgatgctctggttgag
cttagtggagccatgaacactgccgcctgcagtctaatgaagatagcgaatgatattcgc
ttcctgggttctggtcctcggtcaggtttgggagagctgatcttgcctgaaaacgagcca
gggagcagcatcatgccaggaaaggtgaaccctactcagtgtgaagcgatgaccatggtt
gcagcccaagtcatggggaatcacgttgctgttaccgttggaggcagcaatggacatttt
gaactgaatgtgtttaaaccaatgatgattaagaatgtgctgcactcagccaggctactg
ggagatgcttcagtgtccttcacagacaactgtgtggtcgggatccaggccaacacagag
cggatcaacaagctaatgaatgagtctttaatgttggtcacagctcttaatccacatata
gggtatgacaaagcagcaaagattgccaagaccgcacacaagaacggatcaaccttaaag
gaaacggctattgaacttggctatctcacagcagagcagtttgatgagtgggtgaaaccc
aaggatatgctgggtccaaagtga
     source          1..1620
     CDS             57..1580
     regulatory      1601..1606
     polyA_site      1620

DROME: Fum4
MSFDQKEIFSLMYKLARLIVPDTRVEYDSMGAVHIPLDRMFGPQTMRSLMKFPIGGVEER
MPRPLIKALGIVKKSAAETNKIHCLEEHLCDAISKACDDVISGKLYDEEHFPLVIWQDGS
GEHTNMNVNEVICNRAIEILGGQMGSKEPVDPNEHVNMAQSSHDTFSTAVRIAVAMQLQE
TLYPSLRTFIDLLGKKSNDWMDLIKIGRTHLMDAVPLSLGQEFSGYQQQLVNGRTRLDCA
MCRLYQLPMGGTSVGTKVDTKAEYSAQCIKRIAELTFLPFVESPNFFESISACDCLVELH
GELNTIAASVMKIANDIRFLGSGPRCGFGELHLPENEPGSSIMPGKVNPTQCEAMSMICA
QVMGNHVAVSMGGSSGHFQLNTFMPMIASNVLRSITLLGDGMKSFCTNCLEGIEPNRSKI
GSIVKESLMLVTALSPHIGYERSAAIAKAAHHNGTTLEQEAILDGIQREDFREWVQPSKM
LGPE
atgtctttcgatcagaaggagattttcagtttgatgtacaaactggctcggctaatagtg
ccggatactcgagttgaatatgattcgatgggtgccgtgcacattcctctcgatcgaatg
ttcggtccgcaaaccatgagatccctgatgaaatttccaattggcggagttgaggaacga
atgccacgacccctaataaaagccctgggcatagtgaagaaatcagctgcggagacgaac
aaaatccattgtctggaggagcatctatgcgatgccatttccaaggcctgcgatgatgtt
atatcgggcaaactctatgacgaggaacactttccgttggttatatggcaggatggaagc
ggcgagcacacaaacatgaacgtaaacgaggttatatgcaatcgagccatcgaaattctg
ggcggtcagatgggctccaaggagccggtggatcccaatgaacatgtcaacatggcgcaa
agttcccatgacaccttctcgacagccgtgcgcatcgccgtggccatgcagttgcaggag
acgctgtatcccagcttaaggacctttattgatttgctgggcaagaagtcgaacgattgg
atggatttgatcaagattggtagaacgcatctgatggacgcagttcctctgtccctcggc
caggagttcagtggctatcagcagcaacttgtgaacggaaggacgcgattggactgtgcc
atgtgccgattgtatcagttgcccatgggcggcaccagtgtgggcaccaaagtggacacc
aaggcggaatattctgcgcagtgcatcaagcgtatagccgagctaacattcctacccttt
gtcgagtccccgaacttttttgaatccatctccgcctgcgattgcctggtggaactgcac
ggtgaactcaacacgattgcagcgagtgtgatgaagatagcgaatgatatacgattcctt
ggatcgggaccacgttgcggatttggtgaactacatctgccggagaacgaaccaggtagt
tccataatgcccggcaaagtgaatcccacgcaatgcgaggccatgtccatgatctgtgcc
caggtgatgggcaaccatgtggccgtctccatgggtggttcctctggccactttcagctg
aacacctttatgcccatgattgcctccaatgttttgcgctcgattacacttttgggcgat
ggcatgaagtccttttgcaccaattgcctcgagggcatcgagcccaataggagcaagatt
ggtagcatcgtcaaggagtccctgatgctggtcactgccctcagtccacacattggctac
gaacgatccgctgcgatcgccaaggcagcgcatcacaatggaaccactttggaacaggag
gccatacttgatggcattcaacgggaggacttcagggagtgggtgcagcccagcaagatg
ctgggtcccgaatag
     source          1..1642
     gene            1..1642
     misc_feature    1..1623
     CDS             73..1527

# Code for How I would construct the Database

### Inserting into a normal table (genes, pathways, enzymes)

INSERT INTO table_name (column1, column2, column3, ...)
VALUES (value1, value2, value3, ...);

- Do not specify the primary key. That will be taken care of. Fill in only the columns of which data we have.

### Inserting into a connection table

INSERT INTO connection_table (table1, table2) SELECT t1.id, t2.id FROM    table2 t2 LEFT JOIN table1 t1 ON t1._valueOnWhichTheyConnectInT1_ = somevalue AND t2._valueOnWhichTheyConnectInT2_ = somevalue;
                
INNER JOIN table2 t2 ON t1._valueOnWhichTheyConnectInT1_ = t2._valueOnWhichTheyConnectInT2_


Simply insert the data I collected above into these statements to create the database.




## Code for more data extraction

In [67]:
# This is the code that I used to extract all the organisms in UNIPROT with this exact enzyme number.

current_item = '3.1.1.31'

text = ""
with open(current_item + '.txt') as f:
    for line in f.readlines():
        line_split = line.split(";")
        for s in line_split:
            if len(s) > 8:
                text += s[-5:] + ", "
print(text)

ARATH, ORYSI, ORYSJ, ARATH, ORYSI, ORYSJ, ARATH, ORYSI, ORYSJ, ARATH, ORYSI, ORYSJ, ARATH, AGGAC, ARTBC, BACSU, BLOFL, BLOPB, BORBU, BOVIN, BUCA5, BUCAI, BUCAP, BUCAT, BUCBP, CAEEL, CAUVC, CHLMU, CHLPN, CHLTR, CITK8, CROS8, DICDI, DROME, ECO24, ECO27, ECO45, ECO55, ECO57, ECO5E, ECO7I, ECO81, ECO8A, ECOBW, ECODH, ECOHS, ECOK1, ECOL5, ECOL6, ECOLC, ECOLI, ECOLU, ECOSE, ECOSM, ECOUT, ENT38, ERWT9, ESCF3, HAEIN, HELPJ, HELPY, HUMAN, KLEP3, KLEP7, MOUSE, MYCBO, MYCLE, MYCTO, MYCTU, NEIMA, NEIMB, NOSS1, PECAS, PECCP, PHOLL, PSEAE, PSEPU, L_RAT, RHILO, RHIME, SALA4, SALAR, SALCH, SALDC, SALEP, SALG2, SALHS, SALNS, SALPA, SALPB, SALPC, SALPK, SALSV, SALTI, SALTY, SCHPO, SERP5, SHIB3, SHIBS, SHIDS, SHIF8, SHIFL, SHISS, SODGM, STRCO, SYNY3, THEMA, TREPA, XENNA, XYLFA, XYLFT, YERE8, YERP3, YERPA, YERPB, YERPE, YERPN, YERPP, YERPS, YERPY, HUMAN, MOUSE, RABIT, PLAF7, YEAS1, YEAS6, YEAS7, YEAST, YEAST, 


## Other code that I tested

In [None]:
# I was testing some database connections

Entrez.email = "ngopaul@berkeley.edu"
handle = Entrez.efetch(db="genome", id="algC", rettype="gb", retmode="text")
print(handle.readline().strip())
handle = Entrez.efetch(db="genome", id="2.7.1.199", rettype=None, retmode="text")
print(handle.readline().strip())


In [36]:
# I was testing some database reading

import csv
with open('uniprot_sprot.dat') as f:
    reader = csv.reader(f, delimiter="\t")
    max_count = 5000
    
    general_count = 0
    count = 0
    for line in reader:
#         if general_count == max_count:
#             break
        current_id = line[0][:2]
        current_line = line[0][5:]
#         print(current_id, current_line)
        if current_id == "ID" and current_line == "ALGC_PSEAB":
            count = 100
        if count > 0:
            print(current_id, current_line)
            count -= 1
            if count == 0:
                break
        else:
            general_count += 1
            continue