## section 1:

In [1]:
import pyopenms

## 1) constant

In [2]:
help(pyopenms.Constants)

Help on module pyopenms.Constants in pyopenms:

NAME
    pyopenms.Constants

DESCRIPTION
    # @brief Mathematical and physical constants namespace.
    # 
    # This namespace contains definitions for some basic mathematical and physical constants.
    # All constants are double precision.

DATA
    AVOGADRO = 6.0221367e+23
    BOHR_RADIUS = 5.29177249e-11
    BOLTZMANN = 1.380657e-23
    C13C12_MASSDIFF_U = 1.0033548378
    CAL_PER_JOULE = 0.2390057361376673
    DEG_PER_RAD = 57.29577951308232
    E = 2.718281828459045
    ELECTRON_MASS = 9.1093897e-31
    ELECTRON_MASS_U = 0.0005485799042984105
    ELEMENTARY_CHARGE = 1.60217738e-19
    EPSILON = 1e-06
    F = 96485.31200007845
    FARADAY = 96485.31200007845
    FINE_STRUCTURE_CONSTANT = 0.00729735
    FRAGMENT_ANNOTATION_USERPARAM = 'fragment_annotation'
    GAS_CONSTANT = 8.314505189811898
    GRAVITATIONAL_CONSTANT = 6.67259e-11
    JOULE_PER_CAL = 4.184
    MM_PER_INCH = 25.4
    MOL = 6.0221367e+23
    M_PER_FOOT = 3.048
    N

## 2)Elements

In [3]:
from pyopenms import*

In [4]:
newEle=ElementDB()

In [7]:
newEle.hasElement("Ag")

True

In [8]:
sliver=newEle.getElement("Ag")


In [9]:
print(sliver.getName())
print(sliver.getSymbol())
print(sliver.getMonoWeight())
print(sliver.getAverageWeight())

Silver
Ag
106.905093
107.86815069743


In [10]:
print ("One mole of oxygen weighs", 2*sliver.getAverageWeight(), "grams")
print ("One mole of 16O2 weighs", 2*sliver.getMonoWeight(), "grams")

One mole of oxygen weighs 215.73630139486 grams
One mole of 16O2 weighs 213.810186 grams


## 3)isotops

In [11]:
sliver_Iso=sliver.getIsotopeDistribution()

In [24]:
sliver_Iso=sliver.getIsotopeDistribution()
for iso in sliver_Iso.getContainer():
    print ("sliver isotope", iso.getMZ(), "has abundance", iso.getIntensity()*100, "%")

sliver isotope 106.905093 has abundance 51.83899998664856 %
sliver isotope 108.904756 has abundance 48.16100001335144 %


## 4)Molecular formula:

In [28]:
water = EmpiricalFormula("H2O")
ethanol = EmpiricalFormula("CH2") + water
print("Ethanol chemical formula:", ethanol.toString())
print("Ethanol composition:", ethanol.getElementalComposition())
print("Ethanol has", ethanol.getElementalComposition()[b"H"], "hydrogen atoms")

Ethanol chemical formula: C1H4O1
Ethanol composition: {b'C': 1, b'H': 4, b'O': 1}
Ethanol has 4 hydrogen atoms


## 5) Isotopic Distributions

## 6) Amino acid:

In [33]:
val=ResidueDB().getResidue("Valine")

In [38]:
print(val.getName())
print(val.getThreeLetterCode())
print(val.getOneLetterCode())
print(val.getAverageWeight())
print(val.getMonoWeight())
print(val.getPka())
print(val.getFormula())


Valine
Val
V
117.14658151860637
117.0789793509
2.39
C5H11N1O2


## 7)Amino Acid Modifications

In [40]:
ox = ModificationsDB().getModification("Oxidation")


In [42]:
print(ox.getUniModAccession())
print(ox.getUniModRecordId())
print(ox.getDiffMonoMass())
print(ox.getFullId())
print(ox.getId())
print(ox.getName())
print(ox.getFullName())
print(ox.getDiffFormula())
print(ox.getFormula())

UniMod:35
35
15.994915
Oxidation (H)
Oxidation

Oxidation or Hydroxylation
O1



## 8)Ribonucleotides

In [49]:
cyt= RibonucleotideDB().getRibonucleotide(b"C")

In [50]:
print(cyt.getName())
print(cyt.getCode())
print(cyt.getAvgMass())
print(cyt.getMonoMass())
print(cyt.getFormula())
print(cyt.isModified())
methyladenosine = RibonucleotideDB().getRibonucleotide(b"m1A")
print(methyladenosine.getName())
print(methyladenosine.isModified())

cytidine
C
243.2197
243.0855
C9H13N3O5
False
1-methyladenosine
True


# section 2:

In [51]:
seq=AASequence.fromString("DFPIANGER")


In [52]:
pref=seq.getPrefix(3)
suf=seq.getSuffix(3)
newseq=seq+seq
print("Sequence:", seq)
print("Prefix:", pref)
print("Suffix:", suf)
print("Concatenated:", newseq)

Sequence: DFPIANGER
Prefix: DFP
Suffix: GER
Concatenated: DFPIANGERDFPIANGER


In [56]:
MW=seq.getMonoWeight()
mprec=seq.getMonoWeight(Residue.ResidueType.Full,2)
mz=seq.getMonoWeight(Residue.ResidueType.Full, 2)
mz = seq.getMZ(2) 

In [57]:
print("Monoisotopic mass of peptide [M] is", MW)
print("Monoisotopic mass of peptide precursor [M+2H]2+ is", mprec)
print("Monoisotopic m/z of [M+2H]2+ is", mz)

Monoisotopic mass of peptide [M] is 1017.4879641373001
Monoisotopic mass of peptide precursor [M+2H]2+ is 1019.5025170708421
Monoisotopic m/z of [M+2H]2+ is 509.7512585354211


In [58]:
print("The peptide", seq, "consists of the following amino acids:")
for aa in seq:
    print(aa.getName(), ":", aa.getMonoWeight())

The peptide DFPIANGER consists of the following amino acids:
Aspartate : 133.03750922330002
Phenylalanine : 165.0789793509
Proline : 115.0633292871
Isoleucine : 131.0946294147
Alanine : 89.04767922330001
Asparagine : 132.0534932552
Glycine : 75.0320291595
Glutamate : 147.0531592871
Arginine : 174.1116764466


In [60]:
seq = AASequence.fromString("C[143]PKCK(Label:13C(6)15N(2))CR")
seq.toString()

'.(Pyro-carbamidomethyl)CPKCK(Label:13C(6)15N(2))CR'

In [64]:
if seq.hasNTerminalModification():
    print("N-Term Modification: ",seq.getNTerminalModification().getFullId())
if seq.hasCTerminalModification():
    print("C-Term Modification: ", seq.getCTerminalModification().getFullId())   

N-Term Modification:  Pyro-carbamidomethyl (N-term C)


In [68]:
for i in seq:
    if(i.isModified()):
        print(i.getName(),":",i.getMonoWeight(),":",i.getModificationName())
    else:
        print(i.getName(),":",i.getMonoWeight())

Cysteine : 121.0197499533
Proline : 115.0633292871
Lysine : 146.1055284466
Cysteine : 121.0197499533
Lysine : 154.11972844660002 : Label:13C(6)15N(2)
Cysteine : 121.0197499533
Arginine : 174.1116764466


In [69]:
seq = AASequence.fromString("DFPIANGER")

print("Peptide", seq, "has molecular formula",seq.getFormula())

Peptide DFPIANGER has molecular formula C44H67N13O15


## Isotope patterns

## Fragment ions

## Modified Sequences

In [71]:
seq = AASequence.fromString("PEPTIDESEKUEM(Oxidation)CER")


In [72]:
    print(seq.toUnmodifiedString())
    print(seq.toString())
    print(seq.toUniModString())
    print(seq.toBracketString())
    print(seq.toBracketString(False))

    print(AASequence.fromString("DFPIAM(UniMod:35)GER"))
    print(AASequence.fromString("DFPIAM[+16]GER"))
    print(AASequence.fromString("DFPIAM[+15.99]GER"))
    print(AASequence.fromString("DFPIAM[147]GER"))
    print(AASequence.fromString("DFPIAM[147.035405]GER"))

PEPTIDESEKUEMCER
PEPTIDESEKUEM(Oxidation)CER
PEPTIDESEKUEM(UniMod:35)CER
PEPTIDESEKUEM[147]CER
PEPTIDESEKUEM[147.035400017100017]CER
DFPIAM(Oxidation)GER
DFPIAM(Oxidation)GER
DFPIAM(Oxidation)GER
DFPIAM(Oxidation)GER
DFPIAM(Oxidation)GER


In [73]:
    s = AASequence.fromString(".(Dimethyl)DFPIAMGER.")
    print(s, s.hasNTerminalModification())
    s = AASequence.fromString(".DFPIAMGER.(Label:18O(2))")
    print(s, s.hasCTerminalModification())
    s = AASequence.fromString(".DFPIAMGER(Phospho).")
    print(s, s.hasCTerminalModification())

.(Dimethyl)DFPIAMGER True
DFPIAMGER.(Label:18O(2)) True
DFPIAMGER(Phospho) False


In [74]:
    bsa = FASTAEntry() # one entry in a FASTA file
    bsa.sequence = "MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGE"
    bsa.description = "BSA Bovine Albumin (partial sequence)"
    bsa.identifier = "BSA"
    alb = FASTAEntry()
    alb.sequence = "MKWVTFISLLFLFSSAYSRGVFRRDAHKSEVAHRFKDLGE"
    alb.description = "ALB Human Albumin (partial sequence)"
    alb.identifier = "ALB"

    entries = [bsa, alb]

    f = FASTAFile()
    f.store("example.fasta", entries)

In [76]:
    entries = []
    f = FASTAFile()
    f.load("example.fasta", entries)
    print( len(entries) )
    for e in entries:
      print (e.identifier, e.sequence)

2
BSA MKWVTFISLLLLFSSAYSRGVFRRDTHKSEIAHRFKDLGE
ALB MKWVTFISLLFLFSSAYSRGVFRRDAHKSEVAHRFKDLGE
