In [1]:
from pyopenms import *


# Build a peptide from its one-letter string form, then derive related sequences.
seq = AASequence.fromString("DFPIANGER")

prefix = seq.getPrefix(4)   # leading four residues
suffix = seq.getSuffix(5)   # trailing five residues
concat = seq + seq          # `+` joins two AASequence objects end to end

# Show the original peptide next to everything derived from it.
print(f"Sequence: {seq}")
print(f"Prefix: {prefix}")
print(f"Suffix: {suffix}")
print(f"Concatenated: {concat}")

Sequence: DFPIANGER
Prefix: DFPI
Suffix: ANGER
Concatenated: DFPIANGERDFPIANGER


In [5]:
from pyopenms import *

# Second example peptide; the following cells keep working on this `seq`.
seq = AASequence.fromString("RANIAAHMED")
prefix = seq.getPrefix(3)  # leading three residues

print(f"Sequence: {seq}")
print(f"Prefix: {prefix}")

Sequence: RANIAAHMED
Prefix: RAN


In [6]:
# Trailing four residues of the peptide currently held in `seq`.
suffix = seq.getSuffix(4)
print(str(suffix))

HMED


In [7]:
# Join the peptide to a copy of itself and show the combined sequence.
concat = seq + seq
print(str(concat))

RANIAAHMEDRANIAAHMED


In [8]:
# Monoisotopic mass of the whole peptide held in `seq`.
mfull = seq.getMonoWeight()
print(f"Monoisotopic mass of peptide [M] is {mfull}")


Monoisotopic mass of peptide [M] is 1126.5189470906


In [12]:
# Iterating an AASequence yields its residues one at a time, in sequence order.
seq = AASequence.fromString("RANIA")
print(f"The peptide {seq} consists of the following amino acids:")
for residue in seq:
    # One line per residue: full name followed by its monoisotopic weight.
    print(f"{residue.getName()} : {residue.getMonoWeight()}")

The peptide RANIA consists of the following amino acids:
Arginine : 174.1116764466
Alanine : 89.0476792233
Asparagine : 132.0534932552
Isoleucine : 131.0946294147
Alanine : 89.0476792233


In [13]:
# Elemental composition of the peptide; the next cell reuses this `seq`.
seq = AASequence.fromString("RANIA")
seq_formula = seq.getFormula()
print(f"Peptide {seq} has molecular formula {seq_formula}")

Peptide RANIA has molecular formula C22H41N9O7


In [14]:
# Derive a C-terminal fragment (y-ion) of the peptide in `seq` and report its
# sequence, m/z and elemental formula for a doubly charged ion.
#
# y-ions are numbered by how many residues they contain, so a two-residue
# suffix is the y2 ion. The label is derived from the length so the two
# cannot drift apart again.
ION_LENGTH = 2   # number of C-terminal residues kept in the fragment
ION_CHARGE = 2   # charge state used for both the formula and the m/z

suffix = seq.getSuffix(ION_LENGTH)
ion_label = f"y{ION_LENGTH}"

print(f"{ion_label} ion sequence:", suffix)

y_ion_formula = suffix.getFormula(Residue.ResidueType.YIon, ION_CHARGE)

# m/z = mass of the charged ion divided by its charge; computed once and reused.
y_ion_mz = suffix.getMonoWeight(Residue.ResidueType.YIon, ION_CHARGE) / float(ION_CHARGE)

print(f"{ion_label} mz:", y_ion_mz)

print(f"{ion_label} molecular formula:", y_ion_formula)

y3 ion sequence: IA
y3 mz: 102.07314825387101
y3 molecular formula: C9H18N2O3


In [15]:
# Parse a modified peptide, then print it in each supported textual form.
seq = AASequence.fromString("AHMED(Oxidation) HEIKAL")

renderings = (
    seq.toUnmodifiedString(),     # residues only, modification dropped
    seq.toString(),               # modification written by name
    seq.toUniModString(),         # modification written as a UniMod accession
    seq.toBracketString(),        # modified residue written as a bracketed mass
    seq.toBracketString(False),   # bracketed mass, non-default flag value
)
for rendering in renderings:
    print(rendering)

AHMEDHEIKAL
AHMED(Oxidation)HEIKAL
AHMED(UniMod:35)HEIKAL
AHMED[131]HEIKAL
AHMED[131.021859159499968]HEIKAL


In [16]:
# The same parser accepts several ways of writing a modification.
# Each input is parsed and printed back, one result per line.
modification_notations = (
    "AHMED(UniMod:35)RA",      # UniMod accession
    "AHMED[+16]RA",            # integer mass delta
    "AHMED[+15.99]RA",         # decimal mass delta
    "AHMED[147]RA",            # integer bracketed mass
    "AHMED[147.035405]HEI",    # decimal bracketed mass
)
for notation in modification_notations:
    print(AASequence.fromString(notation))

AHMED(Oxidation)RA
AHMED(Oxidation)RA
AHMED(Oxidation)RA
AHMED(Sulfide)RA
AHMED[147.035405]HEI


In [17]:
def _make_fasta_entry(identifier, description, sequence):
    """Return a FASTAEntry populated with the given identifier, description and sequence."""
    entry = FASTAEntry()
    entry.sequence = sequence
    entry.description = description
    entry.identifier = identifier
    return entry


# Two example records to write out.
bsa = _make_fasta_entry(
    "BSA",
    "BSA (partial sequence)",
    "AASDDDFDSGFDFHRTFHJGYR",
)
alb = _make_fasta_entry(
    "ALB",
    "ALB (partial sequence)",
    "NNNNNNNNNNNNNNNNNNNNNNNNNNNN",
)

entries = [bsa, alb]

# Write both records to a FASTA file in the current working directory.
f = FASTAFile()
f.store("example.fasta", entries)

In [18]:
# Read the FASTA file back; `load` fills the list passed to it.
entries = []
f = FASTAFile()
f.load("example.fasta", entries)

# Number of records read, then one "identifier sequence" line per record.
print(len(entries))
for record in entries:
    print(f"{record.identifier} {record.sequence}")

2
BSA AASDDDFDSGFDFHRTFHJGYR
ALB NNNNNNNNNNNNNNNNNNNNNNNNNNNN
