In [8]:
from Bio.Data import CodonTable

# Codon tables are looked up by their NCBI translation-table id.
# Id 1 is the Standard table (see the printed header below); id 2 is the
# Vertebrate Mitochondrial table according to the Biopython tutorial.
standard_table = CodonTable.unambiguous_dna_by_id[1]
mito_table = CodonTable.unambiguous_dna_by_id[2]

In [9]:
# Render the codon grid as text: the first base runs down the left edge, the
# second base across the top, and the third base down the right edge.
# Codons tagged "(s)" are the ones the table lists as start codons.
print(standard_table)

Table 1 Standard, SGC0

  |  T      |  C      |  A      |  G      |
--+---------+---------+---------+---------+--
T | TTT F   | TCT S   | TAT Y   | TGT C   | T
T | TTC F   | TCC S   | TAC Y   | TGC C   | C
T | TTA L   | TCA S   | TAA Stop| TGA Stop| A
T | TTG L(s)| TCG S   | TAG Stop| TGG W   | G
--+---------+---------+---------+---------+--
C | CTT L   | CCT P   | CAT H   | CGT R   | T
C | CTC L   | CCC P   | CAC H   | CGC R   | C
C | CTA L   | CCA P   | CAA Q   | CGA R   | A
C | CTG L(s)| CCG P   | CAG Q   | CGG R   | G
--+---------+---------+---------+---------+--
A | ATT I   | ACT T   | AAT N   | AGT S   | T
A | ATC I   | ACC T   | AAC N   | AGC S   | C
A | ATA I   | ACA T   | AAA K   | AGA R   | A
A | ATG M(s)| ACG T   | AAG K   | AGG R   | G
--+---------+---------+---------+---------+--
G | GTT V   | GCT A   | GAT D   | GGT G   | T
G | GTC V   | GCC A   | GAC D   | GGC G   | C
G | GTA V   | GCA A   | GAA E   | GGA G   | A
G | GTG V   | GCG A   | GAG E   | GGG G   | G
--+---------+---------+---------+---------+--

In [10]:
from Bio import SeqIO

# Location of the single-record FASTA file to analyse.
# NOTE(review): this is an absolute, user-specific path; the notebook will not
# run on another machine until it is pointed at a local copy of the file.
file_path = '/Users/ashwinnallamothu/Desktop/rest.uniprot.org_uniprotkb_G3ECR1.fasta.txt'  # Replace with your file path

# Parse the file into one record; the residues themselves live on `.seq`.
sequence = SeqIO.read(file_path, 'fasta')

# Derive both summary numbers first, then report them together.
seq_length = len(sequence.seq)
aa_count = sequence.seq.count("A")  # Replace with any amino acid you want to count

# Total number of residues in the record.
print(f"Sequence Length: {seq_length}")
# Occurrences of a single residue (alanine), not a full composition table.
print(f"Number of Alanine (A) residues: {aa_count}")


Sequence Length: 1409
Number of Alanine (A) residues: 64


In [13]:
# Average molecular masses of the 20 standard amino acids, keyed by one-letter
# code. The values are for the free amino acids (water included), which is why
# the molecular-weight calculation subtracts one water per peptide bond.
# Insertion order matters: it is the order used when the composition is printed.
aa_masses = {
    'A': 89.09,   # Alanine
    'R': 174.20,  # Arginine
    'N': 132.12,  # Asparagine
    'D': 133.10,  # Aspartic acid
    'C': 121.15,  # Cysteine
    'E': 147.13,  # Glutamic acid
    'Q': 146.15,  # Glutamine
    'G': 75.07,   # Glycine
    'H': 155.16,  # Histidine
    'I': 131.17,  # Isoleucine
    'L': 131.17,  # Leucine
    'K': 146.19,  # Lysine
    'M': 149.21,  # Methionine
    'F': 165.19,  # Phenylalanine
    'P': 115.13,  # Proline
    'S': 105.09,  # Serine
    'T': 119.12,  # Threonine
    'W': 204.23,  # Tryptophan
    'Y': 181.19,  # Tyrosine
    'V': 117.15,  # Valine
}

# Function to calculate molecular weight
def calculate_molecular_weight(sequence, aa_masses, water_mass=18.015):
    """Return the molecular weight of a linear peptide.

    Parameters
    ----------
    sequence : str or other sized iterable of one-letter residue codes
        The peptide, N- to C-terminus.
    aa_masses : mapping
        Mass of each *free* amino acid, keyed by one-letter code.
    water_mass : float, optional
        Mass removed per peptide bond (one water molecule). Defaults to
        18.015, the value the calculation has always used.

    Returns
    -------
    float
        Sum of the residue masses minus one ``water_mass`` for each of the
        ``len(sequence) - 1`` peptide bonds; ``0.0`` for an empty sequence.

    Raises
    ------
    KeyError
        If ``sequence`` contains a code that is missing from ``aa_masses``.
    """
    # An empty peptide has no residues and no bonds. Without this guard the
    # formula below would subtract (0 - 1) waters and report +water_mass.
    if len(sequence) == 0:
        return 0.0

    total_free_mass = sum(aa_masses[aa] for aa in sequence)
    peptide_bonds = len(sequence) - 1
    return total_free_mass - peptide_bonds * water_mass  # subtracting the water mass released during peptide bond formation

# Function to calculate amino acid composition
def calculate_aa_composition(sequence, residues=None):
    """Count how often each residue code occurs in ``sequence``.

    Parameters
    ----------
    sequence : iterable of str
        One-letter residue codes, e.g. a plain string.
    residues : iterable of str, optional
        The codes to report, in the order they should appear in the result.
        A mapping is accepted too (its keys are used). When omitted, the keys
        of the module-level ``aa_masses`` table are used, so existing
        single-argument calls behave exactly as before.

    Returns
    -------
    dict
        Every code from ``residues`` mapped to its count; codes that never
        occur are present with a count of 0.

    Raises
    ------
    KeyError
        If ``sequence`` contains a code that is not in ``residues``.
    """
    if residues is None:
        # Fall back to the notebook-wide table; iterating a dict yields its keys.
        residues = aa_masses

    # Pre-seed with zeros so absent residues still show up in the output.
    aa_comp = {aa: 0 for aa in residues}
    for aa in sequence:
        aa_comp[aa] += 1
    return aa_comp

# Amino acid sequence of Hemoglobin subunit beta
# NOTE(review): this rebinds `sequence`. The earlier FASTA cell (In [10]) bound
# the same name to the record returned by SeqIO.read; from here on it is a
# plain str, so re-running that earlier cell's `.seq` lines afterwards will fail.
sequence = "MVHLTPEEKSAVTALWGKVNVDEVGGEALGRLLVVYPWTQRFFESFGDLSTPDAVMGNPKVKAHGKKVLGAFSDGLAHLDNLKGTFATLSELHCDKLHVDPENFRLLGNVLVCVLAHHFGKEFTPPVQAAYQKVVAGVANALAHKYH"

# Calculating molecular weight
# (sum of the per-residue masses from aa_masses, minus one water per peptide bond)
mol_weight = calculate_molecular_weight(sequence, aa_masses)

# Calculating amino acid composition
# (a count for every key of aa_masses, including residues that never occur)
aa_comp = calculate_aa_composition(sequence)

# Print the results
# The weight is printed unrounded, so float noise in the last digits is expected.
print("Molecular Weight:", mol_weight)
print("Amino Acid Composition:", aa_comp)


Molecular Weight: 15998.339999999998
Amino Acid Composition: {'A': 15, 'R': 3, 'N': 6, 'D': 7, 'C': 2, 'E': 8, 'Q': 3, 'G': 13, 'H': 9, 'I': 0, 'L': 18, 'K': 11, 'M': 2, 'F': 8, 'P': 7, 'S': 5, 'T': 7, 'W': 2, 'Y': 3, 'V': 18}
