# List of the 20 standard amino acids in peptides



In [6]:
#!pip install tabulate
from tabulate import tabulate

# Per-residue property table for the 20 standard amino acids.
# Each row is a list laid out as:
#   [one-letter code, three-letter code, name,
#    hydrogen-bonding flag, sulfur flag, resonance-structure flag]
# (column meanings follow the headers passed to tabulate below).
#
# NOTE(review): Arg carries resonance flag 0 while Cys carries 1. The
# guanidinium group of Arg is usually described as resonance-stabilised and
# the Cys thiol is not -- confirm the intended criterion for this column.
amino_acids = [
    [code, abbrev, name, h_bond, sulfur, resonance]
    for code, abbrev, name, h_bond, sulfur, resonance in (
        ("A", "Ala", "Alanine", 0, 0, 0),
        ("R", "Arg", "Arginine", 1, 0, 0),
        ("N", "Asn", "Asparagine", 1, 0, 1),
        ("D", "Asp", "Aspartic acid", 1, 0, 1),
        ("C", "Cys", "Cysteine", 0, 1, 1),
        ("E", "Glu", "Glutamic acid", 1, 0, 1),
        ("Q", "Gln", "Glutamine", 1, 0, 1),
        ("G", "Gly", "Glycine", 0, 0, 0),
        ("H", "His", "Histidine", 1, 0, 1),
        ("I", "Ile", "Isoleucine", 0, 0, 0),
        ("L", "Leu", "Leucine", 0, 0, 0),
        ("K", "Lys", "Lysine", 1, 0, 0),
        ("M", "Met", "Methionine", 0, 1, 0),
        ("F", "Phe", "Phenylalanine", 0, 0, 1),
        ("P", "Pro", "Proline", 0, 0, 0),
        ("S", "Ser", "Serine", 1, 0, 0),
        ("T", "Thr", "Threonine", 1, 0, 0),
        ("W", "Trp", "Tryptophan", 1, 0, 1),
        ("Y", "Tyr", "Tyrosine", 1, 0, 1),
        ("V", "Val", "Valine", 0, 0, 0),
    )
]

# Render the amino-acid property table as a boxed text grid, one column per
# header in the order the row values are stored.
print(
    tabulate(
        amino_acids,
        headers=[
            "One-Letter Code",
            "Three-Letter Code",
            "Name",
            "Hydrogen Bonding",
            "Sulfur",
            "Resonance Structure",
        ],
        tablefmt="fancy_grid",
    )
)

╒═══════════════════╤═════════════════════╤═══════════════╤════════════════════╤══════════╤═══════════════════════╕
│ One-Letter Code   │ Three-Letter Code   │ Name          │   Hydrogen Bonding │   Sulfur │   Resonance Structure │
╞═══════════════════╪═════════════════════╪═══════════════╪════════════════════╪══════════╪═══════════════════════╡
│ A                 │ Ala                 │ Alanine       │                  0 │        0 │                     0 │
├───────────────────┼─────────────────────┼───────────────┼────────────────────┼──────────┼───────────────────────┤
│ R                 │ Arg                 │ Arginine      │                  1 │        0 │                     0 │
├───────────────────┼─────────────────────┼───────────────┼────────────────────┼──────────┼───────────────────────┤
│ N                 │ Asn                 │ Asparagine    │                  1 │        0 │                     1 │
├───────────────────┼─────────────────────┼───────────────┼─────────────

In [16]:
import pandas as pd

# Load the PA database CSV into a DataFrame.
file_path = 'PA_Database.csv'
df = pd.read_csv(file_path)

# Keep only the first `n_peptides` rows of the sequence column. The column is
# selected by its header ("Pep Seq") instead of by position, so the selection
# keeps working if columns are added to or reordered in the CSV.
n_peptides = 579
peptide_seq = df['Pep Seq'].iloc[:n_peptides]

# Sanity-check both ends of the selection.
print(peptide_seq.head(10))
print(peptide_seq.tail(10))

0    GG
1    GG
2    AG
3    AG
4    AA
5    AA
6    LG
7    LG
8    FG
9    FG
Name: Pep Seq, dtype: object
569           GANPNAAG
570      AAAAGGGEIKVAV
571      AAAAGGGEIKVAV
572             KKLLAK
573         RGDSKKLLAK
574    AAAAGGGLRKKLGKA
575    AAAAGGGLLGARKKK
576            AAAAAAD
577            AAAAAAK
578           GAAVILRR
Name: Pep Seq, dtype: object


In [20]:
#!pip install biopython
from Bio.SeqUtils import ProtParam

def calculate_hydrophobicity(sequence):
    """Return the GRAVY hydrophobicity score of a peptide sequence.

    Parameters
    ----------
    sequence : str
        Peptide sequence written in one-letter amino-acid codes.

    Returns
    -------
    float
        The value of Biopython's ``ProteinAnalysis(sequence).gravy()``.

    Notes
    -----
    No validation is done here; whatever Biopython raises for an input it
    cannot score propagates to the caller.
    """
    return ProtParam.ProteinAnalysis(sequence).gravy()

# Score every selected peptide sequence.
hydrophobicities = peptide_seq.apply(calculate_hydrophobicity)

# Attach the scores to the full table; the assignment aligns on the index.
df['Hydrophobicity'] = hydrophobicities

# Write the augmented table to a new CSV, leaving the source file untouched.
new_file_path = 'Modified_PA_Database.csv'
df.to_csv(new_file_path, index=False)

# Preview the first ten rows and rows 569-578 of the scored peptides.
preview_columns = ['Pep Seq', 'Hydrophobicity']
print(df[preview_columns].head(10))
print(df[preview_columns].iloc[569:579])

  Pep Seq  Hydrophobicity
0      GG            -0.4
1      GG            -0.4
2      AG             0.7
3      AG             0.7
4      AA             1.8
5      AA             1.8
6      LG             1.7
7      LG             1.7
8      FG             1.2
9      FG             1.2
             Pep Seq  Hydrophobicity
569         GANPNAAG       -0.500000
570    AAAAGGGEIKVAV        1.023077
571    AAAAGGGEIKVAV        1.023077
572           KKLLAK       -0.383333
573       RGDSKKLLAK       -1.150000
574  AAAAGGGLRKKLGKA       -0.080000
575  AAAAGGGLLGARKKK       -0.080000
576          AAAAAAD        1.042857
577          AAAAAAK        0.985714
578         GAAVILRR        0.837500
