Selected descriptors from the modlAMP package were used to calculate physicochemical properties of the peptide sequences.

Reference:
Müller, A. T. et al. (2017). modlAMP: Python for antimicrobial peptides. Bioinformatics 33(17), 2753–2755. DOI: 10.1093/bioinformatics/btx285

## Set directory

In [1]:
pwd

'C:\\Users\\sakma\\Proyectos python\\Artículo ordenado'

## Modules

In [2]:
pip install modlamp




In [1]:
import pandas                      as pd
import numpy                       as np
import matplotlib.pyplot           as plt
import csv
from modlamp.descriptors import PeptideDescriptor, GlobalDescriptor

## Global Descriptors

In [2]:
# Compute modlamp's global descriptors for every peptide in the training
# FASTA file and export them to a CSV file.
Global_training_ds = GlobalDescriptor("Training_dataset.fasta")

# `amide` and `ph` are forwarded to modlamp unchanged.
# NOTE(review): per the modlamp docs these mean "no C-terminal amidation" and
# "evaluate charge-dependent descriptors at pH 7.4" -- confirm against the
# installed version.
Global_training_ds.calculate_all(amide=False, ph=7.4)

# After calculate_all() the results are available as
# Global_training_ds.featurenames and Global_training_ds.descriptor; inspect
# them as the last expression of a separate cell if a display is wanted.

# Header line handed to save_descriptor().
# NOTE(review): the header contains a stray space before "Sequence" and the
# spelling "AliphatiIndex". Both are kept exactly as they were because code
# that later reads this CSV may rely on these column names -- fix them here
# and in the consumers together.
colnames_GD = 'ID, Sequence,Length,MW,Charge,ChargeDensity,pI,InstabilityIndex,Aromaticity,AliphatiIndex,BomanIndex,HydrophobicRatio'

# NOTE(review): absolute, machine-specific output path; consider a path
# relative to the notebook directory so the notebook runs elsewhere.
Global_training_ds.save_descriptor(
    'C:\\Users\\sakma\\Proyectos python\\Artículo ordenado\\modlamps_global_descriptos.csv',
    header=colnames_GD,
)

## Peptide Descriptors

In [3]:
# For every amino-acid scale listed below, build a PeptideDescriptor for the
# training FASTA file and compute its global mean value per peptide.
_TRAINING_FASTA = "Training_dataset.fasta"

# Scale identifiers, in the order Training_ds_PD1 ... Training_ds_PD28.
_SCALE_NAMES = (
    "AASI",           # amino acid selectivity index
    "ABHPRK",         # physicochemical feature scale
    "argos",          # hydrophobicity scale
    "bulkiness",      # bulkiness scale
    "charge_phys",
    "charge_acid",
    "cougar",         # modlabs in-house selection of global peptide descriptors
    "eisenberg",      # hydrophobicity scale
    "Ez",             # potential that assesses energies
    "flexibility",    # flexibility scale
    "grantham",       # polarity and molecular volume
    "gravy",          # hydrophobicity scale
    "ISAECI",         # Isotropic Surface Area and Electronic Charge Index
    "janin",          # hydrophobicity scale
    "kytedoolittle",  # hydrophobicity scale
    "levitt_alpha",   # alpha-helix propensity scale
    "MSS",            # graph-theoretical index
    "MSW",            # molecular surface based WHIM descriptor
    "pepArc",         # pharmacophoric feature scale
    "pepcats",        # pharmacophoric feature scale
    "polarity",       # polarity scale
    "PPCALI",         # amino acid property scales
    "refractivity",   # relative amino acid refractivity values
    "t_scale",        # PCA derived scale based on amino acid
    "TM_tend",        # amino acid transmembrane propensity scale
    "z3",             # three dimensional Z-scale
    "z5",             # five dimensional Z-scale
    "hopp-woods",     # hydrophobicity scale
)

_scale_descriptors = []
for _scale_name in _SCALE_NAMES:
    _scale_descriptor = PeptideDescriptor(_TRAINING_FASTA, _scale_name)
    # NOTE(review): window=1000 presumably exceeds every peptide length so the
    # mean is taken over the whole sequence -- confirm against the modlamp
    # documentation of calculate_global().
    _scale_descriptor.calculate_global(window=1000, modality='mean')
    _scale_descriptors.append(_scale_descriptor)

# Keep the individual names that other cells refer to.  The unpacking also
# fails loudly if the number of scales and the number of names ever diverge.
(
    Training_ds_PD1, Training_ds_PD2, Training_ds_PD3, Training_ds_PD4,
    Training_ds_PD5, Training_ds_PD6, Training_ds_PD7, Training_ds_PD8,
    Training_ds_PD9, Training_ds_PD10, Training_ds_PD11, Training_ds_PD12,
    Training_ds_PD13, Training_ds_PD14, Training_ds_PD15, Training_ds_PD16,
    Training_ds_PD17, Training_ds_PD18, Training_ds_PD19, Training_ds_PD20,
    Training_ds_PD21, Training_ds_PD22, Training_ds_PD23, Training_ds_PD24,
    Training_ds_PD25, Training_ds_PD26, Training_ds_PD27, Training_ds_PD28,
) = _scale_descriptors

In [4]:
# Combine the 28 per-scale results into one table (one row per peptide, one
# column per scale) and write it to CSV.
_scale_results = (
    Training_ds_PD1, Training_ds_PD2, Training_ds_PD3, Training_ds_PD4,
    Training_ds_PD5, Training_ds_PD6, Training_ds_PD7, Training_ds_PD8,
    Training_ds_PD9, Training_ds_PD10, Training_ds_PD11, Training_ds_PD12,
    Training_ds_PD13, Training_ds_PD14, Training_ds_PD15, Training_ds_PD16,
    Training_ds_PD17, Training_ds_PD18, Training_ds_PD19, Training_ds_PD20,
    Training_ds_PD21, Training_ds_PD22, Training_ds_PD23, Training_ds_PD24,
    Training_ds_PD25, Training_ds_PD26, Training_ds_PD27, Training_ds_PD28,
)

# Stack the descriptor arrays side by side instead of zip()-ing their rows.
# NOTE(review): the modlamp docs show `.descriptor` as a 2-D array with one
# row per sequence; zipping such arrays would place 1-element arrays in every
# DataFrame cell and the CSV would then contain text like "[0.12]" instead of
# numbers -- confirm against the installed modlamp version.
# np.column_stack yields a plain numeric (n_peptides, 28) table for both 1-D
# and (n, 1) inputs; if a scale ever produced more than one column, the
# DataFrame construction below raises because of the column-count mismatch.
# DsResultList stays a list of rows under its existing name.
DsResultList = np.column_stack(
    [result.descriptor for result in _scale_results]
).tolist()

# Column labels, in the same order as the descriptor objects above.
Training_dsResultsDF = pd.DataFrame(
    DsResultList,
    columns=[
        'AASI', 'ABHPRK', 'argos', 'bulkiness', 'charge_phys', 'charge_acid',
        'cougar', 'eisenberg', 'Ez', 'flexibility', 'grantham', 'gravy',
        'ISAECI', 'janin', 'kytedoolittle', 'levitt_alpha', 'MSS', 'MSW',
        'pepArc', 'pepcats', 'polarity', 'PPCALI', 'refractivity', 't_scale',
        'TM_tend', 'z3', 'z5', "hopp-woods",
    ],
)

# Save the table, keeping the row index and the header row.
# NOTE(review): absolute, machine-specific output path; consider a path
# relative to the notebook directory so the notebook runs elsewhere.
Training_dsResultsDF.to_csv(
    'C:\\Users\\sakma\\Proyectos python\\Artículo ordenado\\Modlamp_Peptide_descriptors.csv',
    index=True,
    header=True,
)