This notebook uses several functions from the modlAMP package to compute physico-chemical descriptors from peptide primary sequences.

Müller A. T. et al. (2017) modlAMP: Python for antimicrobial peptides, Bioinformatics 33, (17), 2753-2755, DOI:10.1093/bioinformatics/btx285.

#### Set working directory

In [1]:
import os

# Project root against which the relative paths used in this notebook
# ('./Data/...', './Descriptors/...') are resolved.
# Set the MODLAMP_MODELS_DIR environment variable to run the notebook on another
# machine; when it is unset, the original author's local path is used unchanged.
models_dir = os.environ.get('MODLAMP_MODELS_DIR', '/Users/fabienplisson/Desktop/MODELS/')
os.chdir(models_dir)
print(os.getcwd())

/Users/fabienplisson/Desktop/MODELS


#### Install modules

In [2]:
# Pip install modules
# Each line shells out (IPython `!` escape) and runs pip through the interpreter
# behind this kernel (`sys.executable`), so packages land in the kernel's environment.
# NOTE(review): no versions are pinned, so a re-run may install different releases.
import sys
!{sys.executable} -m pip install --upgrade pip
!{sys.executable} -m pip install modlamp
# NOTE(review): nothing in the visible part of this notebook imports mysql —
# confirm this install is still needed and that the package name is the intended one.
!{sys.executable} -m pip install mysql.connector

Collecting pip
  Downloading pip-20.2-py2.py3-none-any.whl (1.5 MB)
[K     |████████████████████████████████| 1.5 MB 1.4 MB/s 
[?25hInstalling collected packages: pip
  Attempting uninstall: pip
    Found existing installation: pip 20.1.1
    Uninstalling pip-20.1.1:
      Successfully uninstalled pip-20.1.1
Successfully installed pip-20.2


In [3]:
import matplotlib.pyplot as plt
import pandas as pd

#### Calculate Descriptors

In [41]:
from modlamp.descriptors import PeptideDescriptor, GlobalDescriptor

Peptides from APD database

In [47]:
# APD peptides (author's note: N=3081).
# Both descriptor objects are built from the same FASTA file.
fasta_totalAPD = './Data/total_APD.fasta'
pepdesc_totalAPD = PeptideDescriptor(fasta_totalAPD, 'eisenberg')
globdesc_totalAPD = GlobalDescriptor(fasta_totalAPD)

Peptides HemoPI-1 from Hemolytik

In [28]:
# HemoPI-1, model set, class 1 (author's note: N=442).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI1pm = './Data/Hemolytik_datasets/HemoPI-1/HemoPI-1_model_class1.fasta'
pepdesc_HemoPI1pm = PeptideDescriptor(fasta_HemoPI1pm, 'eisenberg')
globdesc_HemoPI1pm = GlobalDescriptor(fasta_HemoPI1pm)

In [29]:
# HemoPI-1, model set, class 0 (author's note: N=442).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI1nm = './Data/Hemolytik_datasets/HemoPI-1/HemoPI-1_model_class0.fasta'
pepdesc_HemoPI1nm = PeptideDescriptor(fasta_HemoPI1nm, 'eisenberg')
globdesc_HemoPI1nm = GlobalDescriptor(fasta_HemoPI1nm)

In [30]:
# HemoPI-1, validation set, class 1 (author's note: N=110).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI1pv = './Data/Hemolytik_datasets/HemoPI-1/HemoPI-1_validation_class1.fasta'
pepdesc_HemoPI1pv = PeptideDescriptor(fasta_HemoPI1pv, 'eisenberg')
globdesc_HemoPI1pv = GlobalDescriptor(fasta_HemoPI1pv)

In [31]:
# HemoPI-1, validation set, class 0 (author's note: N=110).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI1nv = './Data/Hemolytik_datasets/HemoPI-1/HemoPI-1_validation_class0.fasta'
pepdesc_HemoPI1nv = PeptideDescriptor(fasta_HemoPI1nv, 'eisenberg')
globdesc_HemoPI1nv = GlobalDescriptor(fasta_HemoPI1nv)

Peptides HemoPI-2 from Hemolytik

In [19]:
# HemoPI-2, model set, class 1 (author's note: N=442).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI2pm = './Data/Hemolytik_datasets/HemoPI-2/HemoPI-2_model_class1.fasta'
pepdesc_HemoPI2pm = PeptideDescriptor(fasta_HemoPI2pm, 'eisenberg')
globdesc_HemoPI2pm = GlobalDescriptor(fasta_HemoPI2pm)

In [20]:
# HemoPI-2, model set, class 0 (author's note: N=370).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI2nm = './Data/Hemolytik_datasets/HemoPI-2/HemoPI-2_model_class0.fasta'
pepdesc_HemoPI2nm = PeptideDescriptor(fasta_HemoPI2nm, 'eisenberg')
globdesc_HemoPI2nm = GlobalDescriptor(fasta_HemoPI2nm)

In [21]:
# HemoPI-2, validation set, class 1 (author's note: N=110).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI2pv = './Data/Hemolytik_datasets/HemoPI-2/HemoPI-2_validation_class1.fasta'
pepdesc_HemoPI2pv = PeptideDescriptor(fasta_HemoPI2pv, 'eisenberg')
globdesc_HemoPI2pv = GlobalDescriptor(fasta_HemoPI2pv)

In [22]:
# HemoPI-2, validation set, class 0 (author's note: N=92).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI2nv = './Data/Hemolytik_datasets/HemoPI-2/HemoPI-2_validation_class0.fasta'
pepdesc_HemoPI2nv = PeptideDescriptor(fasta_HemoPI2nv, 'eisenberg')
globdesc_HemoPI2nv = GlobalDescriptor(fasta_HemoPI2nv)

Peptides HemoPI-3 from Hemolytik

In [23]:
# HemoPI-3, model set, class 1 (author's note: N=708).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI3pm = './Data/Hemolytik_datasets/HemoPI-3/HemoPI-3_model_class1.fasta'
pepdesc_HemoPI3pm = PeptideDescriptor(fasta_HemoPI3pm, 'eisenberg')
globdesc_HemoPI3pm = GlobalDescriptor(fasta_HemoPI3pm)

In [24]:
# HemoPI-3, model set, class 0 (author's note: N=590).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI3nm = './Data/Hemolytik_datasets/HemoPI-3/HemoPI-3_model_class0.fasta'
pepdesc_HemoPI3nm = PeptideDescriptor(fasta_HemoPI3nm, 'eisenberg')
globdesc_HemoPI3nm = GlobalDescriptor(fasta_HemoPI3nm)

In [25]:
# HemoPI-3, validation set, class 1 (author's note: N=177).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI3pv = './Data/Hemolytik_datasets/HemoPI-3/HemoPI-3_validation_class1.fasta'
pepdesc_HemoPI3pv = PeptideDescriptor(fasta_HemoPI3pv, 'eisenberg')
globdesc_HemoPI3pv = GlobalDescriptor(fasta_HemoPI3pv)

In [26]:
# HemoPI-3, validation set, class 0 (author's note: N=148).
# Both descriptor objects are built from the same FASTA file.
fasta_HemoPI3nv = './Data/Hemolytik_datasets/HemoPI-3/HemoPI-3_validation_class0.fasta'
pepdesc_HemoPI3nv = PeptideDescriptor(fasta_HemoPI3nv, 'eisenberg')
globdesc_HemoPI3nv = GlobalDescriptor(fasta_HemoPI3nv)

#### Peptide Descriptors

In [48]:
# Build the per-peptide descriptor table for the APD peptides and save it as CSV.
# Each amino-acid scale is loaded in turn and its calculation(s) are appended to the
# descriptor held by `pepdesc_totalAPD`. The order of calls must stay in sync with
# the column order of `col_names1` below.

# Eisenberg is handled on its own: its calculate_global() is the only call in this
# cell made without append=True; every later call appends to its result.
pepdesc_totalAPD.load_scale('eisenberg')
pepdesc_totalAPD.calculate_global()  # global Eisenberg hydrophobicity
pepdesc_totalAPD.calculate_moment(append=True)  # Eisenberg hydrophobic moment

# (scale name, calculations to append after loading it), in output-column order.
#   'global'   -> calculate_global(append=True)
#   'moment'   -> calculate_moment(append=True)
#   'autocorr' -> calculate_autocorr(1, append=True)  (window-1 autocorrelation)
descriptor_plan = [
    ('gravy', ('global', 'moment')),          # GRAVY hydrophobicity
    ('z3', ('autocorr',)),                    # Z scale (Z3_* columns)
    ('z5', ('autocorr',)),                    # Z scale (Z5_* columns)
    ('AASI', ('global', 'moment')),           # AASI index
    ('ABHPRK', ('global',)),                  # ABHPRK feature
    ('argos', ('global', 'moment')),          # argos index
    ('bulkiness', ('global', 'moment')),      # bulkiness index
    ('charge_phys', ('global',)),             # charge_phys index
    ('charge_acid', ('global',)),             # charge_acid index
    ('Ez', ('global',)),                      # energies of insertion of side chains into lipid bilayers
    ('flexibility', ('global', 'moment')),    # flexibility scale
    ('grantham', ('global',)),                # side chain composition, polarity and molecular volume
    ('hopp-woods', ('global', 'moment')),     # Hopp-Woods hydrophobicity
    ('ISAECI', ('global',)),                  # Isotropic Surface Area (ISA) / Electronic Charge Index (ECI)
    ('janin', ('global', 'moment')),          # Janin hydrophobicity
    ('kytedoolittle', ('global', 'moment')),  # Kyte & Doolittle hydrophobicity
    ('levitt_alpha', ('global', 'moment')),   # Levitt alpha-helix propensity
    ('MSS', ('global', 'moment')),            # graph-theoretical index of side chain shape and size
    ('MSW', ('global',)),                     # PCA of the MS-WHIM descriptor, extended to natural amino acids
    ('pepArc', ('global',)),                  # modlabs pharmacophoric feature scale
    ('pepcats', ('global',)),                 # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', ('global', 'moment')),       # amino acid polarity
    ('PPCALI', ('global',)),                  # modlabs in-house scale from a PCA of 143 property scales
    ('refractivity', ('global', 'moment')),   # relative amino acid refractivity
    ('t_scale', ('global',)),                 # PCA-derived scale from 6 GRID probes
    ('TM_tend', ('global', 'moment')),        # transmembrane propensity
]

for scale_name, calc_steps in descriptor_plan:
    pepdesc_totalAPD.load_scale(scale_name)
    for calc in calc_steps:
        if calc == 'autocorr':
            pepdesc_totalAPD.calculate_autocorr(1, append=True)
        elif calc == 'global':
            pepdesc_totalAPD.calculate_global(append=True)
        else:  # 'moment'
            pepdesc_totalAPD.calculate_moment(append=True)

# CSV header, kept byte-for-byte as in the original so existing readers of the file keep working.
# NOTE(review): several names carry a leading space (", Z5_1") or a typo
# ("modlas_ABHPRK", "B_Builkiness", "uH-HoppWoods") — fix together with any downstream code.
# NOTE(review): the header names one column per 'global'/'moment' call and 3 / 5 columns
# for z3 / z5 — confirm this matches the actual width of the saved descriptor.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_totalAPD.save_descriptor('./Descriptors/pep_descriptors_totalAPD.csv', header=col_names1)

Peptides from the Hemolytik database. Variable suffixes: class 1 & model (pm), class 0 & model (nm), class 1 & validation (pv), class 0 & validation (nv)

HemoPI-1 dataset

In [32]:
# Build the per-peptide descriptor table for HemoPI-1 (model set, class 1) and save it as CSV.
# Each amino-acid scale is loaded in turn and its calculation(s) are appended to the
# descriptor held by `pepdesc_HemoPI1pm`. The order of calls must stay in sync with
# the column order of `col_names1` below.

# Eisenberg is handled on its own: its calculate_global() is the only call in this
# cell made without append=True; every later call appends to its result.
pepdesc_HemoPI1pm.load_scale('eisenberg')
pepdesc_HemoPI1pm.calculate_global()  # global Eisenberg hydrophobicity
pepdesc_HemoPI1pm.calculate_moment(append=True)  # Eisenberg hydrophobic moment

# (scale name, calculations to append after loading it), in output-column order.
#   'global'   -> calculate_global(append=True)
#   'moment'   -> calculate_moment(append=True)
#   'autocorr' -> calculate_autocorr(1, append=True)  (window-1 autocorrelation)
descriptor_plan = [
    ('gravy', ('global', 'moment')),          # GRAVY hydrophobicity
    ('z3', ('autocorr',)),                    # Z scale (Z3_* columns)
    ('z5', ('autocorr',)),                    # Z scale (Z5_* columns)
    ('AASI', ('global', 'moment')),           # AASI index
    ('ABHPRK', ('global',)),                  # ABHPRK feature
    ('argos', ('global', 'moment')),          # argos index
    ('bulkiness', ('global', 'moment')),      # bulkiness index
    ('charge_phys', ('global',)),             # charge_phys index
    ('charge_acid', ('global',)),             # charge_acid index
    ('Ez', ('global',)),                      # energies of insertion of side chains into lipid bilayers
    ('flexibility', ('global', 'moment')),    # flexibility scale
    ('grantham', ('global',)),                # side chain composition, polarity and molecular volume
    ('hopp-woods', ('global', 'moment')),     # Hopp-Woods hydrophobicity
    ('ISAECI', ('global',)),                  # Isotropic Surface Area (ISA) / Electronic Charge Index (ECI)
    ('janin', ('global', 'moment')),          # Janin hydrophobicity
    ('kytedoolittle', ('global', 'moment')),  # Kyte & Doolittle hydrophobicity
    ('levitt_alpha', ('global', 'moment')),   # Levitt alpha-helix propensity
    ('MSS', ('global', 'moment')),            # graph-theoretical index of side chain shape and size
    ('MSW', ('global',)),                     # PCA of the MS-WHIM descriptor, extended to natural amino acids
    ('pepArc', ('global',)),                  # modlabs pharmacophoric feature scale
    ('pepcats', ('global',)),                 # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', ('global', 'moment')),       # amino acid polarity
    ('PPCALI', ('global',)),                  # modlabs in-house scale from a PCA of 143 property scales
    ('refractivity', ('global', 'moment')),   # relative amino acid refractivity
    ('t_scale', ('global',)),                 # PCA-derived scale from 6 GRID probes
    ('TM_tend', ('global', 'moment')),        # transmembrane propensity
]

for scale_name, calc_steps in descriptor_plan:
    pepdesc_HemoPI1pm.load_scale(scale_name)
    for calc in calc_steps:
        if calc == 'autocorr':
            pepdesc_HemoPI1pm.calculate_autocorr(1, append=True)
        elif calc == 'global':
            pepdesc_HemoPI1pm.calculate_global(append=True)
        else:  # 'moment'
            pepdesc_HemoPI1pm.calculate_moment(append=True)

# CSV header, kept byte-for-byte as in the original so existing readers of the file keep working.
# NOTE(review): several names carry a leading space (", Z5_1") or a typo
# ("modlas_ABHPRK", "B_Builkiness", "uH-HoppWoods") — fix together with any downstream code.
# NOTE(review): the header names one column per 'global'/'moment' call and 3 / 5 columns
# for z3 / z5 — confirm this matches the actual width of the saved descriptor.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI1pm.save_descriptor('./Descriptors/pep_descriptors_HemoPI1pm.csv', header=col_names1)

In [33]:
# Build the per-peptide descriptor table for HemoPI-1 (model set, class 0) and save it as CSV.
# Each amino-acid scale is loaded in turn and its calculation(s) are appended to the
# descriptor held by `pepdesc_HemoPI1nm`. The order of calls must stay in sync with
# the column order of `col_names1` below.

# Eisenberg is handled on its own: its calculate_global() is the only call in this
# cell made without append=True; every later call appends to its result.
pepdesc_HemoPI1nm.load_scale('eisenberg')
pepdesc_HemoPI1nm.calculate_global()  # global Eisenberg hydrophobicity
pepdesc_HemoPI1nm.calculate_moment(append=True)  # Eisenberg hydrophobic moment

# (scale name, calculations to append after loading it), in output-column order.
#   'global'   -> calculate_global(append=True)
#   'moment'   -> calculate_moment(append=True)
#   'autocorr' -> calculate_autocorr(1, append=True)  (window-1 autocorrelation)
descriptor_plan = [
    ('gravy', ('global', 'moment')),          # GRAVY hydrophobicity
    ('z3', ('autocorr',)),                    # Z scale (Z3_* columns)
    ('z5', ('autocorr',)),                    # Z scale (Z5_* columns)
    ('AASI', ('global', 'moment')),           # AASI index
    ('ABHPRK', ('global',)),                  # ABHPRK feature
    ('argos', ('global', 'moment')),          # argos index
    ('bulkiness', ('global', 'moment')),      # bulkiness index
    ('charge_phys', ('global',)),             # charge_phys index
    ('charge_acid', ('global',)),             # charge_acid index
    ('Ez', ('global',)),                      # energies of insertion of side chains into lipid bilayers
    ('flexibility', ('global', 'moment')),    # flexibility scale
    ('grantham', ('global',)),                # side chain composition, polarity and molecular volume
    ('hopp-woods', ('global', 'moment')),     # Hopp-Woods hydrophobicity
    ('ISAECI', ('global',)),                  # Isotropic Surface Area (ISA) / Electronic Charge Index (ECI)
    ('janin', ('global', 'moment')),          # Janin hydrophobicity
    ('kytedoolittle', ('global', 'moment')),  # Kyte & Doolittle hydrophobicity
    ('levitt_alpha', ('global', 'moment')),   # Levitt alpha-helix propensity
    ('MSS', ('global', 'moment')),            # graph-theoretical index of side chain shape and size
    ('MSW', ('global',)),                     # PCA of the MS-WHIM descriptor, extended to natural amino acids
    ('pepArc', ('global',)),                  # modlabs pharmacophoric feature scale
    ('pepcats', ('global',)),                 # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', ('global', 'moment')),       # amino acid polarity
    ('PPCALI', ('global',)),                  # modlabs in-house scale from a PCA of 143 property scales
    ('refractivity', ('global', 'moment')),   # relative amino acid refractivity
    ('t_scale', ('global',)),                 # PCA-derived scale from 6 GRID probes
    ('TM_tend', ('global', 'moment')),        # transmembrane propensity
]

for scale_name, calc_steps in descriptor_plan:
    pepdesc_HemoPI1nm.load_scale(scale_name)
    for calc in calc_steps:
        if calc == 'autocorr':
            pepdesc_HemoPI1nm.calculate_autocorr(1, append=True)
        elif calc == 'global':
            pepdesc_HemoPI1nm.calculate_global(append=True)
        else:  # 'moment'
            pepdesc_HemoPI1nm.calculate_moment(append=True)

# CSV header, kept byte-for-byte as in the original so existing readers of the file keep working.
# NOTE(review): several names carry a leading space (", Z5_1") or a typo
# ("modlas_ABHPRK", "B_Builkiness", "uH-HoppWoods") — fix together with any downstream code.
# NOTE(review): the header names one column per 'global'/'moment' call and 3 / 5 columns
# for z3 / z5 — confirm this matches the actual width of the saved descriptor.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI1nm.save_descriptor('./Descriptors/pep_descriptors_HemoPI1nm.csv', header=col_names1)

In [34]:
# Build the per-peptide descriptor table for HemoPI-1 (validation set, class 1) and save it as CSV.
# Each amino-acid scale is loaded in turn and its calculation(s) are appended to the
# descriptor held by `pepdesc_HemoPI1pv`. The order of calls must stay in sync with
# the column order of `col_names1` below.

# Eisenberg is handled on its own: its calculate_global() is the only call in this
# cell made without append=True; every later call appends to its result.
pepdesc_HemoPI1pv.load_scale('eisenberg')
pepdesc_HemoPI1pv.calculate_global()  # global Eisenberg hydrophobicity
pepdesc_HemoPI1pv.calculate_moment(append=True)  # Eisenberg hydrophobic moment

# (scale name, calculations to append after loading it), in output-column order.
#   'global'   -> calculate_global(append=True)
#   'moment'   -> calculate_moment(append=True)
#   'autocorr' -> calculate_autocorr(1, append=True)  (window-1 autocorrelation)
descriptor_plan = [
    ('gravy', ('global', 'moment')),          # GRAVY hydrophobicity
    ('z3', ('autocorr',)),                    # Z scale (Z3_* columns)
    ('z5', ('autocorr',)),                    # Z scale (Z5_* columns)
    ('AASI', ('global', 'moment')),           # AASI index
    ('ABHPRK', ('global',)),                  # ABHPRK feature
    ('argos', ('global', 'moment')),          # argos index
    ('bulkiness', ('global', 'moment')),      # bulkiness index
    ('charge_phys', ('global',)),             # charge_phys index
    ('charge_acid', ('global',)),             # charge_acid index
    ('Ez', ('global',)),                      # energies of insertion of side chains into lipid bilayers
    ('flexibility', ('global', 'moment')),    # flexibility scale
    ('grantham', ('global',)),                # side chain composition, polarity and molecular volume
    ('hopp-woods', ('global', 'moment')),     # Hopp-Woods hydrophobicity
    ('ISAECI', ('global',)),                  # Isotropic Surface Area (ISA) / Electronic Charge Index (ECI)
    ('janin', ('global', 'moment')),          # Janin hydrophobicity
    ('kytedoolittle', ('global', 'moment')),  # Kyte & Doolittle hydrophobicity
    ('levitt_alpha', ('global', 'moment')),   # Levitt alpha-helix propensity
    ('MSS', ('global', 'moment')),            # graph-theoretical index of side chain shape and size
    ('MSW', ('global',)),                     # PCA of the MS-WHIM descriptor, extended to natural amino acids
    ('pepArc', ('global',)),                  # modlabs pharmacophoric feature scale
    ('pepcats', ('global',)),                 # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', ('global', 'moment')),       # amino acid polarity
    ('PPCALI', ('global',)),                  # modlabs in-house scale from a PCA of 143 property scales
    ('refractivity', ('global', 'moment')),   # relative amino acid refractivity
    ('t_scale', ('global',)),                 # PCA-derived scale from 6 GRID probes
    ('TM_tend', ('global', 'moment')),        # transmembrane propensity
]

for scale_name, calc_steps in descriptor_plan:
    pepdesc_HemoPI1pv.load_scale(scale_name)
    for calc in calc_steps:
        if calc == 'autocorr':
            pepdesc_HemoPI1pv.calculate_autocorr(1, append=True)
        elif calc == 'global':
            pepdesc_HemoPI1pv.calculate_global(append=True)
        else:  # 'moment'
            pepdesc_HemoPI1pv.calculate_moment(append=True)

# CSV header, kept byte-for-byte as in the original so existing readers of the file keep working.
# NOTE(review): several names carry a leading space (", Z5_1") or a typo
# ("modlas_ABHPRK", "B_Builkiness", "uH-HoppWoods") — fix together with any downstream code.
# NOTE(review): the header names one column per 'global'/'moment' call and 3 / 5 columns
# for z3 / z5 — confirm this matches the actual width of the saved descriptor.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI1pv.save_descriptor('./Descriptors/pep_descriptors_HemoPI1pv.csv', header=col_names1)

In [35]:
pepdesc_HemoPI1nv.load_scale('eisenberg')
pepdesc_HemoPI1nv.calculate_global()  # calculate global Eisenberg hydrophobicity
pepdesc_HemoPI1nv.calculate_moment(append=True)
pepdesc_HemoPI1nv.load_scale('gravy')  # load GRAVY scale
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global GRAVY hydrophobicity
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate GRAVY hydrophobic moment
pepdesc_HemoPI1nv.load_scale('z3')  # load old Z scale
pepdesc_HemoPI1nv.calculate_autocorr(1, append=True)  # calculate global Z scale (=window1 autocorrelation)
pepdesc_HemoPI1nv.load_scale('z5')  # load old Z scale
pepdesc_HemoPI1nv.calculate_autocorr(1, append=True)  # calculate global Z scale (=window1 autocorrelation)
pepdesc_HemoPI1nv.load_scale('AASI')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global AASI index
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate AASI index moment
pepdesc_HemoPI1nv.load_scale('ABHPRK')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate ABHPRK feature 
pepdesc_HemoPI1nv.load_scale('argos')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global argos index
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate argos index moment
pepdesc_HemoPI1nv.load_scale('bulkiness')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global bulkiness index
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate bulkiness index moment
pepdesc_HemoPI1nv.load_scale('charge_phys')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global charge_phys index
pepdesc_HemoPI1nv.load_scale('charge_acid')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global charge_acid index
pepdesc_HemoPI1nv.load_scale('Ez')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global energies of insertion of amino acid side chains into lipid bilayers index
pepdesc_HemoPI1nv.load_scale('flexibility')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global flexibility scale
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate flexibility moment
pepdesc_HemoPI1nv.load_scale('grantham')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global amino acid side chain composition, polarity and molecular volume
pepdesc_HemoPI1nv.load_scale('hopp-woods')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global Hopp-Woods hydrophobicity scale
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate Hopp-Woods hydrophobicity moment
pepdesc_HemoPI1nv.load_scale('ISAECI')
pepdesc_HemoPI1nv.calculate_global(append=True) # calculate global ISAECI (Isotropic Surface Area (ISA) and Electronic Charge Index (ECI) of amino acid side chains) index
pepdesc_HemoPI1nv.load_scale('janin')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global Janin hydrophobicity scale
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate Janin hydrophobicity moment
pepdesc_HemoPI1nv.load_scale('kytedoolittle')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global Kyte & Doolittle hydrophobicity scale
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate Kyte & Doolittle hydrophobicity moment
pepdesc_HemoPI1nv.load_scale('levitt_alpha')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global Levitt alpha-helix propensity scale
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate Levitt alpha-helix propensity moment
pepdesc_HemoPI1nv.load_scale('MSS')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global MSS index, graph-theoretical index that reflects topological shape and size of amino acid side chains
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate MSS moment
pepdesc_HemoPI1nv.load_scale('MSW')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global MSW scale, Amino acid scale based on a PCA of the molecular surface based WHIM descriptor (MS-WHIM), extended to natural amino acids
pepdesc_HemoPI1nv.load_scale('pepArc')
pepdesc_HemoPI1nv.calculate_global(append=True) # calculate global pepArc, modlabs pharmacophoric feature scale, dimensions are: hydrophobicity, polarity, positive charge, negative charge, proline.
pepdesc_HemoPI1nv.load_scale('pepcats')
pepdesc_HemoPI1nv.calculate_global(append=True) # calculate global pepcats, modlabs pharmacophoric feature based PEPCATS scale
pepdesc_HemoPI1nv.load_scale('polarity')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global AA polarity 
pepdesc_HemoPI1nv.calculate_moment(append=True)  # calculate AA polarity moment
pepdesc_HemoPI1nv.load_scale('PPCALI')
pepdesc_HemoPI1nv.calculate_global(append=True)  # calculate global modlabs inhouse scale derived from a PCA of 143 amino acid property scales
pepdesc_HemoPI1nv.load_scale('refractivity')
pepdesc_HemoPI1nv.calculate_global(append=True) # calculate global relative AA refractivity
pepdesc_HemoPI1nv.calculate_moment(append=True) # calculate relative AA refractivity moment
pepdesc_HemoPI1nv.load_scale('t_scale')
pepdesc_HemoPI1nv.calculate_global(append=True) # calculate global t scale, A PCA derived scale based on amino acid side chain properties calculated with 6 different probes of the GRID program
pepdesc_HemoPI1nv.load_scale('TM_tend')
pepdesc_HemoPI1nv.calculate_global(append=True) # calculate global Amino acid transmembrane propensity scale
pepdesc_HemoPI1nv.calculate_moment(append=True) # calculate Amino acid transmembrane propensity scale moment


col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI1nv.save_descriptor('./Descriptors/pep_descriptors_HemoPI1nv.csv', header=col_names1)

HemoPI-2 dataset

In [36]:
# Build the descriptor matrix held by pepdesc_HemoPI2pm (HemoPI-2 section) one
# amino-acid scale at a time, then export it to CSV. The order of the calls
# below fixes the column order, which has to line up with col_names1.

# Eisenberg hydrophobicity comes first: this is the only calculate_global()
# call issued without append=True; every later step is appended to its result.
pepdesc_HemoPI2pm.load_scale('eisenberg')
pepdesc_HemoPI2pm.calculate_global()
pepdesc_HemoPI2pm.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Each letter is one call:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z scale; header reserves Z3_1..Z3_3 for it
    ('z5', 'A'),              # Z scale; header reserves Z5_1..Z5_5 for it
    ('AASI', 'GM'),           # AASI index and its moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and its moment
    ('bulkiness', 'GM'),      # bulkiness index and its moment
    ('charge_phys', 'G'),     # charge_phys index
    ('charge_acid', 'G'),     # charge_acid index
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),    # flexibility scale and its moment
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and its moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index of side chains
    ('janin', 'GM'),          # Janin hydrophobicity and its moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and its moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and its moment
    ('MSS', 'GM'),            # graph-theoretical shape/size index of side chains, and its moment
    ('MSW', 'G'),             # PCA of the molecular surface based WHIM descriptor (MS-WHIM)
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', 'GM'),       # AA polarity and its moment
    ('PPCALI', 'G'),          # modlabs scale derived from a PCA of 143 AA property scales
    ('refractivity', 'GM'),   # relative AA refractivity and its moment
    ('t_scale', 'G'),         # PCA-derived scale from 6 GRID probes
    ('TM_tend', 'GM'),        # transmembrane propensity and its moment
]

for _scale, _steps in _scale_plan:
    pepdesc_HemoPI2pm.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI2pm.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI2pm.calculate_moment(append=True)
        else:
            pepdesc_HemoPI2pm.calculate_autocorr(1, append=True)

# Header handed to save_descriptor: ID and Sequence followed by one name per
# descriptor column, in the order the calls above were made. The irregular
# spacing is kept as-is because it defines the column names in the CSV.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI2pm.save_descriptor('./Descriptors/pep_descriptors_HemoPI2pm.csv', header=col_names1)

In [37]:
# Build the descriptor matrix held by pepdesc_HemoPI2nm (HemoPI-2 section) one
# amino-acid scale at a time, then export it to CSV. The order of the calls
# below fixes the column order, which has to line up with col_names1.

# Eisenberg hydrophobicity comes first: this is the only calculate_global()
# call issued without append=True; every later step is appended to its result.
pepdesc_HemoPI2nm.load_scale('eisenberg')
pepdesc_HemoPI2nm.calculate_global()
pepdesc_HemoPI2nm.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Each letter is one call:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z scale; header reserves Z3_1..Z3_3 for it
    ('z5', 'A'),              # Z scale; header reserves Z5_1..Z5_5 for it
    ('AASI', 'GM'),           # AASI index and its moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and its moment
    ('bulkiness', 'GM'),      # bulkiness index and its moment
    ('charge_phys', 'G'),     # charge_phys index
    ('charge_acid', 'G'),     # charge_acid index
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),    # flexibility scale and its moment
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and its moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index of side chains
    ('janin', 'GM'),          # Janin hydrophobicity and its moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and its moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and its moment
    ('MSS', 'GM'),            # graph-theoretical shape/size index of side chains, and its moment
    ('MSW', 'G'),             # PCA of the molecular surface based WHIM descriptor (MS-WHIM)
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', 'GM'),       # AA polarity and its moment
    ('PPCALI', 'G'),          # modlabs scale derived from a PCA of 143 AA property scales
    ('refractivity', 'GM'),   # relative AA refractivity and its moment
    ('t_scale', 'G'),         # PCA-derived scale from 6 GRID probes
    ('TM_tend', 'GM'),        # transmembrane propensity and its moment
]

for _scale, _steps in _scale_plan:
    pepdesc_HemoPI2nm.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI2nm.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI2nm.calculate_moment(append=True)
        else:
            pepdesc_HemoPI2nm.calculate_autocorr(1, append=True)

# Header handed to save_descriptor: ID and Sequence followed by one name per
# descriptor column, in the order the calls above were made. The irregular
# spacing is kept as-is because it defines the column names in the CSV.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI2nm.save_descriptor('./Descriptors/pep_descriptors_HemoPI2nm.csv', header=col_names1)

In [38]:
# Build the descriptor matrix held by pepdesc_HemoPI2pv (HemoPI-2 section) one
# amino-acid scale at a time, then export it to CSV. The order of the calls
# below fixes the column order, which has to line up with col_names1.

# Eisenberg hydrophobicity comes first: this is the only calculate_global()
# call issued without append=True; every later step is appended to its result.
pepdesc_HemoPI2pv.load_scale('eisenberg')
pepdesc_HemoPI2pv.calculate_global()
pepdesc_HemoPI2pv.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Each letter is one call:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z scale; header reserves Z3_1..Z3_3 for it
    ('z5', 'A'),              # Z scale; header reserves Z5_1..Z5_5 for it
    ('AASI', 'GM'),           # AASI index and its moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and its moment
    ('bulkiness', 'GM'),      # bulkiness index and its moment
    ('charge_phys', 'G'),     # charge_phys index
    ('charge_acid', 'G'),     # charge_acid index
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),    # flexibility scale and its moment
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and its moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index of side chains
    ('janin', 'GM'),          # Janin hydrophobicity and its moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and its moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and its moment
    ('MSS', 'GM'),            # graph-theoretical shape/size index of side chains, and its moment
    ('MSW', 'G'),             # PCA of the molecular surface based WHIM descriptor (MS-WHIM)
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', 'GM'),       # AA polarity and its moment
    ('PPCALI', 'G'),          # modlabs scale derived from a PCA of 143 AA property scales
    ('refractivity', 'GM'),   # relative AA refractivity and its moment
    ('t_scale', 'G'),         # PCA-derived scale from 6 GRID probes
    ('TM_tend', 'GM'),        # transmembrane propensity and its moment
]

for _scale, _steps in _scale_plan:
    pepdesc_HemoPI2pv.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI2pv.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI2pv.calculate_moment(append=True)
        else:
            pepdesc_HemoPI2pv.calculate_autocorr(1, append=True)

# Header handed to save_descriptor: ID and Sequence followed by one name per
# descriptor column, in the order the calls above were made. The irregular
# spacing is kept as-is because it defines the column names in the CSV.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI2pv.save_descriptor('./Descriptors/pep_descriptors_HemoPI2pv.csv', header=col_names1)

In [39]:
# Build the descriptor matrix held by pepdesc_HemoPI2nv (HemoPI-2 section) one
# amino-acid scale at a time, then export it to CSV. The order of the calls
# below fixes the column order, which has to line up with col_names1.

# Eisenberg hydrophobicity comes first: this is the only calculate_global()
# call issued without append=True; every later step is appended to its result.
pepdesc_HemoPI2nv.load_scale('eisenberg')
pepdesc_HemoPI2nv.calculate_global()
pepdesc_HemoPI2nv.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Each letter is one call:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z scale; header reserves Z3_1..Z3_3 for it
    ('z5', 'A'),              # Z scale; header reserves Z5_1..Z5_5 for it
    ('AASI', 'GM'),           # AASI index and its moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and its moment
    ('bulkiness', 'GM'),      # bulkiness index and its moment
    ('charge_phys', 'G'),     # charge_phys index
    ('charge_acid', 'G'),     # charge_acid index
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),    # flexibility scale and its moment
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and its moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index of side chains
    ('janin', 'GM'),          # Janin hydrophobicity and its moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and its moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and its moment
    ('MSS', 'GM'),            # graph-theoretical shape/size index of side chains, and its moment
    ('MSW', 'G'),             # PCA of the molecular surface based WHIM descriptor (MS-WHIM)
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', 'GM'),       # AA polarity and its moment
    ('PPCALI', 'G'),          # modlabs scale derived from a PCA of 143 AA property scales
    ('refractivity', 'GM'),   # relative AA refractivity and its moment
    ('t_scale', 'G'),         # PCA-derived scale from 6 GRID probes
    ('TM_tend', 'GM'),        # transmembrane propensity and its moment
]

for _scale, _steps in _scale_plan:
    pepdesc_HemoPI2nv.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI2nv.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI2nv.calculate_moment(append=True)
        else:
            pepdesc_HemoPI2nv.calculate_autocorr(1, append=True)

# Header handed to save_descriptor: ID and Sequence followed by one name per
# descriptor column, in the order the calls above were made. The irregular
# spacing is kept as-is because it defines the column names in the CSV.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI2nv.save_descriptor('./Descriptors/pep_descriptors_HemoPI2nv.csv', header=col_names1)

HemoPI-3 dataset

In [40]:
# Build the descriptor matrix held by pepdesc_HemoPI3pm (HemoPI-3 section) one
# amino-acid scale at a time, then export it to CSV. The order of the calls
# below fixes the column order, which has to line up with col_names1.

# Eisenberg hydrophobicity comes first: this is the only calculate_global()
# call issued without append=True; every later step is appended to its result.
pepdesc_HemoPI3pm.load_scale('eisenberg')
pepdesc_HemoPI3pm.calculate_global()
pepdesc_HemoPI3pm.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Each letter is one call:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z scale; header reserves Z3_1..Z3_3 for it
    ('z5', 'A'),              # Z scale; header reserves Z5_1..Z5_5 for it
    ('AASI', 'GM'),           # AASI index and its moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and its moment
    ('bulkiness', 'GM'),      # bulkiness index and its moment
    ('charge_phys', 'G'),     # charge_phys index
    ('charge_acid', 'G'),     # charge_acid index
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),    # flexibility scale and its moment
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and its moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index of side chains
    ('janin', 'GM'),          # Janin hydrophobicity and its moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and its moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and its moment
    ('MSS', 'GM'),            # graph-theoretical shape/size index of side chains, and its moment
    ('MSW', 'G'),             # PCA of the molecular surface based WHIM descriptor (MS-WHIM)
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs pharmacophoric feature based PEPCATS scale
    ('polarity', 'GM'),       # AA polarity and its moment
    ('PPCALI', 'G'),          # modlabs scale derived from a PCA of 143 AA property scales
    ('refractivity', 'GM'),   # relative AA refractivity and its moment
    ('t_scale', 'G'),         # PCA-derived scale from 6 GRID probes
    ('TM_tend', 'GM'),        # transmembrane propensity and its moment
]

for _scale, _steps in _scale_plan:
    pepdesc_HemoPI3pm.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI3pm.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI3pm.calculate_moment(append=True)
        else:
            pepdesc_HemoPI3pm.calculate_autocorr(1, append=True)

# Header handed to save_descriptor: ID and Sequence followed by one name per
# descriptor column, in the order the calls above were made. The irregular
# spacing is kept as-is because it defines the column names in the CSV.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI3pm.save_descriptor('./Descriptors/pep_descriptors_HemoPI3pm.csv', header=col_names1)

In [41]:
# Peptide-scale descriptors for the HemoPI-3 class-0 model peptides (nm).
# The Eisenberg scale goes first: its global value is computed without
# append=True (unlike every later step), followed by the Eisenberg moment.
pepdesc_HemoPI3nm.load_scale('eisenberg')
pepdesc_HemoPI3nm.calculate_global()
pepdesc_HemoPI3nm.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Step codes:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z3 scale
    ('z5', 'A'),              # Z5 scale
    ('AASI', 'GM'),           # AASI index and moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and moment
    ('bulkiness', 'GM'),      # bulkiness index and moment
    ('charge_phys', 'G'),
    ('charge_acid', 'G'),
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index
    ('janin', 'GM'),          # Janin hydrophobicity and moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and moment
    ('MSS', 'GM'),            # graph-theoretical side chain shape/size index and moment
    ('MSW', 'G'),             # PCA of the MS-WHIM descriptor
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs PEPCATS scale
    ('polarity', 'GM'),       # amino acid polarity and moment
    ('PPCALI', 'G'),          # modlabs PCA of 143 amino acid property scales
    ('refractivity', 'GM'),   # relative refractivity and moment
    ('t_scale', 'G'),         # PCA scale from GRID side chain properties
    ('TM_tend', 'GM'),        # transmembrane propensity and moment
]
for _scale, _steps in _scale_plan:
    pepdesc_HemoPI3nm.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI3nm.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI3nm.calculate_moment(append=True)
        else:
            pepdesc_HemoPI3nm.calculate_autocorr(1, append=True)

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI3nm.save_descriptor('./Descriptors/pep_descriptors_HemoPI3nm.csv', header=col_names1)

In [42]:
# Peptide-scale descriptors for the HemoPI-3 class-1 validation peptides (pv).
# The Eisenberg scale goes first: its global value is computed without
# append=True (unlike every later step), followed by the Eisenberg moment.
pepdesc_HemoPI3pv.load_scale('eisenberg')
pepdesc_HemoPI3pv.calculate_global()
pepdesc_HemoPI3pv.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Step codes:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z3 scale
    ('z5', 'A'),              # Z5 scale
    ('AASI', 'GM'),           # AASI index and moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and moment
    ('bulkiness', 'GM'),      # bulkiness index and moment
    ('charge_phys', 'G'),
    ('charge_acid', 'G'),
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index
    ('janin', 'GM'),          # Janin hydrophobicity and moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and moment
    ('MSS', 'GM'),            # graph-theoretical side chain shape/size index and moment
    ('MSW', 'G'),             # PCA of the MS-WHIM descriptor
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs PEPCATS scale
    ('polarity', 'GM'),       # amino acid polarity and moment
    ('PPCALI', 'G'),          # modlabs PCA of 143 amino acid property scales
    ('refractivity', 'GM'),   # relative refractivity and moment
    ('t_scale', 'G'),         # PCA scale from GRID side chain properties
    ('TM_tend', 'GM'),        # transmembrane propensity and moment
]
for _scale, _steps in _scale_plan:
    pepdesc_HemoPI3pv.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI3pv.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI3pv.calculate_moment(append=True)
        else:
            pepdesc_HemoPI3pv.calculate_autocorr(1, append=True)

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI3pv.save_descriptor('./Descriptors/pep_descriptors_HemoPI3pv.csv', header=col_names1)

In [43]:
# Peptide-scale descriptors for the HemoPI-3 class-0 validation peptides (nv).
# The Eisenberg scale goes first: its global value is computed without
# append=True (unlike every later step), followed by the Eisenberg moment.
pepdesc_HemoPI3nv.load_scale('eisenberg')
pepdesc_HemoPI3nv.calculate_global()
pepdesc_HemoPI3nv.calculate_moment(append=True)

# Remaining scales, listed in output-column order. Step codes:
#   'G' -> calculate_global(append=True)
#   'M' -> calculate_moment(append=True)
#   'A' -> calculate_autocorr(1, append=True)   (window-1 autocorrelation)
_scale_plan = [
    ('gravy', 'GM'),          # GRAVY hydrophobicity and hydrophobic moment
    ('z3', 'A'),              # Z3 scale
    ('z5', 'A'),              # Z5 scale
    ('AASI', 'GM'),           # AASI index and moment
    ('ABHPRK', 'G'),          # ABHPRK feature
    ('argos', 'GM'),          # argos index and moment
    ('bulkiness', 'GM'),      # bulkiness index and moment
    ('charge_phys', 'G'),
    ('charge_acid', 'G'),
    ('Ez', 'G'),              # energies of insertion of side chains into lipid bilayers
    ('flexibility', 'GM'),
    ('grantham', 'G'),        # side chain composition, polarity and molecular volume
    ('hopp-woods', 'GM'),     # Hopp-Woods hydrophobicity and moment
    ('ISAECI', 'G'),          # Isotropic Surface Area / Electronic Charge Index
    ('janin', 'GM'),          # Janin hydrophobicity and moment
    ('kytedoolittle', 'GM'),  # Kyte & Doolittle hydrophobicity and moment
    ('levitt_alpha', 'GM'),   # Levitt alpha-helix propensity and moment
    ('MSS', 'GM'),            # graph-theoretical side chain shape/size index and moment
    ('MSW', 'G'),             # PCA of the MS-WHIM descriptor
    ('pepArc', 'G'),          # modlabs pharmacophoric feature scale
    ('pepcats', 'G'),         # modlabs PEPCATS scale
    ('polarity', 'GM'),       # amino acid polarity and moment
    ('PPCALI', 'G'),          # modlabs PCA of 143 amino acid property scales
    ('refractivity', 'GM'),   # relative refractivity and moment
    ('t_scale', 'G'),         # PCA scale from GRID side chain properties
    ('TM_tend', 'GM'),        # transmembrane propensity and moment
]
for _scale, _steps in _scale_plan:
    pepdesc_HemoPI3nv.load_scale(_scale)
    for _step in _steps:
        if _step == 'G':
            pepdesc_HemoPI3nv.calculate_global(append=True)
        elif _step == 'M':
            pepdesc_HemoPI3nv.calculate_moment(append=True)
        else:
            pepdesc_HemoPI3nv.calculate_autocorr(1, append=True)

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names1 = 'ID,Sequence,H_Eisenberg,uH_Eisenberg,H_GRAVY,uH_GRAVY,Z3_1,Z3_2,Z3_3, Z5_1,Z5_2,Z5_3, Z5_4,Z5_5,S_AASI, uS_AASI, modlas_ABHPRK, H_argos, uH_argos, B_Builkiness, uB_Builkiness, charge_phys, charge_acid, Ez, flexibility, u_flexibility, Grantham, H_HoppWoods, uH-HoppWoods, ISAECI, H_Janin, uH_Janin, H_KyteDoolittle, uH_KyteDoolittle, F_Levitt, uF_Levitt, MSS_shape, u_MSS_shape, MSW, pepArc, pepcats, polarity, u_polarity, PPCALI, refractivity, u_refractivity, t_scale, TM_tend, u_TM_tend'
pepdesc_HemoPI3nv.save_descriptor('./Descriptors/pep_descriptors_HemoPI3nv.csv', header=col_names1)

#### Global Descriptors

Peptides from APD database

In [80]:
# Global descriptors for the APD peptides.
# length() is called without append=True, unlike every later step.
globdesc_totalAPD.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': False}), # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_totalAPD, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge here uses amide=False, whereas the Hemolytik cells use amide=True — confirm the difference is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_totalAPD.save_descriptor('./Descriptors/global_descriptors_totalAPD.csv', header=col_names2)

Peptides from the Hemolytik database. Variable suffixes: class 1, model set (pm); class 0, model set (nm); class 1, validation set (pv); class 0, validation set (nv).

HemoPI-1 dataset

In [44]:
# Global descriptors for the HemoPI-1 class-1 model peptides (pm).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI1pm.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI1pm, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI1pm.save_descriptor('./Descriptors/global_descriptors_HemoPI1pm.csv', header=col_names2)

In [45]:
# Global descriptors for the HemoPI-1 class-0 model peptides (nm).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI1nm.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI1nm, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI1nm.save_descriptor('./Descriptors/global_descriptors_HemoPI1nm.csv', header=col_names2)

In [46]:
# Global descriptors for the HemoPI-1 class-1 validation peptides (pv).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI1pv.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI1pv, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI1pv.save_descriptor('./Descriptors/global_descriptors_HemoPI1pv.csv', header=col_names2)

In [47]:
# Global descriptors for the HemoPI-1 class-0 validation peptides (nv).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI1nv.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI1nv, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI1nv.save_descriptor('./Descriptors/global_descriptors_HemoPI1nv.csv', header=col_names2)

HemoPI-2 dataset

In [48]:
# Global descriptors for the HemoPI-2 class-1 model peptides (pm).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI2pm.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI2pm, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI2pm.save_descriptor('./Descriptors/global_descriptors_HemoPI2pm.csv', header=col_names2)

In [49]:
# Global descriptors for the HemoPI-2 class-0 model peptides (nm).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI2nm.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI2nm, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI2nm.save_descriptor('./Descriptors/global_descriptors_HemoPI2nm.csv', header=col_names2)

In [50]:
# Global descriptors for the HemoPI-2 class-1 validation peptides (pv).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI2pv.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI2pv, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI2pv.save_descriptor('./Descriptors/global_descriptors_HemoPI2pv.csv', header=col_names2)

In [51]:
# Global descriptors for the HemoPI-2 class-0 validation peptides (nv).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI2nv.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI2nv, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI2nv.save_descriptor('./Descriptors/global_descriptors_HemoPI2nv.csv', header=col_names2)

HemoPI-3 dataset

In [52]:
# Global descriptors for the HemoPI-3 class-1 model peptides (pm).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI3pm.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI3pm, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI3pm.save_descriptor('./Descriptors/global_descriptors_HemoPI3pm.csv', header=col_names2)

In [53]:
# Global descriptors for the HemoPI-3 class-0 model peptides (nm).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI3nm.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI3nm, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI3nm.save_descriptor('./Descriptors/global_descriptors_HemoPI3nm.csv', header=col_names2)

In [54]:
# Global descriptors for the HemoPI-3 class-1 validation peptides (pv).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI3pv.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI3pv, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI3pv.save_descriptor('./Descriptors/global_descriptors_HemoPI3pv.csv', header=col_names2)

In [55]:
# Global descriptors for the HemoPI-3 class-0 validation peptides (nv).
# length() is called without append=True, unlike every later step.
globdesc_HemoPI3nv.length()

# Remaining descriptors as (method name, extra keyword arguments), in
# output-column order; each one is called with append=True.
_global_steps = [
    ('boman_index', {}),                               # Boman index
    ('aromaticity', {}),                               # global aromaticity
    ('aliphatic_index', {}),                           # aliphatic index
    ('instability_index', {}),                         # instability index
    ('calculate_charge', {'ph': 7.4, 'amide': True}),  # net charge
    ('calculate_MW', {'amide': False}),                # molecular weight
    ('isoelectric_point', {'amide': False}),           # isoelectric point
    ('hydrophobic_ratio', {}),
]
for _method, _extra in _global_steps:
    getattr(globdesc_HemoPI3nv, _method)(append=True, **_extra)
# charge_density(ph=7.4, amide=False) is deliberately not computed: the author marked it "does not work".
# NOTE(review): net charge uses amide=True while MW and isoelectric point use amide=False — confirm the mix is intended.

# Header row for the CSV: ID, Sequence, then one name per descriptor column above.
col_names2 = 'ID, Sequence,Length,BomanIndex,Aromaticity,AliphaticIndex,InstabilityIndex, NetCharge, MW, IsoelectricPoint, HydrophobicRatio'
globdesc_HemoPI3nv.save_descriptor('./Descriptors/global_descriptors_HemoPI3nv.csv', header=col_names2)

#### Merge datasets

APD dataset

In [None]:
# Read the peptide-level and global descriptor tables for the APD set
# (first CSV column becomes the index), then join them on that index.
pepdesc_totalAPD, globdesc_totalAPD = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_totalAPD.csv',
                     './Descriptors/global_descriptors_totalAPD.csv')
)
totalAPD = pepdesc_totalAPD.join(globdesc_totalAPD, how='left')
print(totalAPD.shape)

In [None]:
# Persist the merged APD descriptor table, index column included.
totalAPD.to_csv(path_or_buf='./Descriptors/totalAPD_descriptors.csv', index=True)

HemoPI-1 dataset

In [92]:
# Read both descriptor tables for HemoPI1pm (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI1pm, globdesc_HemoPI1pm = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI1pm.csv',
                     './Descriptors/global_descriptors_HemoPI1pm.csv')
)
HemoPI1pm = pepdesc_HemoPI1pm.join(globdesc_HemoPI1pm, how='left')

In [93]:
# Read both descriptor tables for HemoPI1nm (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI1nm, globdesc_HemoPI1nm = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI1nm.csv',
                     './Descriptors/global_descriptors_HemoPI1nm.csv')
)
HemoPI1nm = pepdesc_HemoPI1nm.join(globdesc_HemoPI1nm, how='left')

In [94]:
# Read both descriptor tables for HemoPI1pv (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI1pv, globdesc_HemoPI1pv = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI1pv.csv',
                     './Descriptors/global_descriptors_HemoPI1pv.csv')
)
HemoPI1pv = pepdesc_HemoPI1pv.join(globdesc_HemoPI1pv, how='left')

In [95]:
# Read both descriptor tables for HemoPI1nv (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI1nv, globdesc_HemoPI1nv = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI1nv.csv',
                     './Descriptors/global_descriptors_HemoPI1nv.csv')
)
HemoPI1nv = pepdesc_HemoPI1nv.join(globdesc_HemoPI1nv, how='left')

In [96]:
# Sanity check: show the shape of each merged HemoPI-1 table
# (class-1 model, class-0 model, class-1 validation, class-0 validation).
print(HemoPI1pm.shape, HemoPI1nm.shape, HemoPI1pv.shape, HemoPI1nv.shape)

((442, 58), (442, 58), (110, 58), (110, 58))


Add class labels (1 and 0) to the model and validation sets of the HemoPI-1 dataset

In [128]:
# Model set for HemoPI-1 (884 peptides): class-1 rows stacked on top of class-0 rows.
HemoPI1_model = pd.concat([HemoPI1pm, HemoPI1nm], axis=0)
# Build the label column from the actual frame lengths rather than hard-coded
# counts (442/442), so the labels stay aligned with the rows if the inputs change.
HemoPI1_model['y_model_2cl'] = [1]*len(HemoPI1pm) + [0]*len(HemoPI1nm)

In [129]:
# Validation set for HemoPI-1 (220 peptides): class-1 rows stacked on top of class-0 rows.
HemoPI1_validation = pd.concat([HemoPI1pv, HemoPI1nv], axis=0)
# Build the label column from the actual frame lengths rather than hard-coded
# counts (110/110), so the labels stay aligned with the rows if the inputs change.
HemoPI1_validation['y_validation_2cl'] = [1]*len(HemoPI1pv) + [0]*len(HemoPI1nv)

Save HemoPI-1 datasets and 56 modlamp properties to csv files

In [131]:
# Persist the labelled HemoPI-1 model and validation tables, index column included.
HemoPI1_model.to_csv(path_or_buf='./Descriptors/HemoPI1_model.csv', index=True)
HemoPI1_validation.to_csv(path_or_buf='./Descriptors/HemoPI1_validation.csv', index=True)

HemoPI-2 dataset

In [66]:
# Read both descriptor tables for HemoPI2pm (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI2pm, globdesc_HemoPI2pm = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI2pm.csv',
                     './Descriptors/global_descriptors_HemoPI2pm.csv')
)
HemoPI2pm = pepdesc_HemoPI2pm.join(globdesc_HemoPI2pm, how='left')

In [67]:
# Read both descriptor tables for HemoPI2nm (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI2nm, globdesc_HemoPI2nm = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI2nm.csv',
                     './Descriptors/global_descriptors_HemoPI2nm.csv')
)
HemoPI2nm = pepdesc_HemoPI2nm.join(globdesc_HemoPI2nm, how='left')

In [68]:
# Read both descriptor tables for HemoPI2pv (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI2pv, globdesc_HemoPI2pv = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI2pv.csv',
                     './Descriptors/global_descriptors_HemoPI2pv.csv')
)
HemoPI2pv = pepdesc_HemoPI2pv.join(globdesc_HemoPI2pv, how='left')

In [71]:
# Read both descriptor tables for HemoPI2nv (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI2nv, globdesc_HemoPI2nv = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI2nv.csv',
                     './Descriptors/global_descriptors_HemoPI2nv.csv')
)
HemoPI2nv = pepdesc_HemoPI2nv.join(globdesc_HemoPI2nv, how='left')

In [72]:
# Sanity check: show the shape of each merged HemoPI-2 table
# (class-1 model, class-0 model, class-1 validation, class-0 validation).
print(HemoPI2pm.shape, HemoPI2nm.shape, HemoPI2pv.shape, HemoPI2nv.shape)

((442, 58), (370, 58), (110, 58), (92, 58))


Add class labels (1 and 0) to the model and validation sets of the HemoPI-2 dataset

In [134]:
# Model set for HemoPI-2: class-1 rows stacked on top of class-0 rows.
HemoPI2_model = pd.concat([HemoPI2pm, HemoPI2nm], axis=0)
# Build the label column from the actual frame lengths rather than hard-coded
# counts (442/370), so the labels stay aligned with the rows if the inputs change.
HemoPI2_model['y_model_2cl'] = [1]*len(HemoPI2pm) + [0]*len(HemoPI2nm)

In [135]:
# Validation set for HemoPI-2: class-1 rows stacked on top of class-0 rows.
HemoPI2_validation = pd.concat([HemoPI2pv, HemoPI2nv], axis=0)
# Build the label column from the actual frame lengths rather than hard-coded
# counts (110/92), so the labels stay aligned with the rows if the inputs change.
HemoPI2_validation['y_validation_2cl'] = [1]*len(HemoPI2pv) + [0]*len(HemoPI2nv)

Save HemoPI-2 datasets and 56 modlamp properties to csv files

In [137]:
# Persist the labelled HemoPI-2 model and validation tables, index column included.
HemoPI2_model.to_csv(path_or_buf='./Descriptors/HemoPI2_model.csv', index=True)
HemoPI2_validation.to_csv(path_or_buf='./Descriptors/HemoPI2_validation.csv', index=True)

HemoPI-3 dataset

In [74]:
# Read both descriptor tables for HemoPI3pm (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI3pm, globdesc_HemoPI3pm = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI3pm.csv',
                     './Descriptors/global_descriptors_HemoPI3pm.csv')
)
HemoPI3pm = pepdesc_HemoPI3pm.join(globdesc_HemoPI3pm, how='left')

In [79]:
# Read both descriptor tables for HemoPI3nm (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI3nm, globdesc_HemoPI3nm = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI3nm.csv',
                     './Descriptors/global_descriptors_HemoPI3nm.csv')
)
HemoPI3nm = pepdesc_HemoPI3nm.join(globdesc_HemoPI3nm, how='left')

In [76]:
# Read both descriptor tables for HemoPI3pv (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI3pv, globdesc_HemoPI3pv = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI3pv.csv',
                     './Descriptors/global_descriptors_HemoPI3pv.csv')
)
HemoPI3pv = pepdesc_HemoPI3pv.join(globdesc_HemoPI3pv, how='left')

In [77]:
# Read both descriptor tables for HemoPI3nv (first CSV column becomes the index)
# and join them on that index.
pepdesc_HemoPI3nv, globdesc_HemoPI3nv = (
    pd.read_csv(csv_path, index_col=0)
    for csv_path in ('./Descriptors/pep_descriptors_HemoPI3nv.csv',
                     './Descriptors/global_descriptors_HemoPI3nv.csv')
)
HemoPI3nv = pepdesc_HemoPI3nv.join(globdesc_HemoPI3nv, how='left')

In [80]:
# Sanity check: show the shape of each merged HemoPI-3 table
# (class-1 model, class-0 model, class-1 validation, class-0 validation).
print(HemoPI3pm.shape, HemoPI3nm.shape, HemoPI3pv.shape, HemoPI3nv.shape)

((708, 58), (590, 58), (177, 58), (148, 58))


Add class labels (1 and 0) to the model and validation sets of the HemoPI-3 dataset

In [139]:
# Model set for HemoPI-3 (1298 peptides): class-1 rows stacked on top of class-0 rows.
HemoPI3_model = pd.concat([HemoPI3pm, HemoPI3nm], axis=0)
# Build the label column from the actual frame lengths rather than hard-coded
# counts (708/590), so the labels stay aligned with the rows if the inputs change.
HemoPI3_model['y_model_2cl'] = [1]*len(HemoPI3pm) + [0]*len(HemoPI3nm)

In [145]:
# Validation set for HemoPI-3 (325 peptides): class-1 rows stacked on top of class-0 rows.
HemoPI3_validation = pd.concat([HemoPI3pv, HemoPI3nv], axis=0)
# Build the label column from the actual frame lengths rather than hard-coded
# counts (177/148), so the labels stay aligned with the rows if the inputs change.
HemoPI3_validation['y_validation_2cl'] = [1]*len(HemoPI3pv) + [0]*len(HemoPI3nv)

Save HemoPI-3 datasets and 56 modlamp properties to csv files

In [141]:
# Persist the labelled HemoPI-3 model and validation tables, index column included.
HemoPI3_model.to_csv(path_or_buf='./Descriptors/HemoPI3_model.csv', index=True)
HemoPI3_validation.to_csv(path_or_buf='./Descriptors/HemoPI3_validation.csv', index=True)