### Usage tutorial

In [3]:
# print the command-line help of NERVE: every available option with its description and default
!/NERVE/code/NERVE.py -h

usage: NERVE.py [-h] [-a ] [-ev ] -g  [-ml ] [-mm ] [-m ] [-mpsl ] -p1
                 [-p2 ] [-paefilter ] [-pacfilter ] [-pl ] [-rz ]
                [-rl ] [-s ] [-ss ] [-tdl ] [-vl ] [-vir ] [-wd ]
                [-nd ] [-id ] [-dfd ]

Run vaccine candidate prediction

optional arguments:
  -h, --help            show this help message and exit
  -a , --annotation   Activation (True) or deactivation (False) of
                        annotation module. Uses DeepFri to retrieve protein
                        functional onthologies (default: True)
  -ev , --e_value     Expect-value used in blastp for immunity modules
                        (default: 1e-10)
  -g , --gram         Negative (n) or positive (p) gram stain of the
                        pathogen of interest (default: None)
  -ml , --minlength   Minimal length required for shared peptides to be
                        extracted in comparison analyses versus human and/or
  

In [1]:
# run on Vibrio parahaemolyticus (uniprot proteome id: UP000002493, passed with -p1);
# the result tables further down list the corresponding *_VIBPA entries
# UP000032406 is passed as the second proteome (-p2) - presumably the one used for the conservation analysis, TODO confirm
# output files end up in ./UP000002493 (-wd), as listed in the next cell
# note that it is essential to specify the gram type (-g option): n = negative, p = positive
!/NERVE/code/NERVE.py -p1 UP000002493 -p2 UP000032406 -wd ./UP000002493 -g n

Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [2]:
# explore the results: list the files present in the working directory of the run above
import os
os.listdir("./UP000002493/")

['proteome1.fasta',
 'cleaned_proteome1.fasta',
 'proteome2.fasta',
 'logfile.log',
 'cleaned_proteome2.fasta',
 'vaccine_candidates.csv',
 'conservation_raw_output.txt',
 'discarded_sequences_proteome1.fasta',
 'discarded_sequences_proteome2.fasta',
 'discarded_proteins.csv']

In [3]:
# vaccine_candidates.csv contains vaccine candidates extracted from the input proteome with the select module
# while discarded_proteins.csv contains excluded proteins
# load the candidates into a DataFrame; the bare name on the last line makes the notebook display it
# NOTE(review): the "Unnamed: 0" column in the output looks like a row index saved into the CSV;
# reading with index_col=0 would likely avoid it - confirm against the file
import pandas as pd
vaccine_candidates=pd.read_csv("./UP000002493/vaccine_candidates.csv")
vaccine_candidates

Unnamed: 0,id,uniprot_accession_code,score,length,transmembrane_doms,localization,localization score,virulence_probability,adhesin_probability,conservation_score,...,shared_mouse_peps,shared_conserv_proteome_peps,human_peptides_sum,mouse_peptides_sum,annotations,list_of_peptides_from_comparison_with_mhcpep_sapiens,list_of_peptides_from_comparison_with_mhcpep_mouse,sequence,original_sequence_if_razor,tmhmm_seq
0,tr|Q87GL4|Q87GL4_VIBPA Pentapeptide repeat-con...,Q87GL4,0.9813,682,0,Extracellular,9.65,0.9445,0.9592,0.0000,...,0,0,0.0000,0.0000,,,,MKSIASYQIKFKVLFTLTCSCIFATACNSDNTSTEIQSKLLVEKDF...,,
1,tr|Q87HS4|Q87HS4_VIBPA Heme transport protein ...,Q87HS4,0.9799,693,0,OuterMembrane,10.00,0.9315,0.9282,1.0649,...,0,698,0.0000,0.0000,,,,MYNKSILSASILIALSQGAYAEDHSTFNEVVVTATRTNSQIEDTAA...,,
2,tr|Q87IP5|Q87IP5_VIBPA Alginate_exp domain-con...,Q87IP5,0.9789,405,0,OuterMembrane,9.49,0.9344,0.9686,1.0000,...,0,397,0.0000,0.0000,,,,MHSGLHIRFSPPWMVVVSQALSLSLLGFFSFCAVANIPGLQPQKSW...,,
3,tr|Q87JI6|Q87JI6_VIBPA Flagellar hook protein ...,Q87JI6,0.9743,398,0,Extracellular,10.00,0.8660,0.9540,0.3869,...,0,42,0.0000,0.0000,,,,MSFNIALSGLDATNTELNTISHNIANASTYGFKGARTEFAAVYNGM...,,
4,tr|Q87GE5|Q87GE5_VIBPA Type III effector HopI1...,Q87GE5,0.9742,484,0,Extracellular,9.72,0.9644,0.8827,0.0000,...,0,0,0.0000,0.0000,,,,MLKIKLPQQTSLAPSSETTQRLPVKISIKSICNKSICKTLHSLADK...,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
1679,tr|Q87J15|Q87J15_VIBPA ribonuclease H OS=Vibri...,Q87J15,0.5034,169,0,Unknown,0.00,0.9290,0.0152,0.9822,...,2,150,0.1065,0.1065,,,,MNTQLQTTHLLHNAQHPLSIYCDGSAPDNQHGCLQGGVGIAVYDAL...,,
1680,tr|Q87M94|Q87M94_VIBPA 4-methyl-5(B-hydroxyeth...,Q87M94,0.4849,199,0,Periplasmic,9.51,0.1114,0.0067,1.0000,...,9,191,0.1256,0.1256,,,,MSKKILVPIAPGTEEMEAVTVIDLMVRAGYDVTVASAAFDGALTMK...,,
1681,sp|Q87KZ9|PSD_VIBPA Phosphatidylserine decarbo...,Q87KZ9,0.4835,285,0,CytoplasmicMembrane,7.88,0.2315,0.0492,1.0000,...,4,277,0.1263,0.1263,,,,MDKIKVGLQYWIPQHGLTRLVGKLASAKAGSLTTAVIRWFIKQYNV...,,
1682,tr|Q87T63|Q87T63_VIBPA Putative oxidoreductase...,Q87T63,0.4422,253,0,Unknown,0.00,0.8465,0.0673,0.0830,...,8,5,0.1462,0.1265,,,,MLKDKKIVIAGAGGLLGASVVKSILEAGGSVVATDVSLEHLKARLS...,,


In [5]:
# 1684 proteins have been selected as potential vaccine candidates (the vaccine_candidates table displayed before this cell).
# now load the excluded proteins from discarded_proteins.csv and display them
# (relies on pandas having been imported as pd in an earlier cell)
discarded_proteins=pd.read_csv("./UP000002493/discarded_proteins.csv")
discarded_proteins

Unnamed: 0,id,uniprot_accession_code,score,length,transmembrane_doms,localization,localization score,virulence_probability,adhesin_probability,conservation_score,...,shared_mouse_peps,shared_conserv_proteome_peps,human_peptides_sum,mouse_peptides_sum,annotations,list_of_peptides_from_comparison_with_mhcpep_sapiens,list_of_peptides_from_comparison_with_mhcpep_mouse,sequence,original_sequence_if_razor,tmhmm_seq
0,tr|Q87SP5|Q87SP5_VIBPA Putative CFA/I fimbrial...,Q87SP5,0.9677,241,0,Cytoplasmic,9.97,0.9458,0.8311,0.0000,...,0,0,0.0000,0.0000,,,,MIRERSINLGHQVEGAIFTRHNHIVSVDGDGILSFQNNITKVKPNE...,,
1,tr|Q87I72|Q87I72_VIBPA Putative transcriptiona...,Q87I72,0.9677,332,0,Cytoplasmic,9.97,0.9262,0.8509,2.1295,...,0,467,0.0000,0.0000,DNA binding | DNA-binding transcription factor...,,,MQTRVRLTPPERNRMKNKDKNKKPLHNLDLNLLKIFRVVSEEKKTV...,,
2,sp|Q87MV3|NDPA_VIBPA Nucleoid-associated prote...,Q87MV3,0.9623,332,0,Cytoplasmic,9.97,0.8771,0.8620,1.0000,...,0,324,0.0000,0.0000,,,,MSLHLSNVILHQLCKNDQDELVVKLRPASLENDASTENLVAELHRV...,,
3,tr|Q87Q23|Q87Q23_VIBPA Transcriptional regulat...,Q87Q23,0.9620,254,0,Cytoplasmic,8.96,0.9320,0.9063,1.7441,...,0,315,0.0000,0.0000,,,,MNVGPKFLLAALRQKIKDEGLCYSSLSEKSGIPLSSIKRHLHNPSL...,,
4,tr|Q87MU3|Q87MU3_VIBPA KfrA_N domain-containin...,Q87MU3,0.9537,339,0,Cytoplasmic,8.96,0.9414,0.8382,0.0000,...,0,0,0.0000,0.0000,,,,MVNSMARPKTYTDEDLIQVANELISRGKKPSGWRIREYLQRGKSSS...,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
3132,tr|Q87HW1|Q87HW1_VIBPA ATP-dependent RNA helic...,Q87HW1,-16.8591,421,0,Cytoplasmic,9.97,0.1758,0.0125,3.0285,...,1465,795,8.9762,9.5036,"hydrolase activity, acting on acid anhydrides,...",,,MRFIMSVNFADLGIEQQLVETLNNMNIVTPTPVQEKSIPHVLEGKD...,,
3133,tr|Q87IM3|Q87IM3_VIBPA Putative ATP-dependent ...,Q87IM3,-16.9428,416,0,Cytoplasmic,9.97,0.3993,0.0104,2.4784,...,1285,399,9.0120,9.5889,ATPase activity | nucleoside-triphosphatase ac...,,,MTDKTQQATFADLGLIPTLVERLEALEYNQPTPIQSHAIPHVLDGR...,,
3134,tr|Q87SB9|Q87SB9_VIBPA ATP-dependent RNA helic...,Q87SB9,-16.9689,407,0,Cytoplasmic,9.97,0.2234,0.0104,2.8010,...,1363,692,9.0221,9.5799,"ATPase activity | hydrolase activity, acting o...",,,MIRTFAELDLDQNLLEAIEEMGYERPTKIQAEAIPQALDGRDILAS...,,
3135,tr|Q87LZ5|Q87LZ5_VIBPA ATP-dependent zinc meta...,Q87LZ5,-20.0077,662,2,CytoplasmicMembrane,10.00,0.1107,0.0086,0.9955,...,1190,651,4.0423,4.3837,purine ribonucleotide binding | purine ribonuc...,GPPGTGKTLLA,,MSDMAKNLILWLVIAVVLMSVFQSFGPGESNGRTVDYTTFVQEVGQ...,,iiiiiiMMMMMMMMMMMMMMMMMMMMoooooooooooooooooooo...


In [2]:
# 3137 proteins have been discarded.

In [1]:
# run NERVE on proteome UP000000585 as gram positive (-g p), writing into ./UP000000585; no second proteome (-p2) is given
!/NERVE/code/NERVE.py -p1 UP000000585 -wd ./UP000000585 -g p

Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [2]:
# run NERVE on proteome UP000000821 as gram positive (-g p), writing into ./UP000000821
# NOTE(review): --select False presumably switches off the select module that separates
# vaccine candidates from discarded proteins - confirm with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000000821 -wd ./UP000000821 -g p --select False

Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [3]:
# run NERVE on proteome UP000000801 as gram negative (-g n), writing into ./UP000000801
# NOTE(review): --select False presumably switches off the select module - confirm with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000000801 -wd ./UP000000801 -g n --select False


Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [8]:
# run NERVE on proteome UP000000535 as gram negative (-g n), writing into ./UP000000535
# NOTE(review): --select False presumably switches off the select module; the meaning of -nd ../../ is
# not visible in the truncated help output of this notebook - confirm both with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000000535 -wd ./UP000000535 -g n --select False -nd ../../


Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [9]:
# run NERVE on proteome UP000000540 as gram negative (-g n), writing into ./UP000000540
# NOTE(review): --select False presumably switches off the select module; the meaning of -nd ../../ is
# not visible in the truncated help output of this notebook - confirm both with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000000540 -wd ./UP000000540 -g n --select False -nd ../../


Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [10]:
# run NERVE on proteome UP000000431 as gram negative (-g n), writing into ./UP000000431
# NOTE(review): --select False presumably switches off the select module; the meaning of -nd ../../ is
# not visible in the truncated help output of this notebook - confirm both with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000000431 -wd ./UP000000431 -g n --select False -nd ../../



Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [11]:
# run NERVE on proteome UP000000806 as gram negative (-g n), writing into ./UP000000806
# NOTE(review): --select False presumably switches off the select module; the meaning of -nd ../../ is
# not visible in the truncated help output of this notebook - confirm both with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000000806 -wd ./UP000000806 -g n --select False -nd ../../


Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.


In [12]:
# run NERVE on proteome UP000023582 as gram negative (-g n), writing into ./UP000023582
# NOTE(review): --select False presumably switches off the select module; the meaning of -nd ../../ is
# not visible in the truncated help output of this notebook - confirm both with NERVE.py -h
!/NERVE/code/NERVE.py -p1 UP000023582 -wd ./UP000023582 -g n --select False -nd ../../


Start NERVE 1.5
10% done
20% done
30% done
40% done
50% done
60% done
70% done
80% done
90% done
100% done
End NERVE computation successfully.
