In [1]:
import pandas as pd

# OptiVax-Robust Augmentation Constructs

In [2]:
# Fixed flanking and linker sequences shared by every construct in this notebook.
# Sources: (Kreiter et al., 2008; Sahin et al., 2017)
#   https://www.jimmunol.org/content/180/1/309.full
#   https://www.nature.com/articles/nature23003

# Prefix placed at the very start of each construct.
SIGNAL_SEQ = 'MRVTAPRTLILLLSGALALTETWAGS'
# Suffix placed at the very end of each construct.
MITD_SEQ = 'IVGIVAGLAVLAVVVIGAVVATVMCRRKSSGGKGGSYSQAASSDSAQGSDVSLTA'
# Linkers: one after the signal, one between consecutive peptides, one before the MITD.
START_LINKER_SEQ = 'GGSGGGGSGG'
MIDDLE_LINKER_SEQ = 'GGSGGGGSGG'
END_LINKER_SEQ = 'GGSLGGGGSG'
# Sanity check on the lengths of the fixed parts (signal, MITD, middle linker).
print(*(len(seq) for seq in (SIGNAL_SEQ, MITD_SEQ, MIDDLE_LINKER_SEQ)))

26 55 10


## Separate Designs

In [3]:
# The file is read without a header row (names= is supplied), giving a single
# 'peptide' column.
s_peptides = pd.read_csv('S-augmentation-peptide.txt', names=['peptide'])
# Flag peptides of at most 12 characters; later cells split on this column to
# build s_mhc1_peptides (flag set) and s_mhc2_peptides (flag not set).
s_peptides['mhc_1'] = s_peptides['peptide'].map(len) <= 12
s_peptides

Unnamed: 0,peptide,mhc_1
0,ATSRTLSYY,True
1,FAYANRNRF,True
2,FLNRFTTTL,True
3,FTYASALWEI,True
4,SINFVRIIMR,True
5,SPRWYFYYL,True
6,TVYSHLLLV,True
7,YIFFASFYY,True
8,YLDAYNMMI,True
9,AVFQSASKIITLKKRWQLA,False


In [4]:
# Peptides whose mhc_1 flag is True, as a plain Python list (row and column
# selected in a single .loc call).
s_mhc1_peptides = s_peptides.loc[s_peptides['mhc_1'], 'peptide'].tolist()
print(len(s_mhc1_peptides), s_mhc1_peptides, sep='\n')

9
['ATSRTLSYY', 'FAYANRNRF', 'FLNRFTTTL', 'FTYASALWEI', 'SINFVRIIMR', 'SPRWYFYYL', 'TVYSHLLLV', 'YIFFASFYY', 'YLDAYNMMI']


In [5]:
# Complement of the mhc_1 selection: every peptide whose flag is False.
s_mhc2_peptides = s_peptides.loc[~s_peptides['mhc_1'], 'peptide'].tolist()
print(len(s_mhc2_peptides), s_mhc2_peptides, sep='\n')

20
['AVFQSASKIITLKKRWQLA', 'DGVKHVYQLRARSVSPKLFI', 'DNKFALTCFSTQFAFACPDG', 'DQVILLNKHIDAYKTFPPT', 'EHVTFFIYNKIVDEPEEHV', 'HQPYVVDDPCPIHFYSKWYI', 'IITLKKRWQLALSKGVHFV', 'MDLFMRIFTIGTVTLKQGE', 'MWLSYFIASFRLFARTRSM', 'NGGDAALALLLLDRLNQLE', 'PKEITVATSRTLSYYKLGA', 'PRQKRTATKAYNVTQAFGR', 'PSDFVRATATIPIQASLPF', 'RWYFYYLGTGPEAGLPYGA', 'SFRLFARTRSMWSFNPETN', 'SYFTSDYYQLYSTQLSTDT', 'TGPEAGLPYGANKDGIIWV', 'TSPARMAGNGGDAALALLL', 'TYTGAIKLDDKDPNFKDQV', 'VKDCVVLHSYFTSDYYQLY']


In [6]:
def assemble_construct(peptides):
    """Build one construct string from an ordered sequence of peptides.

    Layout, left to right:
        SIGNAL_SEQ, START_LINKER_SEQ, the peptides joined by
        MIDDLE_LINKER_SEQ, END_LINKER_SEQ, MITD_SEQ.

    Args:
        peptides: iterable of peptide strings, in the order they should
            appear in the construct.

    Returns:
        The concatenated construct as a single string.
    """
    return ''.join([
        SIGNAL_SEQ,
        START_LINKER_SEQ,
        MIDDLE_LINKER_SEQ.join(peptides),
        END_LINKER_SEQ,
        MITD_SEQ,
    ])


# Both designs share one layout; building them through the same helper keeps
# the two constructs from drifting apart.
s_mhc1_construct = assemble_construct(s_mhc1_peptides)
s_mhc2_construct = assemble_construct(s_mhc2_peptides)

print('S MHC 1 construct length: ', len(s_mhc1_construct))
print('S MHC 2 construct length: ', len(s_mhc2_construct))

S MHC 1 construct length:  264
S MHC 2 construct length:  674


In [7]:
# Show the complete assembled s_mhc1_construct string.
print(s_mhc1_construct)

MRVTAPRTLILLLSGALALTETWAGSGGSGGGGSGGATSRTLSYYGGSGGGGSGGFAYANRNRFGGSGGGGSGGFLNRFTTTLGGSGGGGSGGFTYASALWEIGGSGGGGSGGSINFVRIIMRGGSGGGGSGGSPRWYFYYLGGSGGGGSGGTVYSHLLLVGGSGGGGSGGYIFFASFYYGGSGGGGSGGYLDAYNMMIGGSLGGGGSGIVGIVAGLAVLAVVVIGAVVATVMCRRKSSGGKGGSYSQAASSDSAQGSDVSLTA


In [8]:
# Show the complete assembled s_mhc2_construct string.
print(s_mhc2_construct)

MRVTAPRTLILLLSGALALTETWAGSGGSGGGGSGGAVFQSASKIITLKKRWQLAGGSGGGGSGGDGVKHVYQLRARSVSPKLFIGGSGGGGSGGDNKFALTCFSTQFAFACPDGGGSGGGGSGGDQVILLNKHIDAYKTFPPTGGSGGGGSGGEHVTFFIYNKIVDEPEEHVGGSGGGGSGGHQPYVVDDPCPIHFYSKWYIGGSGGGGSGGIITLKKRWQLALSKGVHFVGGSGGGGSGGMDLFMRIFTIGTVTLKQGEGGSGGGGSGGMWLSYFIASFRLFARTRSMGGSGGGGSGGNGGDAALALLLLDRLNQLEGGSGGGGSGGPKEITVATSRTLSYYKLGAGGSGGGGSGGPRQKRTATKAYNVTQAFGRGGSGGGGSGGPSDFVRATATIPIQASLPFGGSGGGGSGGRWYFYYLGTGPEAGLPYGAGGSGGGGSGGSFRLFARTRSMWSFNPETNGGSGGGGSGGSYFTSDYYQLYSTQLSTDTGGSGGGGSGGTGPEAGLPYGANKDGIIWVGGSGGGGSGGTSPARMAGNGGDAALALLLGGSGGGGSGGTYTGAIKLDDKDPNFKDQVGGSGGGGSGGVKDCVVLHSYFTSDYYQLYGGSLGGGGSGIVGIVAGLAVLAVVVIGAVVATVMCRRKSSGGKGGSYSQAASSDSAQGSDVSLTA


## Joint Design

In [9]:
# Read the joint-design file into a single 'peptide' column (no header row is
# expected because names= is supplied) and keep just the values as a list.
joint_s_peptides = (
    pd.read_csv('Joint-vaccine-peptide.txt', names=['peptide'])
    .loc[:, 'peptide']
    .tolist()
)
print(len(joint_s_peptides), joint_s_peptides, sep='\n')

33
['ASEFSSLPSYAAFATAQEAYEQAVA', 'DTDFVNEFYAYLRKHFSMMILSDDA', 'DYPKCDRAMPNMLRIMASLVLARKH', 'EKVNINIVGDFKLNEEIAIILASFS', 'ESPFVMMSAPPAQYELKHGTFTCAS', 'FGLVAEWFLAYILFTRFFYVLGLAA', 'FKIYSKHTPINLVRDLPQGFSALEP', 'FRNARNGVLITEGSVKGLQPSVGPK', 'GAGAALQIPFAMQMAYRFNGIGVTQ', 'GIATVREVLSDRELHLSWEVGKPRP', 'GLMWLSYFIASFRLFARTRSMWSFN', 'GVSFSTFEEAALCTFLLNKEMYLKL', 'GVYDYLVSTQEFRYMNSQGLLPPKN', 'GWTAGAAAYYVGYLQPRTFLLKYNE', 'IICISTKHFYWFFSNYLKRRVVFNG', 'IPKDMTYRRLISMMGFKMNYQVNGY', 'LDISASIVAGGIVAIVVTCLAYYFM', 'LQSLQTYVTQQLIRAAEIRASANLA', 'NNLVVMAYITGGVVQLTSQWLTNIF', 'PLIQPIGALDISASIVAGGIVAIVV', 'QPTESIVRFPNITNLCPFGEVFNAT', 'SIKNFKSVLYYQNNVFMSEAKCWTE', 'SQSIIAYTMSLGAENSVAYSNNSIA', 'TDTPKGPKVKYLYFIKGLNNLNRGM', 'TFCAGSTFISDEVARDLSLQFKRPI', 'TFYLTNDVSFLAHIQWMVMFTPLVP', 'TITQMNLKYAISAKNRARTVAGVSI', 'TITSGWTFGAGAALQIPFAMQMAYR', 'TSQWLTNIFGTVYEKLKPVLDWLEE', 'VRKIFVDGVPFVVSTGYHFRELGVV', 'VVFVLWAHGFELTSMKYFVKIGPER', 'WESGVKDCVVLHSYFTSDYYQLYST', 'YESLRPDTRYVLMDGSIIQFPNTYL']


In [10]:
# Joint construct: signal, start linker, all joint peptides separated by the
# middle linker, end linker, then the MITD suffix.
s_joint_construct = ''.join((
    SIGNAL_SEQ,
    START_LINKER_SEQ,
    MIDDLE_LINKER_SEQ.join(joint_s_peptides),
    END_LINKER_SEQ,
    MITD_SEQ,
))

print('S Joint MHC I/II construct length: ', len(s_joint_construct))

S Joint MHC I/II construct length:  1246


In [11]:
# Show the complete assembled s_joint_construct string.
print(s_joint_construct)

MRVTAPRTLILLLSGALALTETWAGSGGSGGGGSGGASEFSSLPSYAAFATAQEAYEQAVAGGSGGGGSGGDTDFVNEFYAYLRKHFSMMILSDDAGGSGGGGSGGDYPKCDRAMPNMLRIMASLVLARKHGGSGGGGSGGEKVNINIVGDFKLNEEIAIILASFSGGSGGGGSGGESPFVMMSAPPAQYELKHGTFTCASGGSGGGGSGGFGLVAEWFLAYILFTRFFYVLGLAAGGSGGGGSGGFKIYSKHTPINLVRDLPQGFSALEPGGSGGGGSGGFRNARNGVLITEGSVKGLQPSVGPKGGSGGGGSGGGAGAALQIPFAMQMAYRFNGIGVTQGGSGGGGSGGGIATVREVLSDRELHLSWEVGKPRPGGSGGGGSGGGLMWLSYFIASFRLFARTRSMWSFNGGSGGGGSGGGVSFSTFEEAALCTFLLNKEMYLKLGGSGGGGSGGGVYDYLVSTQEFRYMNSQGLLPPKNGGSGGGGSGGGWTAGAAAYYVGYLQPRTFLLKYNEGGSGGGGSGGIICISTKHFYWFFSNYLKRRVVFNGGGSGGGGSGGIPKDMTYRRLISMMGFKMNYQVNGYGGSGGGGSGGLDISASIVAGGIVAIVVTCLAYYFMGGSGGGGSGGLQSLQTYVTQQLIRAAEIRASANLAGGSGGGGSGGNNLVVMAYITGGVVQLTSQWLTNIFGGSGGGGSGGPLIQPIGALDISASIVAGGIVAIVVGGSGGGGSGGQPTESIVRFPNITNLCPFGEVFNATGGSGGGGSGGSIKNFKSVLYYQNNVFMSEAKCWTEGGSGGGGSGGSQSIIAYTMSLGAENSVAYSNNSIAGGSGGGGSGGTDTPKGPKVKYLYFIKGLNNLNRGMGGSGGGGSGGTFCAGSTFISDEVARDLSLQFKRPIGGSGGGGSGGTFYLTNDVSFLAHIQWMVMFTPLVPGGSGGGGSGGTITQMNLKYAISAKNRARTVAGVSIGGSGGGGSGGTITSGWTFGAGAALQIPFA