In [1]:
import typing
import os

import hpotk
from phenopackets import Phenopacket

from genophenocorr.patient import PhenopacketPatientCreator
from genophenocorr.phenotype import PhenotypeCreator
from genophenocorr.protein import UniprotProteinMetadataService, ProteinAnnotationCache, ProtCachingFunctionalAnnotator
from genophenocorr.variant import VarCachingFunctionalAnnotator, VariantAnnotationCache, VepFunctionalAnnotator
from genophenocorr.cohort import PhenopacketCohortCreator, CohortAnalysis


In [2]:
fpath_hpo = 'hpo_data/hp.json'
cache_dir = 'KBG/annotations'
fpath_phenopackets = 'KBG/phenopackets'
tx_id = 'NM_013275.6'
protein_id = 'Q15327'
if not os.path.isdir(cache_dir):
    os.mkdir(cache_dir)

In [3]:
hpo: hpotk.ontology.Ontology = hpotk.ontology.load.obographs.load_ontology(fpath_hpo)
validators = [
    hpotk.validate.AnnotationPropagationValidator(hpo),
    hpotk.validate.ObsoleteTermIdsValidator(hpo),
    hpotk.validate.PhenotypicAbnormalityValidator(hpo)
]
phenotype_creator = PhenotypeCreator(hpo, hpotk.validate.ValidationRunner(validators))

In [4]:
# Protein metadata
pm = UniprotProteinMetadataService()
pac = ProteinAnnotationCache(cache_dir)
pfa = ProtCachingFunctionalAnnotator(pac, pm)

# Functional annotator
vac = VariantAnnotationCache(cache_dir)
vep = VepFunctionalAnnotator(pfa)
vfa = VarCachingFunctionalAnnotator(vac, vep)


# Assemble the patient creator
pc = PhenopacketPatientCreator(phenotype_creator, vfa)

In [5]:
cc = PhenopacketCohortCreator(pc)

In [6]:
patientCohort = cc.create_cohort(fpath_phenopackets)

Expected at least one HPO term per patient, but received none for patient VanDongen2019_P2
Expected at least one HPO term per patient, but received none for patient VanDongen2019_P12
Expected at least one HPO term per patient, but received none for patient Reuter2020
Expected at least one HPO term per patient, but received none for patient Novara, 2017_P10
Expected at least one variant per patient, but received none for patient Parenti2016_P1
Expected at least one HPO term per patient, but received none for patient VanDongen2019_P13
Expected at least one HPO term per patient, but received none for patient VanDongen2019_P8
Expected at least one HPO term per patient, but received none for patient VanDongen2019_P4
Expected at least one HPO term per patient, but received none for patient VanDongen2019_P5
Expected at least one HPO term per patient, but received none for patient KBG31B
Expected at least one HPO term per patient, but received none for patient VanDongen2019_P9
Expected at leas

In [7]:
patientCohort.list_all_phenotypes()

[('HP:0006482', 224),
 ('HP:0011446', 220),
 ('HP:0001249', 194),
 ('HP:0001155', 189),
 ('HP:0012758', 176),
 ('HP:0004322', 150),
 ('HP:0010938', 134),
 ('HP:0000534', 126),
 ('HP:0000343', 121),
 ('HP:0000365', 97),
 ('HP:0000325', 83),
 ('HP:0000356', 77),
 ('HP:0007018', 61),
 ('HP:0000729', 56)]

In [8]:
patientCohort.list_all_variants()

[('16_89284634_GTGTTT/G', 34),
 ('16_89284129_CTTTTT/C', 10),
 ('16_89284140_TTTTC/T', 9),
 ('16_89285157_GTTTC/G', 8),
 ('16_89275181_-/G', 5),
 ('16_89279750_-/G', 5),
 ('16_89217282_deletion', 4),
 ('16_89182742_deletion', 4),
 ('16_89277486_deletion', 4),
 ('16_89284345_G/A', 3),
 ('16_89284363_CTTTG/C', 3),
 ('16_89274958_C/G', 3),
 ('16_89282136_C/T', 3),
 ('16_89284565_G/C', 3),
 ('16_89284358_GAT/G', 3),
 ('16_89283314_CCTTT/C', 3),
 ('16_89284524_duplication', 3),
 ('16_89282710_T/A', 3),
 ('16_88197356_deletion', 3),
 ('16_89284209_TTCTC/T', 2),
 ('16_89321706_deletion', 2),
 ('16_89282947_CTTTTT/C', 2),
 ('16_89280029_-/G', 2),
 ('16_89095277_deletion', 2),
 ('16_89283233_-/T', 2),
 ('16_89275128_G/A', 2),
 ('16_89282834_CTGTT/C', 2),
 ('16_89262070_deletion', 2),
 ('16_89283496_CG/C', 2),
 ('16_89285153_TTTTG/T', 2),
 ('16_89280752_G/T', 2),
 ('16_89228900_deletion', 2),
 ('16_89268636_C/A', 2),
 ('16_89282455_G/A', 2),
 ('16_89281054_C/A', 2),
 ('16_89282158_-/T', 2),
 ('1

In [9]:
patientCohort.list_all_patients()

['Goldenberg2016_P13',
 'Low, 2016_P9 (1)',
 'VanDongen2019_P2',
 'Low, 2016_P29 (27)',
 'Ockeloen2015_P20',
 'Gnazzo, 2020_P29',
 'Gnazzo, 2020_P4',
 'Kutkowska-Kazmierczak2021_P22',
 'Low, 2016_P5 (6)',
 'VanDongen2019_P12',
 'Low, 2016_P2 (26)',
 'Walz2015_PC',
 'Ockeloen2015_P5',
 'Novara, 2017_P1',
 'Reuter2020',
 'KBG57',
 'Goldenberg2016_P29',
 'Scarano, 2013_P6',
 'Kutkowska-Kazmierczak2021_P18',
 'Novara, 2017_P10',
 'KBG41',
 'Gnazzo, 2020_P13',
 'KBG16',
 'Kutkowska-Kazmierczak2021_P3',
 'Khalifa, 2013_P1B',
 'KBG36',
 'KBG10B',
 'KBG20',
 'Gnazzo, 2020_P8',
 'Gnazzo, 2020_P25',
 'Goldenberg2016_P1',
 'Parenti2021_P13',
 'Goldenberg2016_P25',
 'Ockeloen2015_P9',
 'Sirmaci2011_P2/F1? (previously published Tekin, 2004)',
 'Goldenberg2016_P33',
 'Kutkowska-Kazmierczak2021_P14',
 'Parenti2016_P1',
 'Ockeloen2015_P16',
 'Ockeloen2015_P17',
 'Kutkowska-Kazmierczak2021_P15',
 'Goldenberg2016_P32',
 'Bucerzan2020',
 'Ockeloen2015_P8',
 'Goldenberg2016_P24',
 'Parenti2021_P12',
 'Mur

In [10]:
patientCohort.list_data_by_tx('NM_013275.6')

{'NM_013275.6': Counter({'stop_gained': 52,
          'splice_acceptor_variant': 2,
          'coding_sequence_variant': 43,
          '5_prime_UTR_variant': 42,
          'intron_variant': 54,
          'feature_truncation': 51,
          'splice_donor_variant': 2,
          'frameshift_variant': 97,
          'stop_lost': 28,
          '3_prime_UTR_variant': 29,
          'transcript_ablation': 14,
          'missense_variant': 7,
          'inframe_deletion': 2,
          'splice_region_variant': 2,
          'transcript_amplification': 1,
          'downstream_gene_variant': 1,
          'feature_elongation': 1})}

In [11]:
patientCohort.list_data_by_tx()

{'NM_001173541.2': Counter({'transcript_ablation': 8,
          'coding_sequence_variant': 1,
          '5_prime_UTR_variant': 1,
          'intron_variant': 1,
          'feature_truncation': 1,
          'transcript_amplification': 1}),
 'NM_001171815.2': Counter({'transcript_ablation': 19,
          'stop_lost': 1,
          'coding_sequence_variant': 1,
          '5_prime_UTR_variant': 1,
          '3_prime_UTR_variant': 1,
          'intron_variant': 1,
          'feature_truncation': 1,
          'transcript_amplification': 1}),
 'NM_144604.4': Counter({'transcript_ablation': 16,
          'transcript_amplification': 1,
          'stop_lost': 2,
          'coding_sequence_variant': 2,
          '5_prime_UTR_variant': 1,
          '3_prime_UTR_variant': 2,
          'intron_variant': 2,
          'feature_truncation': 2}),
 'NM_001351938.2': Counter({'transcript_ablation': 5,
          'transcript_amplification': 1,
          'upstream_gene_variant': 1}),
 'NM_017869.4': Counter({

In [12]:
patientCohort.all_proteins

{ProteinMetadata(id=NP_000092.2, label=Cytochrome b-245 light chain, features=(SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=134, end=195)),)),
 ProteinMetadata(id=NP_000476.1, label=Adenine phosphoribosyltransferase, features=()),
 ProteinMetadata(id=NP_000503.1, label=N-acetylgalactosamine-6-sulfatase, features=(SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Catalytic domain, start=27, end=379)),)),
 ProteinMetadata(id=NP_000968.2, label=60S ribosomal protein L13, features=()),
 ProteinMetadata(id=NP_001012777.1, label=Cytoplasmic tRNA 2-thiolation protein 2, features=(SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=1, end=24)), SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=188, end=217)))),
 ProteinMetadata(id=NP_001012780.1, label=Cytoplasmic tRNA 2-thiolation protein 2, features=(SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(na

In [13]:
analysis = CohortAnalysis(patientCohort, 'NM_013275.6', include_unmeasured=False)
analysis._testing_hpo_terms

{Phenotype(identifier=HP:0000325, observed=True),
 Phenotype(identifier=HP:0000343, observed=True),
 Phenotype(identifier=HP:0000356, observed=True),
 Phenotype(identifier=HP:0000365, observed=True),
 Phenotype(identifier=HP:0000534, observed=True),
 Phenotype(identifier=HP:0000729, observed=True),
 Phenotype(identifier=HP:0001155, observed=True),
 Phenotype(identifier=HP:0001249, observed=True),
 Phenotype(identifier=HP:0004322, observed=True),
 Phenotype(identifier=HP:0006482, observed=True),
 Phenotype(identifier=HP:0007018, observed=True),
 Phenotype(identifier=HP:0010938, observed=True),
 Phenotype(identifier=HP:0011446, observed=True),
 Phenotype(identifier=HP:0012758, observed=True)}

In [14]:
from genophenocorr.constants import variant_effects

In [15]:
variant_effects.MISSENSE_VARIANT.effect_description

'A sequence variant, that changes one or more bases, resulting in a different amino acid sequence but where the length is preserved'

In [16]:
analysis.compare_by_variant_type(variant_effects.FRAMESHIFT_VARIANT)

Unnamed: 0,with count,% with frameshift variant,count,% without frameshift variant,p-value
HP:0011446 (Abnormality of higher mental function),114,82.014388,106,95.495495,0.001371
HP:0007018 (Attention deficit hyperactivity disorder),35,81.395349,26,66.666667,0.13903
HP:0000325 (Triangular face),45,71.428571,38,58.461538,0.141518
HP:0001249 (Intellectual disability),100,84.745763,94,89.52381,0.323694
HP:0006482 (Abnormality of dental morphology),125,85.616438,99,81.818182,0.408845
HP:0001155 (Abnormality of the hand),101,67.333333,88,72.131148,0.428461
HP:0012758 (Neurodevelopmental delay),86,94.505495,90,96.774194,0.494487
HP:0000365 (Hearing impairment),52,80.0,45,76.271186,0.666875
HP:0010938 (Abnormal external nose morphology),71,89.873418,63,92.647059,0.772039
HP:0000729 (Autistic behavior),27,56.25,29,60.416667,0.836156


In [17]:
analysis.compare_by_variant('16_89284634_GTGTTT/G')

Unnamed: 0,with count,% with 16_89284634_GTGTTT/G,count,% without 16_89284634_GTGTTT/G,p-value
HP:0011446 (Abnormality of higher mental function),19,70.37037,201,90.134529,0.007468
HP:0010938 (Abnormal external nose morphology),13,81.25,121,92.366412,0.153085
HP:0007018 (Attention deficit hyperactivity disorder),7,100.0,54,72.0,0.182109
HP:0001249 (Intellectual disability),15,78.947368,179,87.745098,0.283659
HP:0000534 (Abnormal eyebrow morphology),10,71.428571,116,82.269504,0.299278
HP:0001155 (Abnormality of the hand),22,78.571429,167,68.442623,0.385988
HP:0000729 (Autistic behavior),3,42.857143,53,59.550562,0.445576
HP:0000365 (Hearing impairment),7,70.0,90,78.947368,0.452661
HP:0012758 (Neurodevelopmental delay),14,93.333333,162,95.857988,0.500526
HP:0000343 (Long philtrum),11,73.333333,110,80.291971,0.50892


In [18]:
analysis2 = CohortAnalysis(patientCohort, 'NM_013275.6', include_unmeasured=False, include_large_SV=False)

analysis2.compare_by_exon(9)

Unnamed: 0,with count,% inside exon 9,count,% outside exon 9,p-value
HP:0004322 (Short stature),107,62.941176,8,36.363636,0.021011
HP:0011446 (Abnormality of higher mental function),155,85.164835,23,100.0,0.049316
HP:0001155 (Abnormality of the hand),136,70.103093,19,90.47619,0.070007
HP:0007018 (Attention deficit hyperactivity disorder),43,81.132075,8,61.538462,0.151609
HP:0000365 (Hearing impairment),65,78.313253,9,69.230769,0.48669
HP:0000534 (Abnormal eyebrow morphology),94,82.45614,10,76.923077,0.703322
HP:0001249 (Intellectual disability),137,86.708861,21,91.304348,0.743049
HP:0000729 (Autistic behavior),33,56.896552,8,66.666667,0.749049
HP:0012758 (Neurodevelopmental delay),120,96.0,12,100.0,1.0
HP:0000356 (Abnormality of the outer ear),49,81.666667,9,90.0,1.0


In [19]:
from genophenocorr.protein import FeatureType


In [20]:
analysis.compare_by_protein_feature_type(FeatureType.REGION)

635
636
635
636
635
636
635
636
710
711
710
711
710
711
710
711
710
711
710
711
710
711
710
711
710
711
710
711
710
711
710
711
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
2494
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
733
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
956
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
1007
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
725
727
725
727
725
727
725
727
725
727
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
2334
461
462
461
462
461
462
461
462
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
883
487
488
487
488
487
488
487
488
635
636
635
636
635
636


635
636
635
636
635
636
800
801
800
801
800
801
800
801
800
801
800
801
800
801
800
801
800
801
800
801
800
801
800
801
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
2158
777
778
777
778
777
778
777
778
777
778
1
673
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
571
575
571
575
571
575
571
575
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
1325
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
769
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
2585
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
884
2228
2228


2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
2398
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1146
1154
1146
1154
1146
1154
1146
1154
1146
1154
1146
1154
1146
1154
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
1065
725
727
725
727
725
727
725
727
725
727
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
1074
1075
1074
1075
1074
1075
1074
1075
1074
1075
1074
1075
1074
1075
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406
2406

728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
728
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1708
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
1402
2005
2006
2005
2006
2005
2006
2005
2006
2005
2006
2005
2006
2005
2006
2005
2006
2005
2006
2005
2006
183
184
183
184
183
184
183
184
183
184
183
184
183
184
183
184
183
184
183
184
183
184
183
184
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
2063
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
1930
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
2234
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
1104
110

1735
1736
1735
1736
1735
1736
1735
1736
635
636
635
636
635
636
635
636
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
1985
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
647
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2471
2475
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
2612
1
673
461
462
461
462
461
462
461
462
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
803
805
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1716
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
1830
2264
2265
2264
2265
2264
2265
2264
2265
2264
2265
2264
2265
2264
2265
2264
2265
2264
2265
2264
226

1758
1759
1758
1759
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1406
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1113
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1391
1146
1154
1146
1154
1146
1154
1146
1154
1146
1154
1146
1154
1146
1154
766
767
766
767
766
767
766
767
766
767
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
1128
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
2397
725
727
725
727
725
727
725
727
725
727
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
1464
1465
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
659
1074
1075
1074
1075
1074
1075
1074
1075
1074
1075
1074

Unnamed: 0,with count,% inside FeatureType.REGION,count,% outside exon FeatureType.REGION,p-value
HP:0001249 (Intellectual disability),57,79.166667,137,90.728477,0.020101
HP:0007018 (Attention deficit hyperactivity disorder),23,85.185185,38,69.090909,0.177981
HP:0001155 (Abnormality of the hand),60,64.516129,129,72.067039,0.213516
HP:0011446 (Abnormality of higher mental function),69,84.146341,151,89.880952,0.215477
HP:0000325 (Triangular face),30,71.428571,53,61.627907,0.326993
HP:0004322 (Short stature),47,53.409091,103,60.233918,0.352367
HP:0000365 (Hearing impairment),27,72.972973,70,80.45977,0.353359
HP:0006482 (Abnormality of dental morphology),72,80.898876,152,85.393258,0.378986
HP:0000343 (Long philtrum),43,81.132075,78,78.787879,0.834111
HP:0012758 (Neurodevelopmental delay),64,95.522388,112,95.726496,1.0


In [21]:
for var in patientCohort.all_variants:
    for trans in var.tx_annotations:
        print(trans.protein_affected)

(ProteinMetadata(id=NP_001243111.1, label=Ankyrin repeat domain-containing protein 11, features=(SimpleProteinFeature(type=FeatureType.REPEAT, info=FeatureInfo(name=ANK 1, start=167, end=196)), SimpleProteinFeature(type=FeatureType.REPEAT, info=FeatureInfo(name=ANK 2, start=200, end=229)), SimpleProteinFeature(type=FeatureType.REPEAT, info=FeatureInfo(name=ANK 3, start=233, end=262)), SimpleProteinFeature(type=FeatureType.REPEAT, info=FeatureInfo(name=ANK 4, start=266, end=292)), SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=1, end=90)), SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=128, end=169)), SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=289, end=380)), SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=398, end=647)), SimpleProteinFeature(type=FeatureType.REGION, info=FeatureInfo(name=Disordered, start=723, end=783)), SimplePr