In [31]:
import os
import sys

from genophenocorr import *
import json
from google.protobuf.json_format import Parse
from phenopackets import Phenopacket 
import requests
import re
import pickle
from pyliftover import LiftOver

In [2]:
# Construct the cohort object that every analysis cell below operates on.
allKBGPatients = Cohort(
    'phenopackets/*.json',
    transcript='NM_013275.6',
    pickled_dir='pickledVariants',
)




In [3]:
# Show the cohort's testable categories: the recorded output is a dict with
# 'variant_types' and 'variants' keys, each mapping a name to a count.
allKBGPatients.list_possible_tests()

{'variant_types': {'stop_lost': 34,
  'coding_sequence_variant': 51,
  '5_prime_UTR_variant': 47,
  '3_prime_UTR_variant': 35,
  'intron_variant': 63,
  'feature_truncation': 58,
  'copy_number_change': 80,
  'copy_number_decrease': 74,
  'frameshift_variant': 177,
  'missense_variant': 8,
  'stop_gained': 67,
  'transcript_ablation': 14,
  'splice_acceptor_variant': 5,
  'copy_number_increase': 6,
  'splice_donor_variant': 1,
  'feature_elongation': 3,
  'splice_region_variant': 2,
  'transcript_amplification': 1,
  'inframe_deletion': 1,
  'downstream_gene_variant': 1},
 'variants': {'16q24.3(88743575_89406219)x1': 1,
  'chr16:g.89284131_89284135del': 10,
  'chr16:g.89274920C>G': 1,
  'chr16:g.89284741G>A': 1,
  '16q24.3(88197484-89321695)x1': 1,
  '16q24.3(89217281_89506042)x1': 1,
  'chr16:g.89284641_89284645del': 34,
  '16q24.3(89409759-89418313)x1': 1,
  'chr16:g.89284450_89284454del': 1,
  'chr16:g.89284413del': 1,
  'chr16:g.89275185dup': 5,
  '16q24.2-q24.3 (88568592_89562542)

In [4]:
# Display the per-patient summary table (Patient ID, Disease, Gene, Variant,
# Protein, HPO Terms columns in the recorded output).
allKBGPatients.get_cohort_description_df()

Unnamed: 0,Patient ID,Disease,Gene,Variant,Protein,HPO Terms
0,Goldenberg2016_P13,OMIM:148050,{ANKRD11},{16q24.3(88743575_89406219)x1},{NP_037407.4},"{HP:0001155, HP:0004322}"
1,"Low, 2016_P9 (1)",OMIM:148050,{ANKRD11},{chr16:g.89284131_89284135del},{NP_037407.4},"{HP:0001155, HP:0000729, HP:0011446, HP:000432..."
2,VanDongen2019_P2,OMIM:148050,{ANKRD11},{chr16:g.89274920C>G},{NP_037407.4},{}
3,"Low, 2016_P29 (27)",OMIM:148050,{ANKRD11},{chr16:g.89284741G>A},{NP_037407.4},"{HP:0000365, HP:0001155, HP:0006482}"
4,Ockeloen2015_P20,OMIM:148050,{ANKRD11},{16q24.3(88197484-89321695)x1},{NP_037407.4},"{HP:0001249, HP:0004322, HP:0011446, HP:0006482}"
...,...,...,...,...,...,...
335,"Murray, 2017_P13 (11.1)",OMIM:148050,{ANKRD11},{chr16:g.89279326G>A},{NP_037407.4},"{HP:0007018, HP:0001155, HP:0011446, HP:001093..."
336,Ockeloen2015_P19,OMIM:148050,{ANKRD11},{chr16:g.89285224G>A},{NP_037407.4},"{HP:0001155, HP:0011446, HP:0004322, HP:000648..."
337,"Gnazzo, 2020_P10",OMIM:148050,{ANKRD11},{chr16:g.89284144_89284147del},{NP_037407.4},"{HP:0001155, HP:0011446, HP:0000343, HP:000432..."
338,KBG15,OMIM:148050,{ANKRD11},{chr16:g.89279573_89279580del},{NP_037407.4},"{HP:0000729, HP:0000365, HP:0011446, HP:001093..."


In [5]:
# Run the cohort statistics with the is_var_type / is_not_var_type predicate
# pair, both parameterised with 'copy_number_change'. The result table lists,
# per HPO term, the with/without counts for groups 1 and 2 plus the p-values.
allKBGPatients.run_stats(
    is_var_type,
    is_not_var_type,
    'copy_number_change',
    'copy_number_change',
    remove_not_measured=True,
)

Unnamed: 0,1 w/ hpo,1 w/o hpo,2 w/ hpo,2 w/o hpo,pval,adjusted pval
HP:0000325 - Triangular face,14,17,68,27,0.00961,0.134544
HP:0001155 - Abnormality of the hand,32,23,155,60,0.050844,0.355911
HP:0000356 - Abnormality of the outer ear,18,8,58,12,0.163971,0.693027
HP:0007018 - Attention deficit hyperactivity disorder,9,6,51,15,0.198008,0.693027
HP:0011446 - Abnormality of higher mental function,40,3,178,27,0.314422,0.880382
HP:0012758 - Neurodevelopmental delay,42,3,132,5,0.410544,0.917446
HP:0004322 - Short stature,35,30,115,77,0.466921,0.917446
HP:0006482 - Abnormality of dental morphology,42,10,182,32,0.524255,0.917446
HP:0000534 - Abnormal eyebrow morphology,21,6,104,23,0.595737,0.926702
HP:0000365 - Hearing impairment,22,5,74,22,0.794112,0.947301


In [6]:
# Run the cohort statistics with the is_var_match / is_not_var_match predicate
# pair, both parameterised with the variant 'chr16:g.89284641_89284645del'.
# Structural variants are excluded via include_structural_vars=False.
allKBGPatients.run_stats(
    is_var_match,
    is_not_var_match,
    'chr16:g.89284641_89284645del',
    'chr16:g.89284641_89284645del',
    remove_not_measured=True,
    include_structural_vars=False,
)

Unnamed: 0,1 w/ hpo,1 w/o hpo,2 w/ hpo,2 w/o hpo,pval,adjusted pval
HP:0011446 - Abnormality of higher mental function,19,8,159,19,0.01264,0.176957
HP:0010938 - Abnormal external nose morphology,13,3,98,8,0.157888,0.733814
HP:0001249 - Intellectual disability,15,4,143,19,0.271433,0.733814
HP:0000534 - Abnormal eyebrow morphology,10,4,94,19,0.280936,0.733814
HP:0007018 - Attention deficit hyperactivity disorder,7,0,44,15,0.336415,0.733814
HP:0000729 - Autistic behavior,3,4,38,25,0.437512,0.733814
HP:0012758 - Neurodevelopmental delay,14,1,118,4,0.445111,0.733814
HP:0001155 - Abnormality of the hand,22,6,133,54,0.502506,0.733814
HP:0000343 - Long philtrum,11,4,91,22,0.504241,0.733814
HP:0004322 - Short stature,14,12,101,65,0.524153,0.733814


In [7]:
# Run the cohort statistics with the in_exon / not_in_exon predicate pair,
# both parameterised with exon number 9; structural variants are excluded.
allKBGPatients.run_stats(
    in_exon,
    not_in_exon,
    9,
    9,
    remove_not_measured=True,
    include_structural_vars=False,
)

Unnamed: 0,1 w/ hpo,1 w/o hpo,2 w/ hpo,2 w/o hpo,pval,adjusted pval
HP:0004322 - Short stature,107,63,8,14,0.021011,0.294157
HP:0011446 - Abnormality of higher mental function,155,27,23,0,0.049316,0.3267
HP:0001155 - Abnormality of the hand,136,58,19,2,0.070007,0.3267
HP:0007018 - Attention deficit hyperactivity disorder,43,10,8,5,0.151609,0.530632
HP:0000365 - Hearing impairment,65,18,9,4,0.48669,1.0
HP:0000534 - Abnormal eyebrow morphology,94,20,10,3,0.703322,1.0
HP:0001249 - Intellectual disability,137,21,21,2,0.743049,1.0
HP:0000729 - Autistic behavior,33,25,8,4,0.749049,1.0
HP:0006482 - Abnormality of dental morphology,161,29,21,3,1.0,1.0
HP:0000325 - Triangular face,57,23,11,4,1.0,1.0


In [11]:
# Grab one (variant string, Variant) pair from the cohort for inspection.
# NOTE(review): popitem() on a dict-like also REMOVES the entry, so if
# all_variants_d is the cohort's live mapping this cell is not idempotent and
# later statistics would no longer see this variant — confirm this is intended.
patTest = allKBGPatients.all_variants_d.popitem()

In [12]:
# Display the (variant string, Variant object) pair held in patTest.
patTest

('chr16:g.89279573_89279580del',
 <genophenocorr.variant.Variant at 0x28de628c0>)

In [14]:
# Inspect the allelic_state attribute of the variant's private _varInterp
# object (patTest[1] is the Variant half of the pair).
patTest[1]._varInterp.allelic_state

ga4gh.vrsatile.v1.vrsatile_pb2.VariationDescriptor

In [16]:
# Grab another (variant string, Variant) pair and display it.
# NOTE(review): popitem() on a dict-like also removes the entry from
# all_variants_d; which item is returned depends on how many times popitem()
# has already been run in this kernel — confirm this is intended.
testPat = allKBGPatients.all_variants_d.popitem()
testPat

('16q24.2-q24.3 (87306529_89269020)x1',
 <genophenocorr.variant.Variant at 0x28d465690>)

In [21]:
# Check whether the vcf_record.alt field of this variant is empty
# (evaluates to True for the testPat shown in the recorded output).
len(testPat[1]._varInterp.vcf_record.alt) == 0

True

In [27]:
# Extract the two-digit chromosome number from the RefSeq accession stored in
# sequence_id (e.g. '16' from 'NC_000016.10').
# The dot is escaped so it only matches the literal version separator, and the
# version is matched with \d+ rather than exactly two digits, so accessions
# with a single-digit version such as 'NC_000016.9' no longer produce an empty
# match list (which made the [0] lookup raise IndexError).
chrom = re.findall(r'NC_0000(\d{2})\.\d+', testPat[1]._varInterp.variation.copy_number.allele.sequence_location.sequence_id)[0]


In [29]:
# Scratch check: turn a zero-padded chromosome string into its plain form
# ('01' -> '1'); values without a leading zero are left untouched.
chrom = '01'
chrom = str(int(chrom)) if chrom.startswith('0') else chrom
print(chrom)

1


In [23]:
# Show the expressions attached to the variant's _varInterp object.
# The original cell ended in a dangling '.', which is a SyntaxError on re-run;
# the recorded output (a list of syntax/value entries such as hgvs.c and
# hgvs.g) corresponds to the `expressions` field.
patTest[1]._varInterp.expressions

[syntax: "hgvs.c"
value: "NM_013275.6:c.6968_6975del"
, syntax: "hgvs.g"
value: "NC_000016.10:g.89279573_89279580del"
]

In [32]:
# Create the LiftOver object for the 'hg19' -> 'hg38' conversion used below.
lift = LiftOver('hg19', 'hg38')

In [33]:
# Convert a single chr16 position with the LiftOver object; the recorded
# result is a list of (chromosome, position, strand, score-like value) tuples.
# NOTE(review): pyliftover documents its positions as 0-based — confirm that
# 89279853 has already been converted from the 1-based genomic coordinate.
lift.convert_coordinate(chromosome='chr16', position=89279853)

[('chr16', 89213445, '+', 7470613414)]

In [1]:
import ensembl_rest

In [2]:
import requests

In [3]:
# Query the VariantValidator VariantFormatter REST endpoint for the GRCh38
# variant 16:89279850:G:GC and keep the raw HTTP response.
# A timeout is set because requests.get() otherwise waits indefinitely on an
# unresponsive server, which would hang the notebook.
json_results = requests.get(
    'https://rest.variantvalidator.org/VariantFormatter/variantformatter/GRCh38/16%3A89279850%3AG%3AGC/all/all/True?content-type=application%2Fjson',
    timeout=30,
)
# Fail here with a clear HTTPError on a 4xx/5xx status instead of failing
# later when the body is parsed or indexed.
json_results.raise_for_status()



In [6]:
json = json_results.json()

In [13]:
print(json.keys())
key = list(json.keys())[0]
value = json[key][key]['g_hgvs']
print(value)

dict_keys(['16:89279850:G:GC', 'metadata'])
NC_000016.10:g.89279853dup


In [1]:
import phenopackets

In [None]:
# Look up the GenomicInterpretation attribute of the phenopackets package
# (this cell has no execution count, i.e. it has not been run).
phenopackets.GenomicInterpretation