In [1]:
"""
    Switch between multiple references.
"""
from biograph import new_graph, reference, find_variants, visualize

# Open the graph that holds the data to be queried.
bg = new_graph("/mnt/NA12878_S1.gbwt")

# Load two references so the same graph can be examined in either
# coordinate system.
grch37 = reference("/reference/human_g1k_v37/")
grch38 = reference("/reference/homo_sapiens_GCA_000001405.19_GRCh38.p4/")

# Query the locus of interest against GRCh37 (chromosome 1) ...
grch37_coords = find_variants(bg, grch37, "1", 245822567, 245824567)

# ... and against the equivalent locus in GRCh38, which is addressed by
# the accession KI270759.1:
# http://www.ncbi.nlm.nih.gov/nuccore/KI270759.1
grch38_coords = find_variants(bg, grch38, "KI270759.1", 356442, 360442)

# Render each GRCh37 result: its variants, coverage, and reference range.
for region in grch37_coords:
    visualize(region.variants, region.coverage, region.ref_range)

                                .
                                .
                                .
           1:245822860      44 T│ 
           1:245822861      45 A│ 
           1:245822862      45 C│ 
                             1  ├───╮  44
           1:245822863       0 C│   │T 44
                             0  ├───╯  44
           1:245822864      44 G│ 
           1:245822865      44 G│ 
           1:245822866      43 G│ 
                                .
                                .
                                .
           1:245823566      31 G│ 
           1:245823567      31 T│ 
           1:245823568      31 C│ 
                             0  ├───╮  31  CTGAGGATCTAAGTACAGGG...[3865]
                                │   ╰──────────────────────────┄ 1:245823631 ╮
           1:245823569       0 G│ 
           1:245823570       0 T│ 
           1:245823571       0 G│ 
                                .
                                .
                              

In [6]:
# GRCh38 already includes this variant, at alternate locus KI270759.1.
#
# Reference:
#   Nature. 2001 Feb 15;409(6822):860-921.
#   http://www.ncbi.nlm.nih.gov/pubmed/11237011
#
# Because of that, it should not be called as a variant when the same
# data is compared against GRCh38.
for region in grch38_coords:
    visualize(region.variants, region.coverage, region.ref_range)

No variants found.
