In [3]:
from Bio.SeqIO.FastaIO import SimpleFastaParser
import config_readwrite as crw

import glob
import gzip
import numpy as np
import os, sys
import pandas as pd
import subprocess as sp

# find coordinates of kmers

In [4]:
CL, MER, NMUTS, BUILD, FO_ONLY = "common", "14", "2", "hs1", True
config, cfn = crw.read(os.path.join(os.getcwd(), "config.ini"))

In [5]:
COOR = f"/wynton/home/ahituv/fongsl/MPRA/agarwal_2023/kmers/{MER}mers/coor"

FA_MUT =  config[f"common.{MER}mer.{NMUTS}mut"]["fa_fo-true"]
TSV_MUT =  config[f"common.{MER}mer.{NMUTS}mut"]["tsv_fo-true"]

# load TSV

In [43]:
tsv=pd.read_csv(TSV_MUT, sep='\t', header=None, 
                names=["kmer", "nKmer", "gcKmer", "null", "nNull", "gcNull", "pretty"])
tsv.head(17)

Unnamed: 0,kmer,nKmer,gcKmer,null,nNull,gcNull,pretty
0,CTTGGCGTAGTCCG,2,0.64,CGTAGCGTAGTCCG,1,0.64,.G.A..........
1,CTTGGCGAATATAG,2,0.43,CGTCGCGAATATAG,1,0.5,.G.C..........
2,AAATTGCGCGTAAC,4,0.43,GAATCGCGCGTAAC,1,0.57,G...C.........
3,TTGGGCGCCGCAAT,2,0.64,TTGCGCGCCGTAAT,1,0.57,...C......T...
4,TTGGGTTCGGCGAC,2,0.64,ATGCGTTCGGCGAC,1,0.64,A..C..........
5,TTGGGAATCGCGCG,2,0.64,TAGCGAATCGCGCG,1,0.64,.A.C..........
6,TTGGGCGCGAATTA,2,0.5,TTGCGCGCGAGTTA,1,0.57,...C......G...
7,AATTTTGCGCGTCT,2,0.43,AATTTCGCGCGTCC,1,0.57,.....C.......C
8,GGGCCGATCGTGCG,2,0.79,GGGTCGATCGTACG,1,0.64,...T.......A..
9,GGGCCTATTCGGAC,2,0.64,GCGCGTATTCGGAC,1,0.64,.C..G.........


# explode columns - nullomer, gc, pretty 

In [60]:
explode_cols = ["null", "gcNull", "pretty"]
for col in explode_cols:
    tsv[col]=tsv[col].apply(lambda x: x.split(","))

tsv = tsv.explode(explode_cols)
tsv["coor"] = None
tsv.head(18)

Unnamed: 0,kmer,nKmer,gcKmer,null,nNull,gcNull,pretty,coor
0,CTTGGCGTAGTCCG,2,0.64,CGTAGCGTAGTCCG,1,0.64,.G.A..........,
1,CTTGGCGAATATAG,2,0.43,CGTCGCGAATATAG,1,0.5,.G.C..........,
2,AAATTGCGCGTAAC,4,0.43,GAATCGCGCGTAAC,1,0.57,G...C.........,
3,TTGGGCGCCGCAAT,2,0.64,TTGCGCGCCGTAAT,1,0.57,...C......T...,
4,TTGGGTTCGGCGAC,2,0.64,ATGCGTTCGGCGAC,1,0.64,A..C..........,
5,TTGGGAATCGCGCG,2,0.64,TAGCGAATCGCGCG,1,0.64,.A.C..........,
6,TTGGGCGCGAATTA,2,0.5,TTGCGCGCGAGTTA,1,0.57,...C......G...,
7,AATTTTGCGCGTCT,2,0.43,AATTTCGCGCGTCC,1,0.57,.....C.......C,
8,GGGCCGATCGTGCG,2,0.79,GGGTCGATCGTACG,1,0.64,...T.......A..,
9,GGGCCTATTCGGAC,2,0.64,GCGCGTATTCGGAC,1,0.64,.C..G.........,


In [18]:
def dissectFaId(line):
    """
    dissect mutated fa id line for kmer, nullomer information, and get the coordinate file
    """
    # process the line
    kmer, null_index = line.strip('\n').strip(">").split(".")
            
    # get key and value sequence to look up
    key, value_seq = kmer[:5], kmer[5:]

    coor_file = os.path.join(COOR, f"{key}_coor.csv.gz")
    
    return kmer, key, value_seq, coor_file

In [19]:
def getCoor(value_seq, coor_file):
    """
    get coordinates that match to a kmer
    """
    
    with gzip.open(coor_file, "rt") as reader:
        for line in reader:
            seq = line.strip('\n').split(",")[0]
            regions = ",".join(line.strip('\n').split(",")[1:])
            
            if seq == value_seq:
                return regions

# add kmer coordinates 

In [62]:
with open(FA_MUT, "r") as fasta_reader:
    out = FA_MUT.strip(".fa") + ".ext4096.fa"
    
    for values in SimpleFastaParser(fasta_reader):
        
        # parse fasta
        name, null = values
        
        # get kmer information
        kmer, key, value_seq, coor_file = dissectFaId(name)
        
        # regions linked to kmer
        region_str = getCoor(value_seq, coor_file)
        print(kmer, region_str)
        tsv.loc[tsv["kmer"]==kmer, "coor"] = region_str


GACTATCGTGCGCG chr1:110145315-110145515_+,chr1:110145315-110145515_-,
GACTACGGTCTACG chr1:116160053-116160253_+,chr1:116160053-116160253_-,
GACTACCATCGACC chr10:38036108-38036308_+,chr10:38036108-38036308_-,
GACTAGCGAGCGTA chr22:40675835-40676035_+,chr22:40675835-40676035_-,
GACTATCGCCCGGA chr7:102400460-102400660_+,chr7:102400475-102400675_+,chr7:102400460-102400660_-,chr7:102400475-102400675_-,
ACTAGCCGGACGCG chr14:48384041-48384241_+,chr14:48384041-48384241_-,
ACTAGCCAGCGCGT chr16:74035752-74035952_+,chr16:74035752-74035952_-,
ACTAGCGTCGTCCG chr17:36355607-36355807_+,chr17:36355607-36355807_-,
ACTAGGCCAGTTCG chr19:13402663-13402863_+,chr19:13402663-13402863_-,
ACTAGACGGCGCAA chr19:21341626-21341826_+,chr19:21341626-21341826_-,
ACTAGGCCGTCTAC chr5:141625691-141625891_+,chr5:141625691-141625891_-,
ACTAGCGAGCCGCG chr9:138722654-138722854_+,chr9:138722654-138722854_-,
ACTAGAAGGCGCGT chr9:19477488-19477688_+,chr9:19477488-19477688_-,
CTAGACGGGCGAAT chr1:185643147-185643347_+,chr1:1856431

TCGTCCGGGATCGT chr14:16754977-16755176_+,chr14:16754977-16755176_-,
TCGTCGCGAACGAT chr15:49189034-49189234_+,chr15:49189034-49189234_-,
TCGTCGCGAACGAT chr15:49189034-49189234_+,chr15:49189034-49189234_-,
TCGTCGCGAACGAT chr15:49189034-49189234_+,chr15:49189034-49189234_-,
TCGTCGCGAACGAT chr15:49189034-49189234_+,chr15:49189034-49189234_-,
TCGTCCGTCCCGTC chr15:76674926-76675126_+,chr15:76674926-76675126_-,
TCGTCAGTCATAAT chr16:136102-136302_+,chr16:136102-136302_-,
TCGTCCAGCAACGT chr16:22090782-22090982_+,chr16:22090782-22090982_-,
TCGTCCGTGTAGCG chr17:46583909-46584109_+,chr17:46583915-46584115_+,chr17:46583909-46584109_-,chr17:46583915-46584115_-,
TCGTCGCTCGCGGA chr17:65970592-65970792_+,chr17:65970624-65970824_+,chr17:65970592-65970792_-,chr17:65970624-65970824_-,
TCGTCCCGTGCGCG chr17:9483479-9483679_+,chr17:9483479-9483679_-,
TCGTCGCTAGACGG chr18:7080652-7080852_+,chr18:7080652-7080852_-,
TCGTCACGTTGAAC chr18:75776490-75776690_+,chr18:75776490-75776690_-,
TCGTCCGCGTGGGA chr19:3936284

CGTCGAAGGGCGCT chr22:46747942-46748142_+,chr22:46747942-46748142_-,
CGTCGAAGGGCGCT chr22:46747942-46748142_+,chr22:46747942-46748142_-,
CGTCGTCGCTAGCG chr3:138941926-138942126_+,chr3:138941926-138942126_-,
CGTCGCCTCGCGCA chr3:155932783-155932983_+,chr3:155932783-155932983_-,
CGTCGAGTCCAACC chr3:189567816-189568016_+,chr3:189567816-189568016_-,
CGTCGCGTGGTGCG chr3:198367595-198367795_+,chr3:198367595-198367795_-,
CGTCGAGTCCCGAC chr4:3673916-3674116_+,chr4:3673916-3674116_-,
CGTCGGTCGCTAGC chr5:136551387-136551587_+,chr5:136551387-136551587_-,
CGTCGGCGGAGCGT chr5:164040599-164040799_+,chr5:164040599-164040799_-,
CGTCGGCGGAGCGT chr5:164040599-164040799_+,chr5:164040599-164040799_-,
CGTCGATCTTCCTT chr5:16460921-16461121_+,chr5:16460921-16461121_-,
CGTCGTAGTGCGCA chr5:80891830-80892030_+,chr5:80891830-80892030_-,
CGTCGCGTGAGACG chr6:170233547-170233747_+,chr6:170233572-170233772_+,chr6:170233547-170233747_-,chr6:170233572-170233772_-,
CGTCGCGTGAGACG chr6:170233547-170233747_+,chr6:170233572

TCGCTAAGCGCGAG chr6:3029850-3030050_+,chr6:3029850-3030050_-,
TCGCTCACGCGCCG chr6:31592964-31593164_+,chr6:31592964-31593164_-,
TCGCTCGGTGGATG chr7:103650459-103650659_+,chr7:103650459-103650659_-,
TCGCTACCGACCCC chr7:25704410-25704610_+,chr7:25704410-25704610_-,
TCGCTGCTCGTCGC chr7:43046471-43046671_+,chr7:43046548-43046748_+,chr7:43046471-43046671_-,chr7:43046548-43046748_-,
TCGCTGGTTTATCG chr7:100739131-100739331_+,chr7:100739131-100739331_-,
TCGCTTCGTGGGAA chr9:117143455-117143655_+,chr9:117143455-117143655_-,
TCGCTACCCGAGGG chr9:138829064-138829264_+,chr9:138829064-138829264_-,
TCGCTACTTCGCCC chr9:145236580-145236780_+,chr9:145236580-145236780_-,
TCGCTCGGCGGAGC chrX:39510268-39510468_+,chrX:39510268-39510468_-,
TCGCTACGTACTCT chrX:47983424-47983624_+,chrX:47983424-47983624_-,
CGCTGCCGCGTACG chr1:15648294-15648494_+,chr1:15648294-15648494_-,
CGCTGCTTATAATA chr10:50372777-50372977_+,chr10:50372777-50372977_-,
CGCTGGATCTACGT chr10:70435932-70436132_+,chr10:70435932-70436132_-,
CGCTGA

CTTGGCGAATATAG chr4:97936775-97936975_+,chr4:97936775-97936975_-,
AAATTGCGCGTAAC chr3:100743096-100743296_+,chr3:100743099-100743299_+,chr3:100743096-100743296_-,chr3:100743099-100743299_-,
TTGGGCGCCGCAAT chr11:2239158-2239358_+,chr11:2239158-2239358_-,
TTGGGTTCGGCGAC chr19:11489403-11489603_+,chr19:11489403-11489603_-,
TTGGGAATCGCGCG chr20:21159756-21159956_+,chr20:21159756-21159956_-,
TTGGGCGCGAATTA chr6:49305248-49305448_+,chr6:49305248-49305448_-,
AATTTTGCGCGTCT chr9:134662540-134662740_+,chr9:134662540-134662740_-,
GGGCCGATCGTGCG chr1:29103313-29103513_+,chr1:29103313-29103513_-,
GGGCCTATTCGGAC chr1:33156762-33156962_+,chr1:33156762-33156962_-,
GGGCCACGCCAATA chr12:121930406-121930606_+,chr12:121930406-121930606_-,
GGGCCGAGCGAACT chr17:37795459-37795659_+,chr17:37795459-37795659_-,
GGGCCGAAACCGGT chr8:134335719-134335919_+,chr8:134335719-134335919_-,
TGGGCCGCGTCGTA chr1:15668837-15669037_+,chr1:15668837-15669037_-,
TGGGCGATGATAGC chr16:19532301-19532502_+,chr16:19532301-19532502_-

AGGTGGTTAAGCGT chr2:169617563-169617763_+,chr2:169617563-169617763_-,
AGGTGGCGAATACG chr2:203070193-203070393_+,chr2:203070193-203070393_-,
AGGTGGCGACGTTA chr3:144873579-144873779_+,chr3:144873579-144873779_-,
AGGTGCGCGATATA chr4:11559066-11559266_+,chr4:11559066-11559266_-,
TGGTTGCCACCGGA chr1:217519863-217520063_+,chr1:217519863-217520063_-,
TGGTTACGGCGGAC chr1:60935953-60936153_+,chr1:60935953-60936153_-,
TGGTTAGTCGAAAG chr10:102338198-102338398_+,chr10:102338198-102338398_-,
TGGTTCGCGCACGC chr11:65218965-65219169_+,chr11:65218965-65219169_-,
TGGTTCCCGATCGT chr19:39164696-39164896_+,chr19:39164696-39164896_-,
TGGTTGTACCAACG chr20:65606057-65606257_+,chr20:65606057-65606257_-,
TGGTTACGCTCGCG chr5:135556207-135556407_+,chr5:135556207-135556407_-,
TGGTTGACGAACCA chr5:150964718-150964918_+,chr5:150964718-150964918_-,
TGGTTCATCGACCA chr6:80956468-80956668_+,chr6:80956468-80956668_-,
TGGTTGGCGCGATA chr9:126184887-126185087_+,chr9:126184887-126185087_-,
GGTTGCGCGGATTC chr11:124774525-12477

CTGTACACTGTTCG chr12:51340049-51340249_+,chr12:51340049-51340249_-,
CTGTACGTTAGAGC chr16:89936644-89936844_+,chr16:89936644-89936844_-,
CTGTAAACCGGACG chr4:8466505-8466705_+,chr4:8466505-8466705_-,
CTGTATCCAACGTA chr5:131936917-131937117_+,chr5:131936917-131937117_-,
CTGTAGTCGGTAGG chr5:142682468-142682668_+,chr5:142682468-142682668_-,
CTGTACGCGCGCTG chr7:5091691-5091891_+,chr7:5091691-5091891_-,
CTGTACCGTCGCGA chr8:98403579-98403779_+,chr8:98403579-98403779_-,
CTGTATACCGCGCA chr9:149394245-149394445_+,chr9:149394245-149394445_-,
ACTCCGCCGACGAC chr15:34623939-34624139_+,chr15:34623939-34624139_-,
ACTCCATCGTCGCG chr15:39391762-39391962_+,chr15:39391762-39391962_-,
ACTCCATCGTCGCG chr15:39391762-39391962_+,chr15:39391762-39391962_-,
TGTAGCGCGATCGG chr1:160965905-160966105_+,chr1:160965905-160966105_-,
TGTAGCGCGATCGG chr1:160965905-160966105_+,chr1:160965905-160966105_-,
TGTAGTCGGCGCCC chr1:9130235-9130435_+,chr1:9130235-9130435_-,
TGTAGCTACGTCTA chr12:106703013-106703213_+,chr12:106703013

GACAGCGCGGCGTG chr19:17595559-17595759_+,chr19:17595559-17595759_-,
GACAGTCGTATCTG chr22:46596464-46596664_+,chr22:46596464-46596664_-,
CTACTCGTACGGCT chr19:57060588-57060788_+,chr19:57060588-57060788_-,
CTACTATCAACGCG chr22:22126441-22126641_+,chr22:22126441-22126641_-,
CTACTACGAACCGC chr9:96106707-96106907_+,chr9:96106707-96106907_-,
ACAGATAGTCTACG chr10:57998250-57998450_+,chr10:57998250-57998450_-,
ACAGATAGTCTACG chr10:57998250-57998450_+,chr10:57998250-57998450_-,
ACAGATTTACACGC chr16:63114307-63114507_+,chr16:63114307-63114507_-,
ACAGAGGTCGACGC chr19:57006309-57006509_+,chr19:57006309-57006509_-,
ACAGACGCGCGCCG chr5:139003280-139003480_+,chr5:139003280-139003480_-,
ACAGATGGGCACGA chr6:7131714-7131914_+,chr6:7131714-7131914_-,
TACTCGACTCGATA chr1:225595957-225596157_+,chr1:225595957-225596157_-,
TACTCGACTCGATA chr1:225595957-225596157_+,chr1:225595957-225596157_-,
TACTCGTGCCGCGC chr1:234552851-234553051_+,chr1:234552851-234553051_-,
TACTCCGTGGGCGT chr10:121137868-121138068_+,chr10

AGGAACACGTACCG chr4:60685753-60685953_+,chr4:60685753-60685953_-,
GAGGACGTCGCGAC chr13:110237126-110237326_+,chr13:110237126-110237326_-,
GAGGAGACGTATCG chr17:4529294-4529494_+,chr17:4529294-4529494_-,
GAGGATGACGCGAC chrX:47436907-47437107_+,chrX:47436907-47437107_-,
GGAAACGCCGCGGA chr10:68632503-68632703_+,chr10:68632503-68632703_-,
GGAAATCCGACGAT chr10:8051587-8051787_+,chr10:8051587-8051787_-,
GGAAACGCATTTCG chr13:27138443-27138643_+,chr13:27138443-27138643_-,
GGAAACGCGATTCG chr5:111602826-111603026_+,chr5:111602826-111603026_-,
GGAAACGCGATTCG chr5:111602826-111603026_+,chr5:111602826-111603026_-,
AGGATAGGTGGCGT chr13:36091944-36092144_+,chr13:36091944-36092144_-,
AGGATCGGGAACCG chr17:37795118-37795318_+,chr17:37795118-37795318_-,
AGGATCGCGATCGC chr20:40461729-40461929_+,chr20:40461729-40461929_-,
AGAACGAGTATCGA chr1:153471568-153471768_+,chr1:153471568-153471768_-,
AGAACGCGCTGACG chr1:211803906-211804106_+,chr1:211803906-211804106_-,
AGAACTGCGCTCGG chr13:107824087-107824287_+,chr13

AGAAGCGCCGTACG chr11:26737738-26737938_+,chr11:26737738-26737938_-,
AGAAGCGCCGTACG chr11:26737738-26737938_+,chr11:26737738-26737938_-,
AGAAGTCTCTCGCG chr13:24294046-24294246_+,chr13:24294046-24294246_-,
AGAAGTCGCTCGCG chr20:25863752-25863952_+,chr20:25863752-25863952_-,
AGAAGTCGCTCGCG chr20:25863752-25863952_+,chr20:25863752-25863952_-,
TATCCGCTCGGTTA chr1:120428181-120428381_+,chr1:120428181-120428381_-,
TATCCGCCGCGCGC chr1:227653152-227653352_+,chr1:227653152-227653352_-,
TATCCGCCGCGCGC chr1:227653152-227653352_+,chr1:227653152-227653352_-,
TATCCGCCTAATCG chr1:229556798-229556998_+,chr1:229556798-229556998_-,
TATCCGGGGGCGAT chr1:233541369-233541569_+,chr1:233541369-233541569_-,
TATCCTCGCCGGCG chr10:70445945-70446145_+,chr10:70445945-70446145_-,
TATCCCCGATCCCT chr10:75420215-75420415_+,chr10:75420215-75420415_-,
TATCCTACCGCCAT chr15:95520849-95521049_+,chr15:95520849-95521049_-,
TATCCGGCTTAAGG chr16:3050507-3050707_+,chr16:3050507-3050707_-,
TATCCCCGAGATTA chr16:66314569-66314769_+,c

TCCATCGCTCGATA chr6:28700056-28700256_+,chr6:28700056-28700256_-,
TCCATATGTCGTCT chr8:134147188-134147388_+,chr8:134147188-134147388_-,
TCCATCGTGCCGCG chrX:133377423-133377623_+,chrX:133377423-133377623_-,
CCATGTATCGACCC chr2:101273292-101273492_+,chr2:101273292-101273492_-,
CCATGCGCGCGTCC chr7:119530287-119530487_+,chr7:119530287-119530487_-,
CCATGGACGATCGC chr9:6710992-6711192_+,chr9:6710992-6711192_-,
CCATGGACGATCGC chr9:6710992-6711192_+,chr9:6710992-6711192_-,
CCATGGAAATCGCG chr9:95368927-95369127_+,chr9:95368927-95369127_-,
CCATGGACGCACGT chr9:103056086-103056286_+,chr9:103056086-103056286_-,
TGGTCGGCGTGTAA chr12:62792077-62792277_+,chr12:62792077-62792277_-,
TGGTCCGTGCGCGA chr15:47429254-47429455_+,chr15:47429254-47429455_-,
TGGTCGCGCGACAC chr19:1847470-1847670_+,chr19:1847470-1847670_-,
TGGTCGACCTTAGA chr19:23416545-23416745_+,chr19:23416545-23416745_-,
TGGTCCGGGCGAAT chr19:56005917-56006117_+,chr19:56005917-56006117_-,
TGGTCTCTGGACCG chr2:196725352-196725552_+,chr2:196725352-1

GTGGAGCACAACGT chr7:76092972-76093172_+,chr7:76092972-76093172_-,
GTGGACGTGATAGG chr8:144084029-144084229_+,chr8:144084029-144084229_-,
GTGGAGCGTAGGAC chr9:21979901-21980101_+,chr9:21979901-21980101_-,
GTGGACCGTTGTCG chrX:259547-259747_+,chrX:259547-259747_-,
GTGGAACGGCATTC chrX:67570440-67570640_+,chrX:67570440-67570640_-,
TGGAACTACGCTCC chr19:1876528-1876728_+,chr19:1876528-1876728_-,
TGGAATCAGTACGC chr19:35567628-35567828_+,chr19:35567628-35567828_-,
TGGAAACCCGGTCG chr3:13763642-13763842_+,chr3:13763642-13763842_-,
TGGAAGGATGCGCG chr4:168304512-168304712_+,chr4:168304512-168304712_-,
GGAATCACATCGGT chr10:33955897-33956097_+,chr10:33955897-33956097_-,
GGAATGCGCGCGAC chr11:1454206-1454406_+,chr11:1454206-1454406_-,
GGAATAGTGGCGCG chr17:14686192-14686392_+,chr17:14686192-14686392_-,
GGAATGCGACGGCG chr19:20560901-20561101_+,chr19:20560901-20561101_-,
GGAATCGCGCTACA chr3:187589212-187589412_+,chr3:187589212-187589412_-,
GGAATCGGAGCGTC chr5:89146906-89147106_+,chr5:89146906-89147106_-,
GA

TGACTTACGTCGTA chr3:191390932-191391132_+,chr3:191390932-191391132_-,
GACTCTTCTCGCGA chr1:111463932-111464132_+,chr1:111463932-111464132_-,
GACTCGTTACACAC chr11:36684308-36684508_+,chr11:36684308-36684508_-,
GACTCAACGCCTAT chr16:3998662-3998862_+,chr16:3998662-3998862_-,
GACTCGTACGACGT chr16:761474-761674_+,chr16:761474-761674_-,
GACTCGCCGATTGG chr19:43434559-43434759_+,chr19:43434559-43434759_-,
GACTCGTAAATTCG chr2:165858674-165858874_+,chr2:165858674-165858874_-,
TGGCCGATGACGGC chr16:3190061-3190268_+,chr16:3190061-3190268_-,
TGGCCGAATCCGGT chr17:44836672-44836872_+,chr17:44836672-44836872_-,
TGGCCCGTAACGTC chr17:50651675-50651875_+,chr17:50651675-50651875_-,
TGGCCGCTCGTCCG chr17:9553177-9553377_+,chr22:41672631-41672831_+,chr17:9553177-9553377_-,chr22:41672631-41672831_-,
TGGCCCCTCGACCG chr19:12907257-12907458_+,chr19:12907257-12907458_-,
TGGCCCACTAATCG chr3:187542922-187543122_+,chr3:187542922-187543122_-,
TGGCCGACGATCGC chr4:26650016-26650216_+,chr4:26650016-26650216_-,
TGGCCGAACG

GTATGACGATTCCG chr7:39020733-39020933_+,chr7:39020733-39020933_-,
GTATGGTCCGTGGA chr9:23444659-23444859_+,chr9:23444659-23444859_-,
TATGTTTCCGCCCG chr1:121030104-121030304_+,chr1:148836684-148836884_+,chr1:121030104-121030304_-,chr1:148836684-148836884_-,
TATGTGCCGAACGA chr1:70623277-70623477_+,chr1:70623277-70623477_-,
TATGTGAATGGCGC chr12:107368716-107368916_+,chr12:107368743-107368943_+,chr12:107368716-107368916_-,chr12:107368743-107368943_-,
TATGTCGCATACAA chr14:86821069-86821269_+,chr14:86821069-86821269_-,
TATGTGGATTGCGA chr3:139773523-139773723_+,chr3:139773523-139773723_-,
TATGTCCGTATGCG chr9:108211932-108212132_+,chr9:108211932-108212132_-,
TATGTCCGTATGCG chr9:108211932-108212132_+,chr9:108211932-108212132_-,
ATGTGGAACCTCGT chr22:24968611-24968815_+,chr22:24968611-24968815_-,
TGTGACCGCGCGGA chr7:22991285-22991485_+,chr7:22991285-22991485_-,
GAGTGACGCGTCAA chr1:40520374-40520574_+,chr1:40520374-40520574_-,
GAGTGTATCGCGCG chr17:65016290-65016490_+,chr17:65016337-65016537_+,chr17

TATCTGCCCAGCGA chr5:172154935-172155135_+,chr5:172154935-172155135_-,
TATCTGGGGACGAC chr6:35519092-35519292_+,chr6:35519092-35519292_-,
TATCTACTGACGTT chr8:93142499-93142699_+,chr8:93142499-93142699_-,
TATCTCGGAGCCGC chrX:128276180-128276380_+,chrX:128276180-128276380_-,
TATCTCGCGCCTCG chrX:47029641-47029841_+,chrX:47029641-47029841_-,
ATCTCTGGACGAAT chr10:22408947-22409147_+,chr10:22408947-22409147_-,
ATCTCCGGAGCGAC chr12:7974930-7975130_+,chr12:7974930-7975130_-,
ATCTCTATCCGACA chr2:219484465-219484665_+,chr2:219484465-219484665_-,
ATCTCAGCGTATCA chr2:231849821-231850021_+,chr2:231849821-231850021_-,
ATCTCACCGCGAGG chr3:197957412-197957612_+,chr3:197957412-197957612_-,
ATCTCGGACGATGC chr3:44011985-44012185_+,chr3:44011985-44012185_-,
ATCTCGCAACGCAA chr7:26993207-26993407_+,chr7:26993207-26993407_-,
ATCTCGCAACGCAA chr7:26993207-26993407_+,chr7:26993207-26993407_-,
ATCTCGTAGGCGAC chr8:145692541-145692741_+,chr8:145692541-145692741_-,
ATCTCGGCCAATCG chr9:143582917-143583117_+,chr9:14358

GACGCGCGTCGAAT chrX:53333728-53333928_+,chrX:53333728-53333928_-,
GACGCGCGTCGAAT chrX:53333728-53333928_+,chrX:53333728-53333928_-,
ACGCAAGGATGGGG chr11:110473461-110473661_+,chr11:110473461-110473661_-,
ACGCAGACGAACTA chr11:15790793-15790993_+,chr11:15790793-15790993_-,
ACGCACGCGCGGAT chr11:44192744-44192944_+,chr11:44192747-44192947_+,chr11:44192744-44192944_-,chr11:44192747-44192947_-,
ACGCACTTACTAGT chr12:31368363-31368563_+,chr12:31368363-31368563_-,
ACGCAGAGCGCGCG chr13:20491069-20491269_+,chr13:20491098-20491298_+,chr13:20491069-20491269_-,chr13:20491098-20491298_-,
ACGCACGTACTCGT chr14:88308471-88308671_+,chr14:88308471-88308671_-,
ACGCACGGCGATAT chr20:35856111-35856311_+,chr20:35856111-35856311_-,
ACGCAACATATCGT chr4:82289767-82289967_+,chr4:82289774-82289974_+,chr4:82289767-82289967_-,chr4:82289774-82289974_-,
ACGCATAACGTCTG chr5:112660306-112660506_+,chr5:112660306-112660506_-,
ACGCAGCGCGTAAT chr5:138705213-138705413_+,chr5:138705213-138705413_-,
ACGCATAACGCTGT chr6:16960806

CGAGAGAGGGACCG chr3:140915418-140915617_+,chr3:140915418-140915617_-,
CGAGACGCGTCGCC chr3:13895454-13895654_+,chr3:13895454-13895654_-,
CGAGAAGTCGGCCG chr3:97640692-97640892_+,chr3:97640692-97640892_-,
CGAGACGCGCCGGT chr5:20307476-20307676_+,chr5:20307476-20307676_-,
CGAGAATTCGAGCG chr6:161772085-161772285_+,chr6:161772085-161772285_-,
CGAGATTTCAATAG chr6:52502466-52502666_+,chr6:52502466-52502666_-,
CGAGATTCCACCGT chr7:75684946-75685146_+,chr7:75684946-75685146_-,
CGAGAAATCTCGCG chr8:67455006-67455206_+,chr8:67455006-67455206_-,
CGAGAGTATATCAC chr8:75296203-75296403_+,chr8:75296203-75296403_-,
CGAGACTTGTCACG chrX:23339825-23340025_+,chrX:23339825-23340025_-,
GGAACGACCACGAA chr1:26995680-26995880_+,chr1:26995680-26995880_-,
GGAACAGTTGCGCG chr19:34746226-34746426_+,chr19:34746226-34746426_-,
GGAACGAAAGGCGT chr19:57102477-57102677_+,chr19:57102477-57102677_-,
GGAACCGCGTTACG chr2:235056592-235056790_+,chr2:235056592-235056790_-,
GGAACTACGGTAGA chr7:75852399-75852599_+,chr7:75852399-758525

CGGCGCTACGGCTA chr14:14830149-14830344_+,chr14:14830149-14830344_-,
CGGCGAGCCGTCGC chr14:71335106-71335306_+,chr14:71335106-71335306_-,
CGGCGGTCGAAAGA chr15:20386672-20386872_+,chr15:20386672-20386872_-,
CGGCGTCGCGAACA chr15:38735413-38735613_+,chr15:38735413-38735613_-,
CGGCGTCGCGAACA chr15:38735413-38735613_+,chr15:38735413-38735613_-,
CGGCGGCGCGTAGT chr16:30072797-30072997_+,chr16:30072797-30072997_-,
CGGCGGATCGGAAC chr16:31830087-31830287_+,chr16:31830087-31830287_-,
CGGCGGGAACGATT chr16:60088547-60088747_+,chr16:60088547-60088747_-,
CGGCGGGAACGATT chr16:60088547-60088747_+,chr16:60088547-60088747_-,
CGGCGTATCAGACG chr16:74316546-74316746_+,chr16:74316546-74316746_-,
CGGCGTTGCGCGTC chr17:37468873-37469073_+,chr17:37468873-37469073_-,
CGGCGAACTGCGGT chr17:46075417-46075617_+,chr17:46075417-46075617_-,
CGGCGGCCTACGTA chr17:62279715-62279915_+,chr17:62279715-62279915_-,
CGGCGGCCTACGTA chr17:62279715-62279915_+,chr17:62279715-62279915_-,
CGGCGGCCTACGTA chr17:62279715-62279915_+,chr17:6

GCGCGTAACGACTG chr13:49344442-49344642_+,chr13:49344442-49344642_-,
GCGCGTCCCGACCG chr15:32559817-32560017_+,chr15:32559817-32560017_-,
GCGCGAGAAATCGC chr15:76300685-76300885_+,chr15:76300685-76300885_-,
GCGCGAGAAATCGC chr15:76300685-76300885_+,chr15:76300685-76300885_-,
GCGCGTAGGATGTA chr16:27884371-27884571_+,chr16:27884371-27884571_-,
GCGCGTTGGCTGAT chr16:29431302-29431502_+,chr16:29431302-29431502_-,
GCGCGTTAAAGCGA chr16:3177075-3177275_+,chr16:3177075-3177275_-,
GCGCGTAGCCGGAA chr16:54040967-54041167_+,chr16:54040967-54041167_-,
GCGCGTCGGAGGTA chr16:56539622-56539822_+,chr16:56539622-56539822_-,
GCGCGGTTAATCCA chr17:1092621-1092820_+,chr17:1092621-1092820_-,
GCGCGCCGAACGGC chr17:29260782-29260982_+,chr17:29260782-29260982_-,
GCGCGCCGAACGGC chr17:29260782-29260982_+,chr17:29260782-29260982_-,
GCGCGCCGCTTAAC chr17:45298806-45299006_+,chr17:45298806-45299006_-,
GCGCGTGACGTCCA chr17:4628970-4629170_+,chr17:4628970-4629170_-,
GCGCGTGGCCGGTA chr19:10421682-10421882_+,chr19:10421682-1042

CGCGGCGTACTACA chr3:28351162-28351362_+,chr3:28351162-28351362_-,
CGCGGCCAATCCAA chr3:46993074-46993274_+,chr3:46993074-46993274_-,
CGCGGAGCCTAACG chr3:75708949-75709149_+,chr3:75708949-75709149_-,
CGCGGGCGCAGACA chr4:191565574-191565774_+,chr4:191565574-191565774_-,
CGCGGACGCCCGCT chr4:24451931-24452145_+,chr4:24451931-24452145_-,
CGCGGTAGCACCGA chr5:127748929-127749129_+,chr5:127748929-127749129_-,
CGCGGATTGGTAGC chr5:138705213-138705413_+,chr5:138705213-138705413_-,
CGCGGGTCGAGCAA chr5:142375612-142375812_+,chr5:142375612-142375812_-,
CGCGGGTCGAGCAA chr5:142375612-142375812_+,chr5:142375612-142375812_-,
CGCGGAGGTCGACT chr5:167497358-167497558_+,chr5:167497358-167497558_-,
CGCGGATGCCGAGG chr5:80891830-80892030_+,chr5:80891830-80892030_-,
CGCGGGATTGAAGT chr6:11891179-11891379_+,chr6:11891179-11891379_-,
CGCGGCGGATGGGT chr6:149947111-149947311_+,chr6:149947111-149947311_-,
CGCGGAAGGATCGC chr6:151268349-151268549_+,chr6:151268349-151268549_-,
CGCGGTCGTCGGCT chr6:1483491-1483691_+,chr6:1

CCGCGTCGAGCGAC chr1:30654128-30654328_+,chr1:30654128-30654328_-,
CCGCGTCGAGCGAC chr1:30654128-30654328_+,chr1:30654128-30654328_-,
CCGCGTCGAGCGAC chr1:30654128-30654328_+,chr1:30654128-30654328_-,
CCGCGTCGAGCGAC chr1:30654128-30654328_+,chr1:30654128-30654328_-,
CCGCGTCGAGCGAC chr1:30654128-30654328_+,chr1:30654128-30654328_-,
CCGCGCGATCCGAA chr1:8716838-8717038_+,chr1:8716838-8717038_-,
CCGCGCTACGCGTA chr1:92143789-92143989_+,chr1:92143789-92143989_-,
CCGCGCTACGCGTA chr1:92143789-92143989_+,chr1:92143789-92143989_-,
CCGCGCTACGCGTA chr1:92143789-92143989_+,chr1:92143789-92143989_-,
CCGCGCTACGCGTA chr1:92143789-92143989_+,chr1:92143789-92143989_-,
CCGCGAATGACTAT chr10:3779280-3779480_+,chr10:3779280-3779480_-,
CCGCGTGAATAGCG chr10:92769316-92769516_+,chr10:92769316-92769516_-,
CCGCGTGCGCGATG chr11:44472196-44472396_+,chr11:44472196-44472396_-,
CCGCGTAGACGCGC chr11:47494196-47494396_+,chr11:47494196-47494396_-,
CCGCGACGGTCGCA chr11:75281123-75281323_+,chr11:75281123-75281323_-,
CCGCGAAG

ATTGGCGCGTCAAC chr5:31645814-31646014_+,chr5:31645814-31646014_-,
ATTGGGCGACGGTC chr7:92512115-92512315_+,chr7:92512119-92512319_+,chr7:92512115-92512315_-,chr7:92512119-92512319_-,
ATTGGCGCCTATAT chr8:120565952-120566152_+,chr8:120565952-120566152_-,
GCCACGACGACTCG chr1:167287341-167287541_+,chr1:167287341-167287541_-,
GCCACCGTATGGTA chr13:103325776-103325976_+,chr13:103325776-103325976_-,
GCCACGAACAGATA chr17:78016243-78016443_+,chr17:78016287-78016487_+,chr17:78016243-78016443_-,chr17:78016287-78016487_-,
GCCACGTATTACCT chr2:27454867-27455067_+,chr2:27454867-27455067_-,
GCCACGAACCGGTA chr8:131330655-131330855_+,chr8:131330655-131330855_-,
CCACGTAGTGCGAA chr1:15933083-15933283_+,chr1:15933083-15933283_-,
CCACGGATCATTAC chr1:34362258-34362458_+,chr1:34362258-34362458_-,
CCACGTATAAGGGA chr10:98988124-98988324_+,chr10:98988124-98988324_-,
CCACGATCGTGGGA chr12:4864839-4865039_+,chr12:4864848-4865048_+,chr12:4864839-4865039_-,chr12:4864848-4865048_-,
CCACGCGTAACGCT chr17:59499858-59500058

CGTCCGGGATCGCG chr4:59537779-59537979_+,chr4:59537779-59537979_-,
CGTCCTCCAATCCG chr5:31645814-31646014_+,chr5:31645814-31646014_-,
CGTCCGGCGAGCGA chr5:36940209-36940409_+,chr5:36940209-36940409_-,
CGTCCGGCGAGCGA chr5:36940209-36940409_+,chr5:36940209-36940409_-,
CGTCCGGCGAGCGA chr5:36940209-36940409_+,chr5:36940209-36940409_-,
CGTCCGGCGCAACC chr5:73932696-73932896_+,chr5:73932696-73932896_-,
CGTCCCGCGGATAC chr6:7395914-7396114_+,chr6:7395914-7396114_-,
CGTCCGAACGTAGC chr7:140813399-140813599_+,chr7:140813399-140813599_-,
CGTCCGTATGCGCG chr7:23610335-23610535_+,chr7:23610335-23610535_-,
CGTCCGTATGCGCG chr7:23610335-23610535_+,chr7:23610335-23610535_-,
CGTCCGTATGCGCG chr7:23610335-23610535_+,chr7:23610335-23610535_-,
CGTCCGGCCAAACG chr7:75549762-75549962_+,chr7:75549762-75549962_-,
CGTCCCGTCAGAAG chr7:900968-901168_+,chr7:900968-901168_-,
CGTCCGTCCGGTCG chr8:123864826-123865026_+,chr8:123864835-123865035_+,chr8:123864826-123865026_-,chr8:123864835-123865035_-,
CGTCCCGCACAACG chr9:145768

AGCCCGCGTAACGT chr18:24592031-24592231_+,chr18:24592031-24592231_-,
AGCCCGTTAGCGCG chr22:21878461-21878661_+,chr22:21878461-21878661_-,
AGCCCGTCGACCGA chr6:57011167-57011367_+,chr6:57011167-57011367_-,
AGCCCGTCGACCGA chr6:57011167-57011367_+,chr6:57011167-57011367_-,
AGCCCTTCGACGCG chrX:46642552-46642752_+,chrX:46642552-46642752_-,
GCCCCGATTACCGA chr11:44475102-44475302_+,chr11:44475102-44475302_-,
GCCCCGATCGAGTG chr12:114372696-114372896_+,chr12:114372696-114372896_-,
GCCCCGTCGACGAA chr12:3129047-3129247_+,chr12:3129047-3129247_-,
GCCCCGATACAGGT chr7:152147829-152148030_+,chr7:152147829-152148030_-,
CCCCGTCGCGCGTA chr1:46366882-46367082_+,chr1:46366882-46367082_-,
CCCCGCGCGCTATA chr1:94389694-94389894_+,chr1:94389694-94389894_-,
CCCCGCGCGCTATA chr1:94389694-94389894_+,chr1:94389694-94389894_-,
CCCCGCGCGCTATA chr1:94389694-94389894_+,chr1:94389694-94389894_-,
CCCCGTTCGATCCT chr10:35407171-35407371_+,chr10:35407171-35407371_-,
CCCCGTCCTATGAT chr16:5121861-5122061_+,chr3:75482053-7548225

GACGGTCGGTCGGG chr14:69468085-69468285_+,chr14:69468085-69468285_-,
GACGGATAGTCCGT chr15:62842621-62842821_+,chr15:62842621-62842821_-,
GACGGAAGGACGTC chr17:304926-305126_+,chr17:304926-305126_-,
GACGGTGATAATCG chr2:11516310-11516512_+,chr2:11516310-11516512_-,
GACGGAGAACGACG chr2:23387029-23387229_+,chr2:23387029-23387229_-,
GACGGGCGACAAAG chr22:46351533-46351733_+,chr22:46351533-46351733_-,
GACGGACAATCAAC chr3:24675384-24675584_+,chr3:24675384-24675584_-,
GACGGCGGATCGTC chr4:113916866-113917066_+,chr4:113916866-113917066_-,
GACGGGACTTATCG chr5:181649588-181649788_+,chr5:181649588-181649788_-,
GACGGTGGAGACGA chr6:11467157-11467357_+,chr6:11467157-11467357_-,
GACGGTGCACGTTA chr7:50016761-50016961_+,chr7:50016761-50016961_-,
ACGGGCGAATCACG chr1:185643147-185643347_+,chr1:185643147-185643347_-,
ACGGGCGGATCGCG chr11:46706744-46706944_+,chr11:46706744-46706944_-,
ACGGGTCGGACACG chr11:47317903-47318103_+,chr11:47317903-47318103_-,
ACGGGTCTTACGCA chr15:25013006-25013206_+,chr15:25013006-2501

CGTGATGCGTACTA chr16:90804809-90805009_+,chr16:90804809-90805009_-,
CGTGAAGCGCGAGA chr17:82027707-82027923_+,chr17:82027827-82028027_+,chr17:82027707-82027923_-,chr17:82027827-82028027_-,
CGTGAACGCGCAAA chr19:47582949-47583149_+,chr19:47582949-47583149_-,
CGTGACGCGTGGGG chr19:47826052-47826252_+,chr19:47826052-47826252_-,
CGTGACGCCCTCGT chr2:242500056-242500256_+,chr2:242500056-242500256_-,
CGTGATACGGTGCG chr2:3325342-3325542_+,chr2:3325342-3325542_-,
CGTGATCGACGAGT chr2:70975972-70976172_+,chr2:70975972-70976172_-,
CGTGACGCGCCGGT chr22:24164493-24164693_+,chr22:24164495-24164695_+,chr22:24164493-24164693_-,chr22:24164495-24164695_-,
CGTGACGCGCCGGT chr22:24164493-24164693_+,chr22:24164495-24164695_+,chr22:24164493-24164693_-,chr22:24164495-24164695_-,
CGTGACGCGACTTA chr22:24164493-24164693_+,chr22:24164495-24164695_+,chr22:24164493-24164693_-,chr22:24164495-24164695_-,
CGTGAGTACCATCG chr3:145094888-145095088_+,chr3:145094888-145095088_-,
CGTGATAGACATCT chr4:191802340-191802540_+,chr4:1

GCCGCAACGCGACG chr9:35866973-35867173_+,chr9:35866973-35867173_-,
GCCCTTCGCGCGAT chr11:121317649-121317849_+,chr11:121317649-121317849_-,
GCCCTTCGCGCGAT chr11:121317649-121317849_+,chr11:121317649-121317849_-,
GCCCTATTCGCATA chr12:108840838-108841038_+,chr12:108840838-108841038_-,
GCCCTTCGACGGGA chr2:174499351-174499551_+,chr2:174499351-174499551_-,
GCCCTCTATAATCG chr3:162506859-162507059_+,chr3:162506859-162507059_-,
GCCCTACGACTCGC chr4:56032414-56032614_+,chr4:56032414-56032614_-,
GCCCTTCGACGCGT chrX:46642552-46642752_+,chrX:46642552-46642752_-,
GCCCTTCGACGCGT chrX:46642552-46642752_+,chrX:46642552-46642752_-,
GCCCTACTCGCCGA chrX:67126993-67127193_+,chrX:67126993-67127193_-,
GCCCTTCGCGCGCA chrY:8963877-8964077_+,chrY:8963877-8964077_-,
CTGTTCGGCCGCCG chr10:102023503-102023703_+,chr10:102023503-102023703_-,
CTGTTTCCACGACG chr16:27646952-27647152_+,chr16:27646952-27647152_-,
CTGTTCCTATAGCG chr2:44979400-44979600_+,chr2:44979400-44979600_-,
CTGTTCGCGTGTAA chr5:6752343-6752543_+,chr5:675

AGGGGTTCGATCAA chr2:60824144-60824344_+,chr2:60824144-60824344_-,
GGGGATACGCCGTG chr11:340647-340847_+,chr11:340647-340847_-,
GGGGACGGACCGTA chr16:54040967-54041167_+,chr16:54040967-54041167_-,
GGGGATGGCGACTA chr2:164560712-164560912_+,chr2:164560712-164560912_-,
GGGAACGGATTATG chr11:63010026-63010226_+,chr11:63010026-63010226_-,
GGGAACCTTACGCT chr14:67750590-67750790_+,chr14:67750590-67750790_-,
GGGAACGATCAAAG chr20:21137333-21137533_+,chr20:21137333-21137533_-,
GGGAATCGCGCGAG chr20:21159756-21159956_+,chr20:21159756-21159956_-,
GGGAACGCCTATCG chr7:139208548-139208749_+,chr7:139208548-139208749_-,
GAAAGCGCGGCGCA chr18:37021811-37022011_+,chr18:37021811-37022011_-,
GAAAGAGCGACGCG chr9:106334024-106334224_+,chr9:106334033-106334233_+,chr9:106334024-106334224_-,chr9:106334033-106334233_-,
AAGAGCCGACGCGA chr10:50459012-50459212_+,chr10:50459012-50459212_-,
AAGAGGCCCGTACG chr17:45905341-45905541_+,chr17:45905341-45905541_-,
AAGAGTGGTTCGAC chr20:10050701-10050901_+,chr20:10050701-10050901_-

AGGGATCGGCGATC chr6:28771654-28771854_+,chr6:28771654-28771854_-,
AAAGCGCGAACGCA chr1:120860185-120860386_+,chr1:143653828-143654028_+,chr1:143653810-143654010_+,chr1:120860185-120860386_-,chr1:143653828-143654028_-,chr1:143653810-143654010_-,
AAAGCGGTCCGTTA chr2:143152537-143152737_+,chr2:143152537-143152737_-,
AAGCGCAATATTCG chr12:77156783-77156983_+,chr13:43194670-43194870_+,chr2:197011161-197011361_+,chr8:75377799-75377999_+,chr12:77156783-77156983_-,chr13:43194670-43194870_-,chr2:197011161-197011361_-,chr8:75377799-75377999_-,
AAGCGTCGTAAGAC chr14:49418391-49418591_+,chr14:49418391-49418591_-,
AAGCGGCGTCGCGA chr15:38735413-38735613_+,chr15:38735413-38735613_-,
AAGCGGCGTCGCGA chr15:38735413-38735613_+,chr15:38735413-38735613_-,
AAGCGGCGTCGCGA chr15:38735413-38735613_+,chr15:38735413-38735613_-,
AAGCGACGCGGTAT chr15:56907033-56907233_+,chr15:56907033-56907233_-,
AAGCGCGACCGACC chr16:83778555-83778755_+,chr16:83778555-83778755_-,
AAGCGGTCGCGGGA chr3:187358925-187359125_+,chr3:1873589

ACCGCGCGTACCCG chr5:164040599-164040799_+,chr5:164040599-164040799_-,
ACCGCGGGAACGAA chr5:1559245-1559445_+,chr5:1559250-1559450_+,chr5:1559245-1559445_-,chr5:1559250-1559450_-,
ACCGCGCGTAACAG chr7:140813399-140813599_+,chr7:140813399-140813599_-,
ACCGCCATAACCAT chr7:2065973-2066173_+,chr7:2065973-2066173_-,
ACCGCGCGGACGGA chr7:22991285-22991485_+,chr7:22991285-22991485_-,
ACCGCGCGGACGGA chr7:22991285-22991485_+,chr7:22991285-22991485_-,
ACCGCCCGTCCGAT chr9:104973897-104974097_+,chr9:104973897-104974097_-,
CCGCAGCGACGTCG chr1:54920262-54920462_+,chr1:54920262-54920462_-,
CCGCACCCGTAACT chr10:62332281-62332481_+,chr10:62332281-62332481_-,
CCGCAACGTTCGCG chr11:67311663-67311863_+,chr11:67311663-67311863_-,
CCGCACGCCAAACG chr11:72007254-72007454_+,chr11:72007254-72007454_-,
CCGCATCGCGCGAG chr13:108316028-108316228_+,chr13:108316028-108316228_-,
CCGCATCGCGCGAG chr13:108316028-108316228_+,chr13:108316028-108316228_-,
CCGCACTAGCGTCG chr17:36355607-36355807_+,chr17:36355607-36355807_-,
CCGCAC

GCGGTGACCGTACT chr6:43892050-43892250_+,chr6:43892050-43892250_-,
GCGGTCTAGCCGCG chr7:1149278-1149478_+,chr7:1149278-1149478_-,
GCGGTATCTCGGCC chr9:143582917-143583117_+,chr9:143582917-143583117_-,
GCGGTATGTCGGGG chr9:36347573-36347773_+,chr9:36347573-36347773_-,
GCGGTCCTTACGTG chrX:15258257-15258475_+,chrX:15258257-15258475_+,chrX:15258257-15258475_-,chrX:15258257-15258475_-,
GCGGTCGCGCTACG chrX:17237935-17238135_+,chrX:17237935-17238135_-,
CGGTGTTACGCCCT chr1:180545346-180545546_+,chr1:180545346-180545546_-,
CGGTGGTTACGGCG chr1:60935953-60936153_+,chr1:60935953-60936153_-,
CGGTGCGCTCGGCG chr10:15737750-15737950_+,chr10:15737750-15737950_-,
CGGTGCGTGTCCCG chr10:69769893-69770093_+,chr10:69769893-69770093_-,
CGGTGAGTCGCATA chr11:102532820-102533020_+,chr11:102532820-102533020_-,
CGGTGGGAGTACGT chr11:36887856-36888056_+,chr11:36887858-36888058_+,chr11:36887856-36888056_-,chr11:36887858-36888058_-,
CGGTGCGCGTCCCG chr11:86978700-86978900_+,chr11:86978700-86978900_-,
CGGTGACGAGCGAC chr15:4

CAACCTTCGCGTCG chr20:10477156-10477356_+,chr20:10477156-10477356_-,
CAACCCGTGGACGC chr4:57723063-57723263_+,chr4:57723066-57723266_+,chr4:57723063-57723263_-,chr4:57723066-57723266_-,
CAACCGGGCTTACG chr9:136243569-136243769_+,chr9:136243569-136243769_-,
AACCATAGACGACT chr1:109750393-109750593_+,chr1:109750393-109750593_-,
AACCAACGCGCGTA chr10:117682418-117682618_+,chr10:117682418-117682618_-,
AACCAGGGTCGACG chr2:225491240-225491440_+,chr2:225491240-225491440_-,
AACCATCGAGGCCG chr7:158593963-158594163_+,chr7:158593963-158594163_-,
ACCAGTCGCGCGTG chr17:62268654-62268854_+,chr17:62268654-62268854_-,
ACCAGGGTCGACGC chr2:225491240-225491440_+,chr2:225491240-225491440_-,
ACCAGCGTGCGACC chr8:8059602-8059802_+,chr8:8059602-8059802_-,
GACGTACGCGAGCG chr10:131039427-131039627_+,chr10:131039427-131039627_-,
GACGTACGCGAGCG chr10:131039427-131039627_+,chr10:131039427-131039627_-,
GACGTCAAACCGTC chr10:15210640-15210840_+,chr10:15210640-15210840_-,
GACGTCCCTCGCGT chr11:118630296-118630496_+,chr11:118

TACGTCTCATCGGC chr7:157803270-157803470_+,chr7:157803270-157803470_-,
TACGTCATCGTAAG chr7:25997751-25997951_+,chr7:25997751-25997951_-,
TACGTTGTCCTACG chr7:28158133-28158333_+,chr7:28158133-28158333_-,
TACGTCGCCGGAAG chr7:77454056-77454256_+,chr7:77454056-77454256_-,
TACGTCGCCGGAAG chr7:77454056-77454256_+,chr7:77454056-77454256_-,
ACGTACATCCGCTA chr1:52285937-52286137_+,chr1:52285937-52286137_-,
ACGTAGTCCCCACG chr1:52584858-52585058_+,chr1:52584858-52585058_-,
ACGTAGTCCCCACG chr1:52584858-52585058_+,chr1:52584858-52585058_-,
ACGTATGATTGGCA chr1:57160391-57160591_+,chr1:57160391-57160591_-,
ACGTACGCGAGCGT chr10:131039427-131039627_+,chr10:131039427-131039627_-,
ACGTACCATCGGAC chr10:29152166-29152366_+,chr10:29152166-29152366_-,
ACGTACATCGCCCA chr10:8046038-8046238_+,chr10:8046038-8046238_-,
ACGTACCGATGACG chr11:133973041-133973241_+,chr11:133973041-133973241_-,
ACGTACCGATGACG chr11:133973041-133973241_+,chr11:133973041-133973241_-,
ACGTACGTGCACGA chr15:75764236-75764436_+,chr15:7576423

CCACCGATATCGAC chrX:147852496-147852696_+,chrX:147852496-147852696_-,
CCCTAACTGATCGC chr1:23454323-23454523_+,chr1:23454416-23454616_+,chr1:23454323-23454523_-,chr1:23454416-23454616_-,
CCCTACGCGCGTGT chr1:28423784-28423984_+,chr1:28423806-28424006_+,chr1:28423784-28423984_-,chr1:28423806-28424006_-,
CCCTATCCGTCCAA chr1:39901695-39901895_+,chr1:39901695-39901895_-,
CCCTATTCGGGACG chr1:9232729-9232929_+,chr1:9232729-9232929_-,
CCCTATTACGCAAT chr3:191166508-191166708_+,chr3:191166508-191166708_-,
CCCTATAGGAACCG chr5:169523339-169523539_+,chr5:169523339-169523539_-,
CCCTAGTGAACGAC chr7:142329099-142329299_+,chr7:142329099-142329299_-,
CCTAATAAGCGCGA chr10:68632503-68632703_+,chr10:68632503-68632703_-,
CCTAAAGTTCGACC chr10:73126186-73126386_+,chr10:73126186-73126386_-,
CCTAAGATTGCGAA chr12:113248781-113248981_+,chr12:113248781-113248981_-,
CCTAACGGGACGGT chr2:177037985-177038185_+,chr2:177037985-177038185_-,
CCTAACCGGTTACG chr2:188005643-188005843_+,chr2:188005643-188005843_-,
CCTAAGCGGTAC

TTTCCGCCACGAGT chr20:38329388-38329588_+,chr20:38329388-38329588_-,
TTTCCGGGCGACGC chr20:59128839-59129039_+,chr20:59128839-59129039_-,
TTTCCACGTTTGCG chr3:10977871-10978071_+,chr3:10977871-10978071_-,
TTTCCACGTGCGCG chr7:109894294-109894494_+,chr7:109894294-109894494_-,
TTTCCCCGTGCAAC chr7:96482813-96483013_+,chr7:96482813-96483013_-,
TTTCCACGTTCGAG chrX:22917560-22917760_+,chrX:22917560-22917760_-,
CCACTACTCGTACG chr19:57060588-57060788_+,chr19:57060588-57060788_-,
CCAGTAACGATGGG chr2:206266531-206266731_+,chr2:206266531-206266731_-,
CCAGTACGCCGATC chr5:103070305-103070505_+,chr5:103070305-103070505_-,
CCAGTACGACTCGA chr7:156586185-156586385_+,chr7:156586185-156586385_-,
CCAGTACGACTCGA chr7:156586185-156586385_+,chr7:156586185-156586385_-,
CCAGTACGACTCGA chr7:156586185-156586385_+,chr7:156586185-156586385_-,
CAGTGGCGTAATCG chr22:31896674-31896874_+,chr22:31896674-31896874_-,
CAGTGACGTCGCGA chr6:35551807-35552007_+,chr6:35551807-35552007_-,
CAGTGCGTCGCGCC chr9:146241241-146241441_+,ch

TCTTGGACTCGGCG chr17:82027707-82027923_+,chr17:82027707-82027923_-,
TCTTGAGGCGTAAC chr6:75751872-75752072_+,chr6:75751872-75752072_-,
CTTGTCGTAAGGCG chr10:111820657-111820857_+,chr10:111820657-111820857_-,
CTTGTACGATTGAC chr14:20031987-20032187_+,chr14:20031987-20032187_-,
CTTGTTAAGCGTCG chr19:54482877-54483077_+,chr19:54482956-54483156_+,chr19:54482957-54483157_+,chr19:54482877-54483077_-,chr19:54482956-54483156_-,chr19:54482957-54483157_-,
TTGTCGTGTCAGAC chr1:162238113-162238313_+,chr1:162238113-162238313_-,
TTGTCGCGGCGGGC chr1:199005099-199005299_+,chr1:199005099-199005299_-,
TTGTCCGCGCGTCA chr1:28423761-28423961_+,chr1:28423784-28423984_+,chr1:28423806-28424006_+,chr1:28423761-28423961_-,chr1:28423784-28423984_-,chr1:28423806-28424006_-,
TTGTCGCGTCTGGC chr1:64776126-64776326_+,chr1:64776126-64776326_-,
TTGTCGTAAGGCGG chr10:111820657-111820857_+,chr10:111820657-111820857_-,
TTGTCGTAAGGCGG chr10:111820657-111820857_+,chr10:111820657-111820857_-,
TTGTCGCTCTATAC chr11:76737791-76737992

TCTGTTACACGTCG chr5:16460921-16461121_+,chr5:16460921-16461121_-,
TCTGTTAGGACGAG chr7:103177224-103177424_+,chr7:103177224-103177424_-,
TGTTCCGCGACCGC chr1:225309815-225310015_+,chr1:225309815-225310015_-,
TGTTCACGCGTCGA chr14:17183014-17183214_+,chr14:17183014-17183214_-,
TGTTCGCCTAGTCG chr14:62725220-62725420_+,chr14:62725220-62725420_-,
TGTTCTCGCGGAGA chr16:73020989-73021189_+,chr16:73020989-73021189_-,
TGTTCGAGCTGACG chr17:81091625-81091825_+,chr17:81091625-81091825_-,
TGTTCCACCGGCTT chr18:5399486-5399686_+,chr18:5399486-5399686_-,
TGTTCGCGCGGCGA chr2:224428529-224428729_+,chr2:224428529-224428729_-,
TGTTCGCGCGGCGA chr2:224428529-224428729_+,chr2:224428529-224428729_-,
TGTTCGGGGTAACG chr4:24453645-24453845_+,chr4:24453645-24453845_-,
TGTTCGTCGAATCA chr6:169474371-169474571_+,chr6:169474371-169474571_-,
TGTTCGCTCGCAAC chr7:30732289-30732489_+,chr7:30732289-30732489_-,
TGTTCATCCGCGGT chr9:145452386-145452586_+,chr9:145452386-145452586_-,
GTTCGATTTACGCA chr1:155595147-155595347_+,chr1

CGTCGGTCTCGTAA chr16:14323156-14323356_+,chr17:32495756-32495956_+,chr16:14323156-14323356_-,chr17:32495756-32495956_-,
CGTCGGTCTCGTAA chr16:14323156-14323356_+,chr17:32495756-32495956_+,chr16:14323156-14323356_-,chr17:32495756-32495956_-,
CGTCGACTGTTCCG chr16:3006959-3007159_+,chr16:3006959-3007159_-,
CGTCGACTGTTCCG chr16:3006959-3007159_+,chr16:3006959-3007159_-,
CGTCGACTGTTCCG chr16:3006959-3007159_+,chr16:3006959-3007159_-,
CGTCGCCGCGAGAT chr16:89992408-89992608_+,chr16:89992408-89992608_-,
CGTCGCCGCGAGAT chr16:89992408-89992608_+,chr16:89992408-89992608_-,
CGTCGGGAAGTACA chr17:2613265-2613465_+,chr17:2613265-2613465_-,
CGTCGTGCGAACCG chr17:2742482-2742682_+,chr17:2742482-2742682_-,
CGTCGTGCGAACCG chr17:2742482-2742682_+,chr17:2742482-2742682_-,
CGTCGTGCGAACCG chr17:2742482-2742682_+,chr17:2742482-2742682_-,
CGTCGTGCGAACCG chr17:2742482-2742682_+,chr17:2742482-2742682_-,
CGTCGAGGCGCCAT chr17:50962223-50962424_+,chr17:50962223-50962424_-,
CGTCGCTCGCGGAT chr17:65970592-65970792_+,chr

GTCGCGGGCACGTA chr6:117734611-117734811_+,chr6:117734611-117734811_-,
GTCGCCGTTCAAAG chr6:127292705-127292905_+,chr6:127292705-127292905_-,
GTCGCTACTAGTCT chr6:145576808-145577008_+,chr6:145576808-145577008_-,
GTCGCGGGTTCGAT chr6:26422474-26422674_+,chr6:26624860-26625060_+,chr6:27557889-27558089_+,chr6:26422474-26422674_-,chr6:26624860-26625060_-,chr6:27557889-27558089_-,
GTCGCAACCGTTTA chr6:41135645-41135845_+,chr6:41135645-41135845_-,
GTCGCGAACGCGCG chr7:114437604-114437804_+,chr7:114437604-114437804_-,
GTCGCAACCCGTTG chr7:150466867-150467067_+,chr7:150466867-150467067_-,
GTCGCTGCGCGCTA chr7:43046471-43046671_+,chr7:43046548-43046748_+,chr7:43046471-43046671_-,chr7:43046548-43046748_-,
GTCGCCCGTGTCGC chr7:44304090-44304290_+,chr7:44304090-44304290_-,
GTCGCCACTAGGCG chr7:77606264-77606464_+,chr7:77606264-77606464_-,
GTCGCTCCTCGGTG chr8:100072503-100072703_+,chr8:100072503-100072703_-,
GTCGCTAAGCGATG chr9:136476285-136476485_+,chr9:136476285-136476485_-,
GTCGCGTACTCCCG chr9:141406593-

TTAACCTCCCGAGT chr18:9966688-9966888_+,chr18:9966688-9966888_-,
TTAACGGCGCAAGT chr2:27062112-27062312_+,chr2:27062112-27062312_-,
TAACACGTCCTTCC chr10:33955897-33956097_+,chr10:33955897-33956097_-,
TAACACGCCGGGCG chr11:70152854-70153054_+,chr11:70152854-70153054_-,
TAACATACCACGTG chr18:3346727-3346927_+,chr18:3346727-3346927_-,
TAACAGCTCGCGTA chr20:21866180-21866380_+,chr20:21866180-21866380_-,
TAACAGCTCGCGTA chr20:21866180-21866380_+,chr20:21866180-21866380_-,
TAACAGCTCGCGTA chr20:21866180-21866380_+,chr20:21866180-21866380_-,
TAACAGACGACACG chr4:172481706-172481906_+,chr4:172481706-172481906_-,
TAACACGCGAAAGG chr5:181729533-181729733_+,chr5:181729533-181729733_-,
TAACATACCACGGG chr7:77606264-77606464_+,chr7:77606264-77606464_-,
AACAATCGACAACT chr1:181616175-181616375_+,chr1:181616175-181616375_-,
ACAAGTGCGGTTCG chr11:64886677-64886877_+,chr11:64886677-64886877_-,
ACAAGTCGCACGCG chr17:60434238-60434438_+,chr17:60434238-60434438_-,
ACAAGTGTCGCCCG chr8:61334084-61334284_+,chr8:61334084-

TTCACGGGGTATAG chr4:38047758-38047958_+,chr4:38047758-38047958_-,
TTCACGCGACGCCT chr5:132614367-132614567_+,chr5:132614367-132614567_-,
TTCACGTGACTTAA chr7:47428253-47428453_+,chr7:47428253-47428453_-,
ACCCGTGTCCCGCG chr1:47589148-47589348_+,chr1:47589148-47589348_-,
ACCCGCCACACGAC chr12:123858250-123858450_+,chr12:123858250-123858450_-,
ACCCGAACGGGCGT chr16:31021291-31021491_+,chr16:31021291-31021491_-,
ACCCGTCGTCGCGT chr19:48270763-48270963_+,chr19:48270763-48270963_-,
ACCCGTCGTCGCGT chr19:48270763-48270963_+,chr19:48270763-48270963_-,
ACCCGCGTCTCCCG chr22:46781380-46781580_+,chr22:46781380-46781580_-,
ACCCGCGGTAGGAC chr4:176065641-176065841_+,chr4:176065641-176065841_-,
ACCCGCATCGCGGG chr5:51741929-51742129_+,chr5:51741929-51742129_-,
ACCCGCTTATTGCG chr6:139962039-139962239_+,chr6:139962039-139962239_-,
ACCCGCTAGAGAGT chr6:26383464-26383664_+,chr6:26383464-26383664_-,
ACCCGCGAGCTACG chr9:113658295-113658495_+,chr9:113658295-113658495_-,
ACCCGTAACGCGGA chrX:47033701-47033901_+,chrX:4

GAGTTCGGACCGAA chr7:5356325-5356525_+,chr7:5356325-5356525_-,
GAGTTGCGTAAACG chr9:119443548-119443748_+,chr9:119443548-119443748_-,
TTGGACGCGATAAG chr15:54267932-54268132_+,chr15:54267932-54268132_-,
TTGGACGTACTGCG chr19:51328096-51328296_+,chr19:51328096-51328296_-,
TTGGACCATCGCCG chr19:58181561-58181761_+,chr19:58181561-58181761_-,
TTGGACGCGCGCAA chr2:241716592-241716792_+,chr2:241716592-241716792_-,
TTGGACCAACGCGC chr3:46926001-46926201_+,chr3:46926001-46926201_-,
TTGGACACGCGAAA chr3:58218239-58218439_+,chr3:58218239-58218439_-,
TTGGATAGCCGACG chr8:127114277-127114477_+,chr8:127114277-127114477_-,
GCTGGACGGTCGTA chr1:162413812-162414012_+,chr1:162413812-162414012_-,
GCTGGTTATTCGAT chr7:70626231-70626431_+,chr7:70626231-70626431_-,
GGGACGGCGCTACG chr1:14100690-14100890_+,chr1:14100690-14100890_-,
GGGACGATCGGCTA chr1:70407037-70407237_+,chr1:70407039-70407239_+,chr1:70407037-70407237_-,chr1:70407039-70407239_-,
GGGACGTACGCGAG chr10:131039427-131039627_+,chr10:131039427-131039627_-,
GG

GCGTGGCCAATATA chr19:17789263-17789463_+,chr19:17789263-17789463_-,
GCGTGTTACGTCCG chr19:44927994-44928194_+,chr19:44927994-44928194_-,
GCGTGCCTCGGTAC chr19:5706718-5706918_+,chr19:5706718-5706918_-,
GCGTGTATTCTGAC chr2:35415646-35415846_+,chr2:35415646-35415846_-,
GCGTGCCGGTGCGC chr20:2131819-2132019_+,chr20:2131819-2132019_-,
GCGTGCGTCGCGAC chr3:124555037-124555237_+,chr3:124555037-124555237_-,
GCGTGCGTCGCGAC chr3:124555037-124555237_+,chr3:124555037-124555237_-,
GCGTGTAACCAGCG chr7:5605459-5605659_+,chr7:5605459-5605659_-,
GCGTGGGCCTAACG chr8:54835089-54835289_+,chr8:54835089-54835289_-,
GCGTGCTTATAGCG chr9:35574676-35574876_+,chr9:35574688-35574888_+,chr9:35574676-35574876_-,chr9:35574688-35574888_-,
CATCCACCGCGATC chr13:44836919-44837119_+,chr13:44836919-44837119_-,
CATCCGACCGGTAT chr16:63095467-63095667_+,chr16:63095467-63095667_-,
CATCCTCGCGTATC chr21:13838708-13838908_+,chr21:13838708-13838908_-,
CATCCGACCGATCG chr6:26195903-26196103_+,chr6:26195921-26196121_+,chr6:26195940-261

ACGGCGGATCCTCC chr19:13973839-13974039_+,chr19:13973839-13974039_-,
ACGGCATTCGCGCG chr19:51164171-51164371_+,chr19:51164171-51164371_-,
ACGGCCGGCGCTCG chr2:6887295-6887495_+,chr2:6887295-6887495_-,
ACGGCTGAACGTAT chr21:28761850-28762050_+,chr21:28761850-28762050_-,
ACGGCGGAGCCTAC chr21:31531339-31531539_+,chr21:31531339-31531539_-,
ACGGCGGGCGAAAA chr3:189628340-189628540_+,chr3:189628340-189628540_-,
ACGGCGGATCGTCT chr4:113916866-113917066_+,chr4:113916866-113917066_-,
ACGGCAGTACCCTA chr5:153219929-153220129_+,chr5:153219929-153220129_-,
ACGGCGGGCGTCGT chr5:80971996-80972196_+,chr5:80971996-80972196_-,
ACGGCTCCTGCGTA chr6:44110466-44110666_+,chr6:44110466-44110666_-,
ACGGCGATCGACCG chr7:146016712-146016912_+,chr7:146016712-146016912_-,
ACGGCGGATCTCAC chrX:108861122-108861322_+,chrX:108861130-108861330_+,chrX:108861122-108861322_-,chrX:108861130-108861330_-,
CGGCATAGCGCGTT chr19:51831235-51831435_+,chr19:51831235-51831435_-,
CGGCAACTATACGT chr19:54416063-54416263_+,chr19:54416063-544162

CTGTCGTACGGCAA chr16:30721507-30721707_+,chr16:30721507-30721707_-,
CTGTCGAGCCACCA chr4:1801346-1801546_+,chr4:1801346-1801546_-,
CTGTCGATCGGCCA chr5:153219929-153220129_+,chr5:153219929-153220129_-,
CTGTCGTTACGCCC chr5:181614978-181615178_+,chr5:181614978-181615178_-,
CTGTCCACGATAGT chr6:166815-167015_+,chr6:166815-167015_-,
CTGTCGTTAGTCGG chr7:5091691-5091891_+,chr7:5091691-5091891_-,
TGTCACCGCGATAT chr14:13868985-13869185_+,chr14:13868985-13869185_-,
TGTCACGTGATACC chr19:1824715-1824915_+,chr19:1824715-1824915_-,
TGTCAGATAGCGAT chr19:50479239-50479439_+,chr19:50479239-50479439_-,
TGTCACAGGCGATA chr2:16348342-16348542_+,chr2:16348342-16348542_-,
TGTCACGGGAACTA chr8:131519377-131519577_+,chr8:131519377-131519577_-,
CATGTCGCGTCATT chr1:20251559-20251759_+,chr1:20251559-20251759_-,
CATGTGATTCGCGG chr16:56657731-56657931_+,chr16:56657731-56657931_-,
CATGTGGCGCCATT chr22:43664712-43664912_+,chr22:43664727-43664927_+,chr22:43664712-43664912_-,chr22:43664727-43664927_-,
CATGTGGGGCGATT chr3:

TAAGCCGGGAACGA chr15:54294064-54294264_+,chr15:54294064-54294264_-,
TAAGCGTCGCGAGC chr19:54482877-54483077_+,chr19:54482956-54483156_+,chr19:54482957-54483157_+,chr19:54482877-54483077_-,chr19:54482956-54483156_-,chr19:54482957-54483157_-,
TAAGCGTCGCGAGC chr19:54482877-54483077_+,chr19:54482956-54483156_+,chr19:54482957-54483157_+,chr19:54482877-54483077_-,chr19:54482956-54483156_-,chr19:54482957-54483157_-,
TAAGCACCGCTCCG chr2:231141909-231142109_+,chr2:231141909-231142109_-,
TAAGCAATCTGTCG chr3:156998781-156998981_+,chr3:156998781-156998981_-,
TAAGCCGCCCTATC chr4:6084090-6084290_+,chr4:6084090-6084290_-,
TAAGCATCGGCGCG chr5:164040599-164040799_+,chr5:164040599-164040799_-,
TAAGCTACATAGCG chr6:138741398-138741598_+,chr6:138741398-138741598_-,
TAAGCTCGTCTGAC chr6:14084265-14084465_+,chr6:14084265-14084465_-,
TAAGCGCGAGCCGA chr6:3029850-3030050_+,chr6:3029850-3030050_-,
TAAGCAGTCGAGCG chr7:10215821-10216021_+,chr7:10215821-10216021_-,
TAAGCGGCGGTGCG chr7:91369937-91370137_+,chr7:9136993

CCTCGCGTCGCGTA chr22:30230190-30230390_+,chr22:30230190-30230390_-,
CCTCGACGGAACGT chr5:178535362-178535562_+,chr5:178535362-178535562_-,
CCTCGCTTACTCGA chr6:27557889-27558089_+,chr6:27557889-27558089_-,
CCTCGACGTCACCG chr7:45146960-45147160_+,chr7:45146960-45147160_-,
CCTCGAATGACGCT chr8:133798771-133798971_+,chr8:133798771-133798971_-,
CCTCGCAGTTAGAT chr8:73670032-73670232_+,chr8:73670032-73670232_-,
CCTCGCGTGATCCA chr9:141262768-141262968_+,chr9:141262768-141262968_-,
CTCGACGCGGACTC chr10:102023503-102023703_+,chr10:102023503-102023703_-,
CTCGACACTTCGGT chr10:12207111-12207311_+,chr10:12207111-12207311_-,
CTCGACGCTATATA chr11:340647-340847_+,chr11:340647-340847_-,
CTCGAACCCACGAC chr14:52446773-52446973_+,chr14:52446785-52446985_+,chr14:52446773-52446973_-,chr14:52446785-52446985_-,
CTCGATAAACGCGA chr15:43087289-43087489_+,chr15:43087289-43087489_-,
CTCGATGCGATCGG chr15:60926541-60926741_+,chr15:60926541-60926741_-,
CTCGATGCGATCGG chr15:60926541-60926741_+,chr15:60926541-60926741_-,


TAGACGCACGGACG chr19:12926205-12926405_+,chr19:12926205-12926405_-,
TAGACGCACCTAAA chr2:106113736-106113936_+,chr2:106113736-106113936_-,
TAGACAGGTCGAAG chr22:24987067-24987267_+,chr22:24987067-24987267_-,
TAGACGCCCGGATG chr5:173257091-173257291_+,chr5:173257091-173257291_-,
TAGACGCCCGTCCA chr7:1276701-1276901_+,chr7:1276701-1276901_-,
TAGACGCCGGCGGG chr7:5506294-5506494_+,chr7:5506294-5506494_-,
TAGACCGGTCCGTG chr8:42102379-42102579_+,chr8:42102379-42102579_-,
TAGACGAATAGACG chr9:145399893-145400093_+,chr9:145399893-145400093_-,
AGACCGTAACGCCT chr12:2336076-2336276_+,chr12:2336076-2336276_-,
AGACCGAACCGCTA chr20:25110470-25110670_+,chr20:25110470-25110670_-,
AGACCGGTGCGGCG chr20:33742622-33742822_+,chr20:33742622-33742822_-,
AGACCGCGCGTACC chr5:164040599-164040799_+,chr5:164040599-164040799_-,
GACCCGTTACGCCC chr1:160577417-160577617_+,chr1:160577452-160577652_+,chr1:160577417-160577617_-,chr1:160577452-160577652_-,
GACCCGTAGAGTAA chr11:117568652-117568852_+,chr11:117568652-117568852_-

GTTCTAAACGACGC chr19:59361751-59361951_+,chr19:59361751-59361951_-,
GTTCTCGATCCTCG chr2:219994525-219994725_+,chr2:219994525-219994725_-,
GTTCTAGCGCGCGT chr2:232146844-232147044_+,chr2:232146844-232147044_-,
GTTCTCCAGTCGTA chr2:238356423-238356623_+,chr2:238356423-238356623_-,
GTTCTCGTTGGGAC chr3:125641498-125641698_+,chr3:125641498-125641698_-,
GTTCTCGCTACGTA chrX:47983424-47983624_+,chrX:47983424-47983624_-,
TTCATTACGCGCTA chr10:118445722-118445922_+,chr10:118445722-118445922_-,
TTCATCGCGTCCGA chr4:115829379-115829579_+,chr4:115829379-115829579_-,
TTCATCTGTCGATC chr5:153219929-153220129_+,chr5:153219929-153220129_-,
GAGGTCGGTCGGAC chr1:208922141-208922341_+,chr1:208922141-208922341_-,
GAGGTACGGCGCGT chr12:114417608-114417808_+,chr12:114417608-114417808_-,
GAGGTCAAACCGTA chr12:43634725-43634919_+,chr12:43634725-43634919_-,
GAGGTCCGGACGCG chr17:80742669-80742869_+,chr17:80742669-80742869_-,
GAGGTCGCCACTAG chr5:92129352-92129552_+,chr5:92129352-92129552_-,
GAGGTGGAACGTAC chr9:132633558-

TGTCCGTACGATCC chr16:60734908-60735108_+,chr16:60734908-60735108_-,
TGTCCGCCCGGCGT chr16:63096502-63096702_+,chr16:63096560-63096760_+,chr16:63096502-63096702_-,chr16:63096560-63096760_-,
TGTCCGACCCGCGT chr22:17714180-17714380_+,chr22:17714180-17714380_-,
TGTCCGCGAGACGG chr3:150140112-150140312_+,chr3:150140112-150140312_-,
TGAAACGCGTTTCT chr17:40325203-40325403_+,chr17:40325203-40325403_-,
TGAAACTCCGCGAT chr4:105659682-105659882_+,chr4:105659682-105659882_-,
TGAAACGCCGCGTT chr6:5720320-5720520_+,chr6:5720320-5720520_-,
AATGTATCGATCGT chr1:84274244-84274444_+,chr1:84274252-84274452_+,chr1:84274244-84274444_-,chr1:84274252-84274452_-,
AATGTCCGCGTTCG chr19:1415596-1415796_+,chr19:1415629-1415829_+,chr19:1415596-1415796_-,chr19:1415629-1415829_-,
AATGTCTCGCGGCC chr3:46993074-46993274_+,chr3:46993074-46993274_-,
ATGTACAGTGCGCG chr1:25835491-25835691_+,chr1:25835491-25835691_-,
ATGTAAGCTGTACG chr3:52905383-52905583_+,chr3:52905383-52905583_-,
TGTACGTCTTATCG chr1:38603170-38603370_+,chr1:386

ATAGCAGACGATAC chr6:26173747-26173963_+,chr6:26173752-26173968_+,chr6:26173747-26173963_-,chr6:26173752-26173968_-,
ATAGCACACGCGCG chr6:28130941-28131141_+,chr6:28130941-28131141_-,
ATAGCGCGCGCGTG chr7:102092632-102092833_+,chr7:102092632-102092833_-,
ATAGCGCGCGCGTG chr7:102092632-102092833_+,chr7:102092632-102092833_-,
ATAGCGCAAGGGTC chr7:11324106-11324306_+,chr7:11324106-11324306_-,
ATAGCCGTCGTGTG chr7:17364254-17364454_+,chr7:17364254-17364454_-,
ATAGCGTCGCGGCC chr7:66973016-66973216_+,chr7:66973016-66973216_-,
ATAGCATGGCGCCG chr9:140138456-140138656_+,chr9:140138456-140138656_-,
TAGCTCGTGCGACA chr21:41762474-41762674_+,chr21:41762474-41762674_-,
TAGCTCGTGCGACA chr21:41762474-41762674_+,chr21:41762474-41762674_-,
TAGCTGAACGACGG chr8:8347434-8347634_+,chr8:8347434-8347634_-,
TGGATAACGCGTTA chr1:191823807-191824007_+,chr1:191823807-191824007_-,
TGGATCGACATACC chr10:47446823-47447023_+,chr10:47446823-47447023_-,
TGGATTCGCCGTCG chr12:94168131-94168331_+,chr12:94168131-94168331_-,
TGGATA

AGCATCGCGTAATT chr17:48886327-48886527_+,chr17:48886327-48886527_-,
AGCATAGGACGATA chr18:31160505-31160705_+,chr18:31160505-31160705_-,
AGCATAGCGCCGAT chr6:10822235-10822435_+,chr6:10822235-10822435_-,
GCATGATCGGCGTG chr1:242240273-242240473_+,chr1:242240273-242240473_-,
GCATGATTAACGTC chr4:149156346-149156546_+,chr4:149156346-149156546_-,
GCATGAGCGTCGTA chr5:155181236-155181436_+,chr5:155181236-155181436_-,
AGTAATGTTCGACG chr1:169813769-169813969_+,chr1:169813769-169813969_-,
AGTAAACGACCGCG chr1:211853597-211853797_+,chr1:211853597-211853797_-,
AGTAACGTCGCCGA chr11:50357273-50357473_+,chr11:50357273-50357473_-,
AGTAAGGTCCTCGC chr15:86985214-86985414_+,chr15:86985214-86985414_-,
AGTAAGAGTAACGT chr3:4574728-4574928_+,chr3:4574728-4574928_-,
AGTAACGGTAGCGA chrY:13812940-13813140_+,chrY:13812940-13813140_-,
TAAACGGCCCCGAA chr12:57833445-57833645_+,chr12:57833445-57833645_-,
TAAACCGGGTCGCA chr16:95328544-95328744_+,chr16:95328544-95328744_-,
TAAACCGCGCCTTA chr19:1719475-1719675_+,chr19:171

CTGCGTTCGGCGGC chr10:130896914-130897114_+,chr10:130896914-130897114_-,
CTGCGAGTGAGTCG chr10:76386627-76386827_+,chr10:76386627-76386827_-,
CTGCGACGCGTAAT chr11:47932149-47932349_+,chr11:47932149-47932349_-,
CTGCGACGCGTAAT chr11:47932149-47932349_+,chr11:47932149-47932349_-,
CTGCGATACGCCGA chr11:86978700-86978900_+,chr11:86978700-86978900_-,
CTGCGATACGCCGA chr11:86978700-86978900_+,chr11:86978700-86978900_-,
CTGCGATGCGTTCG chr11:95158624-95158824_+,chr11:95158624-95158824_-,
CTGCGTCCGTCGCG chr12:131257048-131257248_+,chr12:131257048-131257248_-,
CTGCGTCCGTCGCG chr12:131257048-131257248_+,chr12:131257048-131257248_-,
CTGCGTCCGTCGCG chr12:131257048-131257248_+,chr12:131257048-131257248_-,
CTGCGATCGGCAAC chr15:81706416-81706616_+,chr15:81706416-81706616_-,
CTGCGCGTTATATA chr16:19017524-19017724_+,chr16:19017524-19017724_-,
CTGCGCGAAGCGAT chr16:60449595-60449795_+,chr16:60449595-60449795_-,
CTGCGTACTAACGG chr19:50072781-50072979_+,chr19:50072781-50072979_-,
CTGCGCGTGCGTAG chr19:5815630-581

CCGCTATGGTACGA chr6:158277954-158278154_+,chr6:158277954-158278154_-,
CCGCTCTCGATACA chr6:167815268-167815468_+,chr6:167815268-167815468_-,
CCGCTTATTACCCG chr6:100787470-100787670_+,chr6:100787470-100787670_-,
GCTCTGCTCGTACG chr15:38318994-38319194_+,chr15:38319028-38319228_+,chr15:38318994-38319194_-,chr15:38319028-38319228_-,
GCTCTGATCTTACG chr2:217032492-217032692_+,chr2:217032492-217032692_-,
GCTCTGATCCTACG chr9:105595484-105595684_+,chr9:105595488-105595688_+,chr9:105595484-105595684_-,chr9:105595488-105595688_-,
GCTCTCGCGCTACG chrX:3433935-3434135_+,chrX:3433935-3434135_-,
TGCCCGTAAGTGTA chr1:12325881-12326081_+,chr1:12325881-12326081_-,
GCGATACGCCGAGC chr11:86978700-86978900_+,chr11:86978700-86978900_-,
GCGATCGGTTCGAC chr11:89784038-89784238_+,chr11:89784038-89784238_-,
GCGATCGTAGCTCG chr12:111138253-111138453_+,chr12:111138253-111138453_-,
GCGATTCTCGGAAC chr12:130068123-130068323_+,chr12:130068123-130068323_-,
GCGATCGTATAAGG chr12:28115232-28115432_+,chr12:28115232-28115432_-,


TATAAAGCGCGCCG chr17:59499858-59500058_+,chr17:59499858-59500058_-,
TATAAAGGATCACG chr19:10397033-10397233_+,chr19:10397033-10397233_-,
TATAACGAGCGACA chr4:113933789-113933989_+,chr4:113933812-113934012_+,chr4:113933789-113933989_-,chr4:113933812-113934012_-,
TATAAGCGCGGGGA chr5:171928077-171928277_+,chr5:171928077-171928277_-,
TATAATAGCGATCC chr7:104227302-104227502_+,chr7:104227302-104227502_-,
TATAATGACTCCCG chr7:7075303-7075503_+,chr7:7075303-7075503_-,
TATAATTCCCCCGA chr8:42990537-42990737_+,chr8:42990537-42990737_-,
ATAAGAATCGGAGA chr11:35960930-35961130_+,chr11:35960930-35961130_-,
ATAAGACCATCGAC chr9:103648981-103649181_+,chr9:103648981-103649181_-,
TCTACGGTAGCGAC chr1:15587305-15587505_+,chr1:15587305-15587505_-,
TCTACGGTAGCGAC chr1:15587305-15587505_+,chr1:15587305-15587505_-,
TCTACGATAGTGAC chr1:211663389-211663589_+,chr1:211663389-211663589_-,
TCTACGGCGCTGCG chr11:65545212-65545412_+,chr11:65545212-65545412_-,
TCTACGTGTAGACG chr12:55586289-55586489_+,chr12:55586289-55586489

CATACGTCGTGTGG chr7:2871836-2872036_+,chr7:2871836-2872036_-,
ATACCTACGGCGGC chr1:85549078-85549278_+,chr1:85549078-85549278_-,
ATACCTTAGCGGCT chr11:46453047-46453247_+,chr11:46453047-46453247_-,
ATACCGGTGCGCGG chr11:67601437-67601637_+,chr11:67601437-67601637_-,
ATACCGGTGCGCGG chr11:67601437-67601637_+,chr11:67601437-67601637_-,
ATACCGGTGCGCGG chr11:67601437-67601637_+,chr11:67601437-67601637_-,
ATACCTTCGGCCGC chr13:25400388-25400588_+,chr13:25400388-25400588_-,
ATACCGCCTCGCGC chr15:65655719-65655919_+,chr15:65655719-65655919_-,
ATACCGCAATTCCA chr15:68391968-68392168_+,chr15:68391968-68392168_-,
ATACCGCGCTCCCA chr16:80821462-80821662_+,chr16:80821462-80821662_-,
ATACCTGGACCCGC chr3:110245540-110245740_+,chr3:110245540-110245740_-,
ATACCTCGATTGGA chr5:148194999-148195199_+,chr5:148194999-148195199_-,
ATACCCGGTCCTCG chr5:181147285-181147485_+,chr5:181147285-181147485_-,
ATACCAGTACACGA chr9:19187100-19187300_+,chr9:19187106-19187306_+,chr9:19187107-19187307_+,chr9:19187100-19187300_-,chr

GTGCGGTAATATCT chr9:147684786-147684986_+,chr9:147684786-147684986_-,
GTGCGTGCGGTATG chr9:36347573-36347773_+,chr9:36347573-36347773_-,
GTGCGACGATTTAC chrX:122143853-122144053_+,chrX:122143860-122144060_+,chrX:122143853-122144053_-,chrX:122143860-122144060_-,
GTGCGACATACCAA chrX:64412772-64412972_+,chrX:64412772-64412972_-,
TGCGTTCGCGCTTT chr1:16706554-16706753_+,chr1:16706554-16706753_-,
TGCGTGAAGGTCCG chr1:202479050-202479250_+,chr1:202479051-202479251_+,chr1:202479050-202479250_-,chr1:202479051-202479251_-,
TGCGTCGCGCGGTA chr1:227298111-227298311_+,chr1:227298111-227298311_-,
TGCGTCGCGCGGTA chr1:227298111-227298311_+,chr1:227298111-227298311_-,
TGCGTCGCGCGGTA chr1:227298111-227298311_+,chr1:227298111-227298311_-,
TGCGTCGCGTGTCT chr1:92286899-92287099_+,chr1:92286899-92287099_-,
TGCGTCGCATCGGC chr10:121839108-121839308_+,chr10:121839135-121839335_+,chr10:121839108-121839308_-,chr10:121839135-121839335_-,
TGCGTCCGTCGCGC chr12:131257048-131257248_+,chr12:131257048-131257248_-,
TGCGTGGC

GTATATCTTTGCGC chr12:7874256-7874456_+,chr12:7874256-7874456_-,
GTATACGCCCAGAT chr14:93216780-93216980_+,chr14:93216780-93216980_-,
GTATACGCGTTGTC chr16:64399957-64400158_+,chr16:64399957-64400158_-,
GTATACGTTTGCCT chr17:29131204-29131404_+,chr17:29131204-29131404_-,
GTATACCGAGAACA chr20:25081668-25081868_+,chr20:25081668-25081868_-,
TATATCGGAGCGCG chr1:75622727-75622927_+,chr1:75622727-75622927_-,
TATATCGGAGCGCG chr1:75622727-75622927_+,chr1:75622727-75622927_-,
TATATCTTTGCGCC chr12:7874256-7874456_+,chr12:7874256-7874456_-,
TATATCTTTGCGCC chr12:7874256-7874456_+,chr12:7874256-7874456_-,
TATATTCTTCGCGT chr14:52446773-52446973_+,chr14:52446785-52446985_+,chr14:52446773-52446973_-,chr14:52446785-52446985_-,
TATATCGCGGGGTG chr14:84621633-84621833_+,chr14:84621633-84621833_-,
TATATCGCGGCCGT chr4:98598455-98598655_+,chr4:98598455-98598655_-,
TATATCGCGGCCGT chr4:98598455-98598655_+,chr4:98598455-98598655_-,
TATATGCGGATAGA chr7:150038147-150038347_+,chr7:150038147-150038347_-,
TATATCCCGCACGT

ATATCGCGAGGTAT chr1:110044561-110044761_+,chr1:110044561-110044761_-,
ATATCGTTGCTCGC chr1:14427338-14427538_+,chr1:14427338-14427538_-,
ATATCCGCCGCGCG chr1:227653152-227653352_+,chr1:227653152-227653352_-,
ATATCCGCCGCGCG chr1:227653152-227653352_+,chr1:227653152-227653352_-,
ATATCTCTATGCGT chr1:35651230-35651430_+,chr1:35651230-35651430_-,
ATATCGGAGCGCGA chr1:75622727-75622927_+,chr1:75622727-75622927_-,
ATATCGGCCGGGCG chr14:15476782-15476982_+,chr14:15476782-15476982_-,
ATATCGGCTCCGAG chr19:48320401-48320601_+,chr19:48320401-48320601_-,
ATATCGGTGTGTCG chr2:177814434-177814634_+,chr2:177814434-177814634_-,
ATATCGGTGTGTCG chr2:177814434-177814634_+,chr2:177814434-177814634_-,
ATATCGGTGTGTCG chr2:177814434-177814634_+,chr2:177814434-177814634_-,
ATATCCCGCGCATA chr4:152789929-152790129_+,chr4:152789929-152790129_-,
ATATCCCGCGCATA chr4:152789929-152790129_+,chr4:152789929-152790129_-,
ATATCCCGCGCATA chr4:152789929-152790129_+,chr4:152789929-152790129_-,
ATATCGGTGCCGCT chr6:108672149-108672

TGGCGGTGGAACAT chr7:72118561-72118761_+,chr7:72118561-72118761_-,
TGGCGGTCTTAATG chr8:28141249-28141448_+,chr8:28141249-28141448_-,
TGGCGGATTCGTAT chrX:9702062-9702262_+,chrX:9702102-9702302_+,chrX:9702062-9702262_-,chrX:9702102-9702302_-,
TGGCGCCGATCAAC chrX:822907-823107_+,chrX:822907-823107_-,
GCTCGCCACCGCTA chr10:126329811-126330011_+,chr10:126329839-126330039_+,chr10:126329811-126330011_-,chr10:126329839-126330039_-,
GCTCGTAACGACAC chr10:60216766-60216968_+,chr10:60216766-60216968_-,
GCTCGACGCCAGTA chr11:57337404-57337604_+,chr11:57337404-57337604_-,
GCTCGTACGCGTAC chr12:51784946-51785146_+,chr12:51784946-51785146_-,
GCTCGCGTGAGTAT chr13:29652469-29652669_+,chr13:29652469-29652669_-,
GCTCGTATCCGGGT chr14:89601369-89601569_+,chr14:89601369-89601569_-,
GCTCGTCGCTAGCT chr17:40265498-40265698_+,chr17:40265498-40265698_-,
GCTCGAGGCGAGAC chr17:78775293-78775493_+,chr17:78775293-78775493_-,
GCTCGCGACCGCGA chr18:37021811-37022011_+,chr18:37021811-37022011_-,
GCTCGCCGCGAAAC chr19:5706718-5

GGACCGTAGCGCGT chr16:54040967-54041167_+,chr16:54040967-54041167_-,
GGACCGTAGCGCGT chr16:54040967-54041167_+,chr16:54040967-54041167_-,
GGACCGCGAACCGA chr3:120717369-120717569_+,chr3:120717369-120717569_-,
GGACCGTCCGAGTA chr6:138997477-138997677_+,chr6:138997477-138997677_-,
GGACCGCGCTACTA chr7:27238480-27238680_+,chr7:27238480-27238680_-,
GACCAGCGCGCGAA chr15:95418244-95418444_+,chr15:95418244-95418444_-,
GACCATAGGAGGCG chr16:2573764-2573964_+,chr16:2573764-2573964_-,
GACCATAGAGCGTA chr17:16177413-16177613_+,chr17:16177413-16177613_-,
GACCATGTGACGCG chr19:6742770-6742970_+,chr19:6742770-6742970_-,
GACCAATCGCGACC chr7:66446184-66446384_+,chr7:66446184-66446384_-,
AATTCTGTCCGACG chr10:3096694-3096894_+,chr10:3096694-3096894_-,
AATTCTATGCGGGA chr12:30292379-30292578_+,chr12:30292379-30292578_-,
AATTCCCGTCCGCG chr6:170233547-170233747_+,chr6:170233572-170233772_+,chr6:170233547-170233747_-,chr6:170233572-170233772_-,
AGGTAACGCCCGAA chr20:47868777-47868977_+,chr20:47868777-47868977_-,
AGGT

TCGTGACGTGTGAT chr20:8136840-8137040_+,chr20:8136840-8137040_-,
TCGTGCAAACGAAG chr22:22157791-22157991_+,chr22:22157791-22157991_-,
TCGTGTAACCCGCG chr3:22230015-22230215_+,chr3:22230015-22230215_-,
TCGTGCGGCTCCAC chr4:111672695-111672895_+,chr4:111672695-111672895_-,
TCGTGTTGACTATA chr5:176262679-176262879_+,chr5:176262679-176262879_-,
TCGTGGTTCGCCGT chr6:130104381-130104581_+,chr6:130104381-130104581_-,
TCGTGCGCGCGTGC chr6:26960573-26960773_+,chr6:26960573-26960773_-,
TCGTGCGTGCGCAG chr7:67874049-67874249_+,chr7:67874049-67874249_-,
TCGTGGATCGATAC chr9:121103424-121103624_+,chr9:121103424-121103624_-,
TCGTGTGGACGACG chr9:143975393-143975593_+,chr9:143975393-143975593_-,
TCGTGTGGACGACG chr9:143975393-143975593_+,chr9:143975393-143975593_-,
TCGTGCTGCATAAC chr9:98854681-98854881_+,chr9:98854681-98854881_-,
CGTGGTCGTGCGAA chr1:25835491-25835691_+,chr1:25835491-25835691_-,
CGTGGTCGTGCGAA chr1:25835491-25835691_+,chr1:25835491-25835691_-,
CGTGGAATCAGCGA chr1:31006921-31007121_+,chr1:3100692

GCGCTATACCTTCG chr13:25400388-25400588_+,chr13:25400388-25400588_-,
GCGCTATTAATAGC chr16:1558384-1558584_+,chr16:1558384-1558584_-,
GCGCTAGCGGTCGG chr17:39373314-39373514_+,chr17:39373314-39373514_-,
GCGCTGATCGAGGA chr19:58076620-58076820_+,chr19:58076620-58076820_-,
GCGCTCCGCGGTAG chr2:90793544-90793744_+,chr2:90793544-90793744_-,
GCGCTGTAGGACTA chr20:25472656-25472856_+,chr20:25472656-25472856_-,
GCGCTGCGTTCGCG chr22:20133477-20133677_+,chr22:20133477-20133677_-,
GCGCTTCGTACAAA chr4:1166332-1166532_+,chr4:1166332-1166532_-,
GCGCTTCCGCAATA chr6:35596870-35597070_+,chr6:35596870-35597070_-,
GCGCTGTACGCGCG chr7:5091691-5091891_+,chr7:5091691-5091891_-,
GCGCTATTACGTCG chr7:77454056-77454256_+,chr7:77454056-77454256_-,
CGCTTGGAACGGTT chr1:16672261-16672461_+,chr1:16672261-16672461_-,
CGCTTACGGGTAAG chr1:178123164-178123364_+,chr1:178123164-178123364_-,
CGCTTGACACGTAG chr1:206509776-206509976_+,chr1:206509776-206509976_-,
CGCTTTTGCGACGC chr1:88527586-88527786_+,chr1:88527586-88527786_-,
CG

TCGATCCCGTGTCG chr12:69263140-69263340_+,chr12:69263145-69263345_+,chr12:69263165-69263365_+,chr12:69263140-69263340_-,chr12:69263145-69263345_-,chr12:69263165-69263365_-,
TCGATCCCGTGTCG chr12:69263140-69263340_+,chr12:69263145-69263345_+,chr12:69263165-69263365_+,chr12:69263140-69263340_-,chr12:69263145-69263345_-,chr12:69263165-69263365_-,
TCGATCAACTACTC chr13:99448833-99449033_+,chr13:99448833-99449033_-,
TCGATACTCCGCGA chr14:50343745-50343945_+,chr14:50343745-50343945_-,
TCGATACTCCGCGA chr14:50343745-50343945_+,chr14:50343745-50343945_-,
TCGATACGTCGAAT chr14:79629020-79629218_+,chr14:79629020-79629218_-,
TCGATAAACGCGAC chr15:43087289-43087489_+,chr15:43087289-43087489_-,
TCGATAAACGCGAC chr15:43087289-43087489_+,chr15:43087289-43087489_-,
TCGATAAACGCGAC chr15:43087289-43087489_+,chr15:43087289-43087489_-,
TCGATAAACGCGAC chr15:43087289-43087489_+,chr15:43087289-43087489_-,
TCGATCTGCGTCGC chr17:45989344-45989544_+,chr17:45989344-45989544_-,
TCGATCGCCTGCGC chr17:48640122-48640322_+,chr

ATTACGCGCGGTGA chr10:133962691-133962891_+,chr10:133962691-133962891_-,
ATTACGTCTGTGGG chr11:19562374-19562574_+,chr11:19562374-19562574_-,
ATTACCGATCTATG chr11:44475102-44475302_+,chr11:44475102-44475302_-,
ATTACGCACCGCGG chr13:47257867-47258067_+,chr13:47257867-47258067_-,
ATTACCGCTAGACG chr19:45596030-45596230_+,chr19:45596030-45596230_-,
ATTACGCGCCGTCG chr2:166639248-166639446_+,chr2:166639248-166639446_-,
ATTACCGGCGCGAA chr20:42694529-42694729_+,chr20:42694529-42694729_-,
ATTACGACTGGCTA chr3:123343334-123343534_+,chr3:123343334-123343534_-,
ATTACGACAGAAGA chr4:23771647-23771847_+,chr4:23771647-23771847_-,
ATTACACGTACCGT chrX:315394-315594_+,chrX:315394-315594_-,
ATTACACGTACCGT chrX:315394-315594_+,chrX:315394-315594_-,
ACACGGGTTCGTCG chr11:59501280-59501480_+,chr11:59501350-59501550_+,chr11:59501280-59501480_-,chr11:59501350-59501550_-,
ACACGGTAACAGTA chr14:24203069-24203269_+,chr14:24203069-24203269_-,
ACACGGCGGATCGG chr16:31830087-31830287_+,chr16:31830087-31830287_-,
ACACGGTCCG

GGGATATGGTCGAT chr5:148846836-148847036_+,chr5:148846836-148847036_-,
GGGATATTGTATCG chr5:17383216-17383416_+,chr5:17383216-17383416_-,
GATCGTACGCCGGC chr1:176633380-176633580_+,chr1:176633380-176633580_-,
GATCGGCGAGTCAT chr1:225521563-225521763_+,chr1:225521563-225521763_-,
GATCGTCCGATGGG chr1:54920262-54920462_+,chr1:54920262-54920462_-,
GATCGACGAACTGC chr1:70100262-70100462_+,chr1:70100262-70100462_-,
GATCGCGATACTAG chr11:118307343-118307543_+,chr11:118307372-118307572_+,chr11:118307343-118307543_-,chr11:118307372-118307572_-,
GATCGGCAGGTCGA chr12:111971191-111971391_+,chr12:111971191-111971391_-,
GATCGGTCTTCGTT chr14:77084597-77084797_+,chr14:77084597-77084797_-,
GATCGACCTGCGAA chr16:26696762-26696962_+,chr16:26696762-26696962_-,
GATCGGGACGGCGA chr17:2613265-2613465_+,chr17:2613265-2613465_-,
GATCGGTTCGCTCT chr17:59527272-59527472_+,chr17:59527272-59527472_-,
GATCGGTCGGCTCG chr17:75734745-75734954_+,chr17:75734745-75734954_-,
GATCGGTCGGCTCG chr17:75734745-75734954_+,chr17:75734745-

CGCATCGGCATACC chr9:20756126-20756326_+,chr9:20756126-20756326_-,
GAACGTCCTCCCGA chr1:507815-508015_+,chr1:507815-508015_-,
GAACGTCGCGCCGA chr10:133435319-133435519_+,chr10:133435319-133435519_-,
GAACGCGAGACGCG chr12:102918645-102918845_+,chr12:102918645-102918845_-,
GAACGCGCGCCGTG chr2:232146844-232147044_+,chr2:232146844-232147044_-,
GAACGCGCGCCGTG chr2:232146844-232147044_+,chr2:232146844-232147044_-,
GAACGCGCGCCGTG chr2:232146844-232147044_+,chr2:232146844-232147044_-,
GAACGTAAAGACCG chr2:27706886-27707086_+,chr2:27706886-27707086_-,
GAACGGCGTAGCGA chr21:27248483-27248683_+,chr21:27248483-27248683_-,
GAACGTATGCCCCG chr21:41947637-41947837_+,chr21:41947637-41947837_-,
GAACGGCGGGCGAA chr3:189628340-189628540_+,chr3:189628340-189628540_-,
GAACGCCCACGATT chr6:143274553-143274753_+,chr6:143274553-143274753_-,
GAACGCGCGCGGAT chr7:158096773-158096973_+,chr7:158096773-158096973_-,
GAACGCGCGCGGAT chr7:158096773-158096973_+,chr7:158096773-158096973_-,
GAACGCGCGCGCCG chr8:70464557-70464757_+,

GCGCATCGCGACAC chr1:154365552-154365752_+,chr1:154365552-154365752_-,
GCGCACGCGCACCG chr1:16272096-16272296_+,chr1:16272096-16272296_-,
GCGCAAGCGGGACG chr1:19705797-19705997_+,chr1:19705797-19705997_-,
GCGCATTATTATCT chr1:20057115-20057315_+,chr1:20057115-20057315_-,
GCGCAGATACCGGG chr11:75512639-75512839_+,chr11:75512639-75512839_-,
GCGCAAAGATATAC chr12:8009011-8009211_+,chr12:8009011-8009211_-,
GCGCAATTAACGTG chr19:1427258-1427458_+,chr19:1427258-1427458_-,
GCGCACCGCGGTGC chr19:2758467-2758667_+,chr19:2758467-2758667_-,
GCGCAGATACCGCT chr19:2998486-2998686_+,chr19:2998486-2998686_-,
GCGCATCGCCCGCA chr19:58600235-58600435_+,chr19:58600235-58600435_-,
GCGCATCTCTCGCA chr21:40762738-40762938_+,chr21:40762738-40762938_-,
GCGCACGTTCCGCG chr3:155932783-155932983_+,chr3:155932783-155932983_-,
GCGCACCACGCGAC chr3:198709401-198709601_+,chr3:198709401-198709601_-,
GCGCACCACGCGAC chr3:198709401-198709601_+,chr3:198709401-198709601_-,
GCGCATGGTTGCCG chr4:186975950-186976150_+,chr4:186975950-18697

AACGACCATCCAGT chr10:114850358-114850558_+,chr10:114850358-114850558_-,
AACGAATCTGCCCA chr10:3486273-3486473_+,chr10:3486273-3486473_-,
AACGACGCGCATTT chr12:92318903-92319103_+,chr12:92318903-92319103_-,
AACGAATCTGCACA chr17:18919736-18919936_+,chr17:18919736-18919936_-,
AACGATTCGGCACA chr17:21148327-21148527_+,chr17:21148327-21148527_-,
AACGACCCGCGCGG chr17:77482474-77482674_+,chr17:77482474-77482674_-,
AACGACGGCCGGCG chr2:105304482-105304682_+,chr2:105304482-105304682_-,
AACGACGCGTCTTC chr2:20085037-20085237_+,chr2:20085037-20085237_-,
AACGAAGATCCTGT chr3:63111794-63111994_+,chr3:63111794-63111994_-,
AACGAACTAACGCG chr5:1559245-1559445_+,chr5:1559250-1559450_+,chr5:1559245-1559445_-,chr5:1559250-1559450_-,
AACGAGTCATCGTA chr8:23789348-23789548_+,chr8:23789348-23789548_-,
AACGACGCGATCGA chr9:140599420-140599620_+,chr9:140599420-140599620_-,
ACGAGTATCGATCG chr1:153471568-153471768_+,chr1:153471568-153471768_-,
ACGAGTCCTCCGAC chr1:154389298-154389498_+,chr1:154389298-154389498_-,
ACGAGC

CGTGCGAGTCATCG chr4:1041748-1041948_+,chr4:1041748-1041948_-,
CGTGCGACCGACAC chr4:142403821-142404021_+,chr4:142403821-142404021_-,
CGTGCGCGTGCGGT chr4:143747279-143747479_+,chr4:143747279-143747479_-,
CGTGCGCGTGCGGT chr4:143747279-143747479_+,chr4:143747279-143747479_-,
CGTGCGCGCGCGAA chr5:14201901-14202101_+,chr5:14201901-14202101_-,
CGTGCGCGAGAACG chr6:171184654-171184854_+,chr6:171184654-171184854_-,
CGTGCGCGAGAACG chr6:171184654-171184854_+,chr6:171184654-171184854_-,
CGTGCGCGAGAACG chr6:171184654-171184854_+,chr6:171184654-171184854_-,
CGTGCCCGTCGTTC chr7:47476600-47476800_+,chr7:47476600-47476800_-,
CGTGCGCGAGCTGA chr8:76737655-76737855_+,chr8:76737655-76737855_-,
CGTGCGCTTGAAGA chr9:136701371-136701571_+,chr9:136701371-136701571_-,
CGTGCGTAAATCGC chr9:139815389-139815589_+,chr9:139815421-139815621_+,chr9:139815389-139815589_-,chr9:139815421-139815621_-,
CGTGCGATCGCGTA chr9:29226355-29226555_+,chr9:29226355-29226555_-,
CGTGCGATCGCGTA chr9:29226355-29226555_+,chr9:29226355-292265

GCGACGAGGACGCG chr11:64230942-64231142_+,chr11:64230942-64231142_-,
GCGACGTGCGGTCG chr12:1687439-1687639_+,chr12:1687439-1687639_-,
GCGACTGGACGCGA chr12:30072699-30072899_+,chr12:30072699-30072899_-,
GCGACGCATTACGC chr13:47257867-47258067_+,chr13:47257867-47258067_-,
GCGACGCATTACGC chr13:47257867-47258067_+,chr13:47257867-47258067_-,
GCGACATCGCGTGG chr15:67216747-67216947_+,chr15:67216758-67216958_+,chr15:67216747-67216947_-,chr15:67216758-67216958_-,
GCGACCAATAGGAG chr15:87089551-87089751_+,chr15:87089551-87089751_-,
GCGACGATAACTGG chr16:27565180-27565380_+,chr16:27565180-27565380_-,
GCGACGCGAGATGG chr16:30072797-30072997_+,chr16:30072797-30072997_-,
GCGACCGTTCCTAT chr17:44566511-44566711_+,chr17:44566511-44566711_-,
GCGACGTCAGCGCG chr17:62321154-62321354_+,chr17:62321154-62321354_-,
GCGACGATGCGCGG chr17:75244784-75244984_+,chr17:75244784-75244984_-,
GCGACCGATAGCAT chr17:8555686-8555886_+,chr17:8555686-8555886_-,
GCGACGCGTGTCGG chr18:76504462-76504662_+,chr18:76504462-76504662_-,
GCGA

CACGACGACTCGCG chr1:167287341-167287541_+,chr1:167287341-167287541_-,
CACGATAGTCGCGG chr12:112085630-112085830_+,chr12:112085630-112085830_-,
CACGATCGTGGGAA chr12:4864839-4865039_+,chr12:4864848-4865048_+,chr12:4864839-4865039_-,chr12:4864848-4865048_-,
CACGAGTGTTCGAT chr2:113714892-113715092_+,chr2:113714892-113715092_-,
CACGAGAATCTAAT chr3:174489071-174489271_+,chr3:174489071-174489271_-,
CACGATCGCCCGGG chr3:189594855-189595055_+,chr3:189594855-189595055_-,
CACGAATAGTCGTG chr7:5546591-5546791_+,chr7:5546593-5546793_+,chr7:5546591-5546791_-,chr7:5546593-5546793_-,
CACGAATAGTCGTG chr7:5546591-5546791_+,chr7:5546593-5546793_+,chr7:5546591-5546791_-,chr7:5546593-5546793_-,
CACGACGCCACGTA chr9:89613925-89614125_+,chr9:89613925-89614125_-,
CACGACGCCACGTA chr9:89613925-89614125_+,chr9:89613925-89614125_-,
ACGAATCTCGACCA chr1:149191855-149192055_+,chr1:149191855-149192055_-,
ACGAACCTTCCACG chr12:120188172-120188372_+,chr12:120188172-120188372_-,
ACGAAGGTACGTCA chr13:97693158-97693358_+,chr13

CGTTCGGTCGACAA chr5:125323052-125323252_+,chr5:125323052-125323252_-,
CGTTCGCAGTCGGC chr6:152440899-152441099_+,chr6:152440899-152441099_-,
CGTTCAGGTGGCGA chr6:170373478-170373678_+,chr6:170373478-170373678_-,
CGTTCGTCGGAGGG chr6:26196450-26196650_+,chr6:26196450-26196650_-,
CGTTCCACCTGACG chr7:143067813-143068013_+,chr7:143067813-143068013_-,
CGTTCCACGCGTAA chr7:1969670-1969870_+,chr7:1969670-1969870_-,
CGTTCGCGTTTGGT chr8:75834304-75834504_+,chr8:75834304-75834504_-,
CGTTCATGCGAGAT chr9:31226802-31227002_+,chr9:31226802-31227002_-,
CGTTCTTCGGGCGA chrX:56906750-56906950_+,chrX:56906750-56906950_-,
CGCTACGCGCTTTT chr1:14100690-14100890_+,chr1:14100690-14100890_-,
CGCTAGTCGTGTTT chr1:15277154-15277356_+,chr1:15277154-15277356_-,
CGCTATCTGTAGAA chr1:228581687-228581887_+,chr1:228581687-228581887_-,
CGCTACGTGCCGGC chr1:41366489-41366689_+,chr5:91764377-91764577_+,chr1:41366489-41366689_-,chr5:91764377-91764577_-,
CGCTATGCGCTCCG chr1:44132441-44132641_+,chr1:44132441-44132641_-,
CGCTACGCGT

GACGATCACGTGAC chr15:71966061-71966261_+,chr15:71966061-71966261_-,
GACGATCTCGCGGG chr15:76300685-76300885_+,chr15:76300685-76300885_-,
GACGATCTCGCGGG chr15:76300685-76300885_+,chr15:76300685-76300885_-,
GACGAGCCGATTGG chr17:50962223-50962424_+,chr17:50962223-50962424_-,
GACGAAAAGCGCGG chr17:58881060-58881260_+,chr17:58881060-58881260_-,
GACGATCGCCCGTC chr18:24256095-24256295_+,chr18:24256095-24256295_-,
GACGATCGCCCGTC chr18:24256095-24256295_+,chr18:24256095-24256295_-,
GACGATCGCCCGTC chr18:24256095-24256295_+,chr18:24256095-24256295_-,
GACGATCGCCCGTC chr18:24256095-24256295_+,chr18:24256095-24256295_-,
GACGATGGTCCGTC chr18:62799586-62799786_+,chr18:62799586-62799786_-,
GACGATCACACGCG chr19:12926205-12926405_+,chr19:12926205-12926405_-,
GACGATCTGGGCCG chr19:14224451-14224651_+,chr19:14224451-14224651_-,
GACGACCTACGTCG chr19:2924141-2924341_+,chr19:2924141-2924341_-,
GACGACCTACGTCG chr19:2924141-2924341_+,chr19:2924141-2924341_-,
GACGACCTACGTCG chr19:2924141-2924341_+,chr19:2924141-292

TCGGTTGTGCAACA chr6:65087956-65088156_+,chr6:65087956-65088156_-,
TCGGTCCCGTAACC chr7:26511916-26512116_+,chr7:26511916-26512116_-,
TCGGTCTGAGCCAA chr7:43640987-43641187_+,chr7:43640987-43641187_-,
TCGGTCCGCGTAGA chr9:144661799-144661999_+,chr9:144661799-144661999_-,
TCGGTAGGCTATTG chrX:133650355-133650555_+,chrX:133650355-133650555_-,
TCGGTCAATGCGTT chrX:2648297-2648497_+,chrX:2648297-2648497_-,
CGGTCGGTCGCAGC chr1:10248183-10248383_+,chr1:10248183-10248383_-,
CGGTCGAGTGCACT chr1:145008789-145008989_+,chr1:145008789-145008989_-,
CGGTCGCCTTGTCA chr1:199296535-199296735_+,chr1:199296535-199296735_-,
CGGTCGGACCAACG chr1:208922141-208922341_+,chr1:208922141-208922341_-,
CGGTCGTTTTCGTA chr1:244921291-244921491_+,chr1:244921291-244921491_-,
CGGTCGAATTCGCT chr1:46043771-46043971_+,chr1:46043771-46043971_-,
CGGTCGCTCATTGG chr10:125797764-125797964_+,chr10:125797764-125797964_-,
CGGTCTGTACCCGA chr10:73126186-73126386_+,chr10:73126186-73126386_-,
CGGTCGTCACTTCG chr11:397080-397280_+,chr11:39708

ACCGACGTCGGTTG chr11:69461575-69461775_+,chr11:69461575-69461775_-,
ACCGATGAGATTAG chr11:91170494-91170694_+,chr11:91170494-91170694_-,
ACCGACGCGACGGA chr13:33968660-33968860_+,chr13:33968660-33968860_-,
ACCGAGGATACACC chr16:74316546-74316746_+,chr16:74316546-74316746_-,
ACCGACCTATCTAG chr18:9355173-9355373_+,chr18:9355173-9355373_-,
ACCGAGACGAGACG chr22:32217837-32218037_+,chr22:32217837-32218037_-,
ACCGAGGTCCGCTA chr4:4304765-4304965_+,chr4:4304787-4304987_+,chr4:4304765-4304965_-,chr4:4304787-4304987_-,
ACCGACGGTACCAT chr5:180349083-180349283_+,chr5:180349083-180349283_-,
ACCGAAAGACGACG chr6:165232323-165232523_+,chr6:165232323-165232523_-,
ACCGAAAGACGACG chr6:165232323-165232523_+,chr6:165232323-165232523_-,
ACCGACCCACGCGC chr6:43908067-43908267_+,chr6:43908080-43908280_+,chr6:43908067-43908267_-,chr6:43908080-43908280_-,
ACCGATCCTACGCC chr7:25992468-25992668_+,chr7:25992468-25992668_-,
ACCGATCCTACGCC chr7:25992468-25992668_+,chr7:25992468-25992668_-,
ACCGAAGTCCACCG chr7:5356325-53

CGCCGCGATTTGCG chr13:19333277-19333477_+,chr13:19333280-19333480_+,chr13:19333277-19333477_-,chr13:19333280-19333480_-,
CGCCGCGATTTGCG chr13:19333277-19333477_+,chr13:19333280-19333480_+,chr13:19333277-19333477_-,chr13:19333280-19333480_-,
CGCCGGGATTTCGA chr15:39138940-39139140_+,chr15:39138940-39139140_-,
CGCCGGGACAATAG chr15:46784327-46784527_+,chr15:46784327-46784527_-,
CGCCGATTGGTCCG chr15:67274802-67275002_+,chr15:67274802-67275002_-,
CGCCGCTGTCGTAC chr16:30721507-30721707_+,chr16:30721507-30721707_-,
CGCCGCTGTCGTAC chr16:30721507-30721707_+,chr16:30721507-30721707_-,
CGCCGTCAGCACGA chr16:4644142-4644342_+,chr16:4644142-4644342_-,
CGCCGAACGGCGTG chr17:29260782-29260982_+,chr17:29260782-29260982_-,
CGCCGCGCTCCATT chr17:37795459-37795659_+,chr17:37795459-37795659_-,
CGCCGTCGAGCGGA chr17:77000160-77000360_+,chr17:77000160-77000360_-,
CGCCGGATTCCCGC chr17:9553177-9553377_+,chr17:9553177-9553377_-,
CGCCGTAGTCCGAC chr18:57641277-57641477_+,chr18:57641277-57641477_-,
CGCCGTAGTCCGAC chr18

CGCGCTGACGTCGC chr19:14532783-14532983_+,chr22:41892709-41892909_+,chr5:140632736-140632936_+,chr19:14532783-14532983_-,chr22:41892709-41892909_-,chr5:140632736-140632936_-,
CGCGCAATTAACGT chr19:1427258-1427458_+,chr19:1427258-1427458_-,
CGCGCAATTAACGT chr19:1427258-1427458_+,chr19:1427258-1427458_-,
CGCGCAATTAACGT chr19:1427258-1427458_+,chr19:1427258-1427458_-,
CGCGCCTTAATCGA chr19:1719475-1719675_+,chr19:1719475-1719675_-,
CGCGCAATCCTCCA chr19:2924265-2924465_+,chr19:2924265-2924465_-,
CGCGCAGCGGCTAA chr19:38477415-38477615_+,chr19:38477415-38477615_-,
CGCGCGTTTCTCGC chr19:53910655-53910855_+,chr19:53910655-53910855_-,
CGCGCGCACTCGCA chr2:105334686-105334886_+,chr2:105334686-105334886_-,
CGCGCCTACTACCG chr2:241717168-241717368_+,chr2:241717168-241717368_-,
CGCGCGGACGACGA chr2:60741374-60741574_+,chr2:60741374-60741574_-,
CGCGCTCCGCGGTA chr2:90793544-90793744_+,chr2:90793544-90793744_-,
CGCGCGGCGTTCGA chr20:37771430-37771630_+,chr20:37771430-37771630_-,
CGCGCGTCTACATA chr20:45191149-

TGCGACGTATAGCC chr8:28602555-28602755_+,chr8:28602555-28602755_-,
TGCGACGTATAGCC chr8:28602555-28602755_+,chr8:28602555-28602755_-,
TGCGAACAACCGGT chrX:9252828-9253028_+,chrX:9252828-9253028_-,
CAACGCGGGACGAT chr1:244728310-244728510_+,chr1:244728310-244728510_-,
CAACGCGGGACGAT chr1:244728310-244728510_+,chr1:244728310-244728510_-,
CAACGCGGGACGAT chr1:244728310-244728510_+,chr1:244728310-244728510_-,
CAACGCGGGACGAT chr1:244728310-244728510_+,chr1:244728310-244728510_-,
CAACGCGCGTACAT chr10:117682418-117682618_+,chr10:117682418-117682618_-,
CAACGCGCGTACAT chr10:117682418-117682618_+,chr10:117682418-117682618_-,
CAACGCGTAACGGA chr11:116787580-116787780_+,chr11:116787580-116787780_-,
CAACGCGTAACGGA chr11:116787580-116787780_+,chr11:116787580-116787780_-,
CAACGCGTAACGGA chr11:116787580-116787780_+,chr11:116787580-116787780_-,
CAACGTGCGCCGTC chr11:67385944-67386144_+,chr11:67385944-67386144_-,
CAACGCATAGCAAC chr13:27182227-27182427_+,chr13:27182260-27182460_+,chr13:27182227-27182427_-,chr13

TCGCGCCTCGGATA chr12:120280243-120280442_+,chr12:120280243-120280442_-,
TCGCGCATCGCCCA chr12:1659407-1659607_+,chr12:1659407-1659607_-,
TCGCGGTCCGCAGT chr12:2800863-2801063_+,chr12:2800863-2801063_-,
TCGCGTGGTACGTA chr12:62792077-62792277_+,chr12:62792077-62792277_-,
TCGCGCCGACTACC chr12:6480883-6481083_+,chr12:6480883-6481083_-,
TCGCGGCGCTCTAT chr12:6876683-6876883_+,chr12:6876683-6876883_-,
TCGCGCGAGGACAT chr12:94082605-94082805_+,chr12:94082605-94082805_-,
TCGCGCGAGAAGAA chr13:108316028-108316228_+,chr13:108316028-108316228_-,
TCGCGCGAGAAGAA chr13:108316028-108316228_+,chr13:108316028-108316228_-,
TCGCGAGAGACTTA chr13:20333513-20333713_+,chr13:20333513-20333713_-,
TCGCGGTTTGCCGT chr13:83228856-83229056_+,chr13:83228856-83229056_-,
TCGCGTGCGGACGG chr14:96780996-96781196_+,chr14:96780996-96781196_-,
TCGCGGATCGCCGA chr14:15168943-15169143_+,chr14:15168943-15169143_-,
TCGCGGATCGCCGA chr14:15168943-15169143_+,chr14:15168943-15169143_-,
TCGCGGATCGCCGA chr14:15168943-15169143_+,chr14:15168

TCGCGACCATCACC chr9:6686472-6686672_+,chr9:6686493-6686693_+,chr9:6686472-6686672_-,chr9:6686493-6686693_-,
TCGCGCTCTCGTTT chr9:101474874-101475074_+,chr9:101474874-101475074_-,
TCGCGCGTAGACTC chrX:105589589-105589789_+,chrX:105589589-105589789_-,
TCGCGTAGGGTCCA chrX:117217144-117217344_+,chrX:117217144-117217344_-,
TCGCGCGGCGAGCG chrX:135875997-135876197_+,chrX:135875997-135876197_-,
TCGCGAGCGAAAAA chrX:52206085-52206285_+,chrX:52206085-52206285_-,
CGCACGCTCGCGCG chr1:16272096-16272296_+,chr1:16272096-16272296_-,
CGCACTTCGGGACG chr1:25713251-25713451_+,chr1:25713251-25713451_-,
CGCACTTCGGGACG chr1:25713251-25713451_+,chr1:25713251-25713451_-,
CGCACGAATGGTTA chr1:62315137-62315337_+,chr1:62315137-62315337_-,
CGCACGCCCGCCGA chr10:22344667-22344867_+,chr10:22344667-22344867_-,
CGCACTAACGCGAA chr10:51001014-51001214_+,chr10:51001014-51001214_-,
CGCACGTGTTACCG chr11:68302146-68302346_+,chr11:68302146-68302346_-,
CGCACCCGTGGTTA chr12:127119116-127119316_+,chr12:127119116-127119316_-,
CGCACG

CGACGGAACGTTCC chr5:178535362-178535562_+,chr5:178535362-178535562_-,
CGACGGAACGTTCC chr5:178535362-178535562_+,chr5:178535362-178535562_-,
CGACGCGCGCACGC chr6:164779154-164779354_+,chr6:164779154-164779354_-,
CGACGGGTGGAACG chr6:26390579-26390779_+,chr6:26390579-26390779_-,
CGACGCGACCTTAA chr7:101690599-101690799_+,chr7:101690599-101690799_-,
CGACGCCCGCAGAC chr7:1401511-1401711_+,chr7:1401511-1401711_-,
CGACGTTTGACGTG chr7:160198406-160198606_+,chr7:160198406-160198606_-,
CGACGGAACGAGAG chr7:93375563-93375763_+,chr7:93375563-93375763_-,
CGACGCTGACGCTA chr7:97945421-97945621_+,chr7:97945421-97945621_-,
CGACGTCTATGGTA chr8:27041844-27042044_+,chr8:27041844-27042044_-,
CGACGTATAGCCAC chr8:28602555-28602755_+,chr8:28602555-28602755_-,
CGACGTCACGAACG chr8:98403579-98403779_+,chr8:98403579-98403779_-,
CGACGTCACGAACG chr8:98403579-98403779_+,chr8:98403579-98403779_-,
CGACGCCATTTCCT chr9:125474290-125474490_+,chr9:125474290-125474490_-,
CGACGCGATCGACT chr9:140599420-140599620_+,chr9:140599420

ACGCGTGCGCATTA chr19:36886635-36886835_+,chr19:36886635-36886835_-,
ACGCGTTCCAACGG chr19:37449666-37449866_+,chr19:37449666-37449866_-,
ACGCGGTGTCATCG chr19:38425574-38425774_+,chr19:38425574-38425774_-,
ACGCGGCGCTCTAC chr19:51613564-51613764_+,chr19:51613564-51613764_-,
ACGCGCCCGGTACG chr19:52534248-52534448_+,chr19:52534248-52534448_-,
ACGCGATACAAACT chr19:56005555-56005755_+,chr19:56005555-56005755_-,
ACGCGCTGCGAACG chr19:7653043-7653243_+,chr19:7653043-7653243_-,
ACGCGCAGTATTCG chr2:118575910-118576110_+,chr2:118575994-118576194_+,chr2:118575910-118576110_-,chr2:118575994-118576194_-,
ACGCGAAACGCCGA chr2:161695740-161695940_+,chr2:161695740-161695940_-,
ACGCGAAACGCCGA chr2:161695740-161695940_+,chr2:161695740-161695940_-,
ACGCGCCGTCGCCA chr2:166639248-166639446_+,chr2:166639248-166639446_-,
ACGCGCTGCGTCCT chr2:204627493-204627693_+,chr2:204627493-204627693_-,
ACGCGTCGTAGTGC chr2:232906417-232906617_+,chr2:232906417-232906617_-,
ACGCGTTTGTAGAG chr21:42489176-42489376_+,chr21:4248917

GCCGATCGATAACT chr1:232015281-232015481_+,chr1:232015281-232015481_-,
GCCGACGCCGTGCG chr1:248297462-248297662_+,chr1:248297462-248297662_-,
GCCGAAAGATTATG chr1:44734377-44734577_+,chr1:44734377-44734577_-,
GCCGACGTGGCGAC chr11:2789363-2789563_+,chr11:2789363-2789563_-,
GCCGAGCGCTCAAC chr11:86978700-86978900_+,chr11:86978700-86978900_-,
GCCGAGTACGCGTG chr12:111990131-111990331_+,chr12:111990131-111990331_-,
GCCGATGCGCAGCG chr15:68407949-68408149_+,chr15:68407949-68408149_-,
GCCGACGCGAGGTG chr15:95669876-95670076_+,chr15:95669876-95670076_-,
GCCGAGCGCCCGAC chr18:57641277-57641477_+,chr18:57641277-57641477_-,
GCCGAGACGCAGCG chr19:1828665-1828865_+,chr19:1828665-1828865_-,
GCCGATCCTCGACG chr19:35696201-35696401_+,chr19:35696201-35696401_-,
GCCGATCCTCGACG chr19:35696201-35696401_+,chr19:35696201-35696401_-,
GCCGATATCGATGG chr2:149417932-149418132_+,chr2:149417932-149418132_-,
GCCGATCTTGTATG chr20:51354422-51354622_+,chr20:51354422-51354622_-,
GCCGACTACGCCAC chr4:91292004-91292204_+,chr4:912

CGCGACTGGATCCC chr16:75132284-75132484_+,chr16:75132284-75132484_-,
CGCGAATCACGACC chr16:89639677-89639877_+,chr16:89639677-89639877_-,
CGCGAGATAGTGGA chr17:21713526-21713726_+,chr17:21713526-21713726_-,
CGCGATCTGCGGTA chr17:64896595-64896795_+,chr17:64896595-64896795_-,
CGCGAACCCACCAC chr17:82027827-82028027_+,chr17:82027827-82028027_-,
CGCGATTCGCGCGC chr18:37021811-37022011_+,chr18:37021811-37022011_-,
CGCGAGACAGATCT chr18:48915819-48916019_+,chr18:48915819-48916019_-,
CGCGATGACGTCGA chr19:13424141-13424341_+,chr19:13424141-13424341_-,
CGCGATCGTCTTCC chr19:15348342-15348542_+,chr19:15348356-15348556_+,chr19:15348342-15348542_-,chr19:15348356-15348556_-,
CGCGAATTGTGACG chr19:18706824-18707024_+,chr19:18706824-18707024_-,
CGCGAACGTCAACA chr19:23206512-23206712_+,chr19:23206512-23206712_-,
CGCGAACGTCAACA chr19:23206512-23206712_+,chr19:23206512-23206712_-,
CGCGATAACGGGAT chr19:4107307-4107507_+,chr19:4107307-4107507_-,
CGCGATAACGGGAT chr19:4107307-4107507_+,chr19:4107307-4107507_-,
CGCG

TTCCGCCGAGGCAA chr20:50452635-50452835_+,chr20:50452662-50452862_+,chr20:50452635-50452835_-,chr20:50452662-50452862_-,
TTCCGGGCGACGCA chr20:59128839-59129039_+,chr20:59128839-59129039_-,
TTCCGGTCGCCGCG chr22:46734924-46735124_+,chr22:46734924-46735124_-,
TTCCGCGACGGATT chr3:44777309-44777509_+,chr3:44777309-44777509_-,
TTCCGCGACGCTTA chr8:8810316-8810516_+,chr8:8810316-8810516_-,
ATCCGCTCGGTTAC chr1:120428181-120428381_+,chr1:120428181-120428381_-,
ATCCGGGAGACGCA chr1:178442746-178442946_+,chr1:178442746-178442946_-,
ATCCGCCTAATCGC chr1:229556798-229556998_+,chr1:229556798-229556998_-,
ATCCGTCCGGGAAC chr11:121955008-121955208_+,chr11:121955008-121955208_-,
ATCCGATCCATACG chr12:121221106-121221306_+,chr12:121221106-121221306_-,
ATCCGTGCACGCGT chr13:112135871-112136071_+,chr13:112135871-112136071_-,
ATCCGCGCCCAACG chr14:52446773-52446973_+,chr14:52446785-52446985_+,chr14:52446773-52446973_-,chr14:52446785-52446985_-,
ATCCGTACAGGTCG chr16:28499820-28500020_+,chr16:28499820-28500020_-,
AT

CGCGTAACGGACGC chr11:116787580-116787780_+,chr11:116787580-116787780_-,
CGCGTAGCGCCACT chr11:118630296-118630496_+,chr11:118630296-118630496_-,
CGCGTTGGTGGTTA chr11:12786282-12786482_+,chr11:12786282-12786482_-,
CGCGTCTTTACGTA chr11:43467245-43467446_+,chr11:43467245-43467446_-,
CGCGTCTCGTCTCG chr11:59085164-59085364_+,chr11:59085164-59085364_-,
CGCGTCAGAAGTGG chr12:112328126-112328326_+,chr12:112328126-112328326_-,
CGCGTACACTCATT chr12:115596584-115596784_+,chr12:115596584-115596784_-,
CGCGTAACACCAAA chr12:132917318-132917518_+,chr12:132917318-132917518_-,
CGCGTTCGGCGGGA chr12:1601580-1601780_+,chr12:1601580-1601780_-,
CGCGTCACGGCGAC chr12:1687439-1687639_+,chr12:1687439-1687639_-,
CGCGTACCATCGGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGCGTACCATCGGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGCGTGGTACGTAA chr12:62792077-62792277_+,chr12:62792077-62792277_-,
CGCGTCGGAGCACG chr13:112135871-112136071_+,chr13:112135871-112136071_-,
CGCGTTGGCGATGG chr13:76203827-76

CGCGTCGGCGATCC chr8:57525460-57525660_+,chr8:57525460-57525660_-,
CGCGTCTCCTTCCG chr9:112524413-112524613_+,chr9:112524413-112524613_-,
CGCGTCTTGACCGG chr9:14438572-14438772_+,chr9:14438585-14438785_+,chr9:14438572-14438772_-,chr9:14438585-14438785_-,
CGCGTAGCGACGCC chr9:29226355-29226555_+,chr9:29226355-29226555_-,
CGCGTAGCGACGCC chr9:29226355-29226555_+,chr9:29226355-29226555_-,
CGCGTAGCGCGCTG chr9:6686147-6686347_+,chr9:6686147-6686347_-,
CGCGTAGCGCGCTG chr9:6686147-6686347_+,chr9:6686147-6686347_-,
CGCGTTACATTTCG chr9:108589943-108590143_+,chr9:108589943-108590143_-,
CGCGTGTCGACGCC chrX:152607650-152607850_+,chrX:152607650-152607850_-,
CGCGTGTCGACGCC chrX:152607650-152607850_+,chrX:152607650-152607850_-,
CGCGTCGAATTCTG chrX:53333728-53333928_+,chrX:53333728-53333928_-,
CGCGTAGGCTAACC chrY:13812940-13813140_+,chrY:13812940-13813140_-,
GTCCGACTACCCGC chr1:155244869-155245069_+,chr1:155244869-155245069_-,
GTCCGTATCGGAGA chr1:244921061-244921261_+,chr1:244921061-244921261_-,
GTCCGACGAT

TCGACCAGCGCGCG chr19:53696937-53697137_+,chr19:53696937-53697137_-,
TCGACAGACTCGAC chr2:158591524-158591724_+,chr2:158591542-158591742_+,chr2:158591524-158591724_-,chr2:158591542-158591742_-,
TCGACGCCCCGGTC chr2:171999434-171999634_+,chr2:171999434-171999634_-,
TCGACGAGTTCTAT chr2:70975972-70976172_+,chr2:70975972-70976172_-,
TCGACGATTTCCGG chr20:59128839-59129039_+,chr20:59128839-59129039_-,
TCGACGTCTCGCGG chr22:30230190-30230390_+,chr22:30230190-30230390_-,
TCGACGTCTCGCGG chr22:30230190-30230390_+,chr22:30230190-30230390_-,
TCGACGTCTCGCGG chr22:30230190-30230390_+,chr22:30230190-30230390_-,
TCGACTACGTTATG chr22:36870268-36870468_+,chr22:36870268-36870468_-,
TCGACGTTGGCGGA chr22:43200566-43200766_+,chr22:43200566-43200766_-,
TCGACGCGCCCGGA chr3:141070276-141070476_+,chr3:141070276-141070476_-,
TCGACGCCTCCTTA chr3:44701266-44701466_+,chr3:44701266-44701466_-,
TCGACGGCTCGCGC chr4:130925807-130926007_+,chr4:130925807-130926007_-,
TCGACTCACGCGTT chr4:191507040-191507240_+,chr4:191507040-1

CGTACGACAGTTCG chr11:62563371-62563571_+,chr11:62563371-62563571_-,
CGTACGACAGTTCG chr11:62563371-62563571_+,chr11:62563371-62563571_-,
CGTACCATCGGCGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGTACCATCGGCGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGTACCATCGGCGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGTACCATCGGCGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGTACCATCGGCGC chr12:49866795-49866995_+,chr12:49866795-49866995_-,
CGTACGCGTACTTG chr12:51784946-51785146_+,chr12:51784946-51785146_-,
CGTACCATAACGCA chr13:101822693-101822893_+,chr13:101822693-101822893_-,
CGTACTTCCCGCCG chr13:109336974-109337174_+,chr13:109336974-109337174_-,
CGTACACTCGGGGA chr14:53404854-53405054_+,chr14:53404854-53405054_-,
CGTACAAAATGGCG chr14:63404477-63404677_+,chr14:63404477-63404677_-,
CGTACTCGTGCGCG chr14:88308471-88308671_+,chr14:88308471-88308671_-,
CGTACAAACCTACG chr15:24356112-24356312_+,chr15:24356112-24356312_-,
CGTACGCAGCACCG chr15:38318994-38319194_+

TAGCGAAGGGCGGA chr16:3391946-3392146_+,chr16:3391946-3392146_-,
TAGCGTCGTCCGCC chr17:36355607-36355807_+,chr17:36355607-36355807_-,
TAGCGAACACGACA chr17:68351370-68351570_+,chr17:68351394-68351594_+,chr17:68351370-68351570_-,chr17:68351394-68351594_-,
TAGCGGAGCTACGA chr17:84087340-84087540_+,chr17:84087340-84087540_-,
TAGCGACGGCCGTA chr19:17646176-17646376_+,chr19:17646176-17646376_-,
TAGCGCGCGTCGGA chr2:232146844-232147044_+,chr2:232146844-232147044_-,
TAGCGTTCGGGGTA chr2:237966007-237966207_+,chr2:237966007-237966207_-,
TAGCGCTCGGTTAT chr2:65445903-65446103_+,chr2:65445903-65446103_-,
TAGCGGCCCGCGAT chr20:2237644-2237844_+,chr20:2237644-2237844_-,
TAGCGGCCCGCGAT chr20:2237644-2237844_+,chr20:2237644-2237844_-,
TAGCGTGACGCGAC chr22:24164493-24164693_+,chr22:24164495-24164695_+,chr22:24164493-24164693_-,chr22:24164495-24164695_-,
TAGCGCGGGAAGCG chr22:30819861-30820061_+,chr22:30819861-30820061_-,
TAGCGCGGCGATGC chr3:167978566-167978766_+,chr3:167978566-167978766_-,
TAGCGTGGCGTTAG chr6:

GTCGTACGATCATC chr7:48573221-48573421_+,chr7:48573221-48573421_-,
GTCGTATGACTACG chr9:149532238-149532438_+,chr9:149532238-149532438_-,
GTCGTGCGATCGCG chr9:29226355-29226555_+,chr9:29226355-29226555_-,
GTCGTGCGATCGCG chr9:29226355-29226555_+,chr9:29226355-29226555_-,
GTCGTGCGATCGCG chr9:29226355-29226555_+,chr9:29226355-29226555_-,
GTCGTTCTACACGC chrX:149421155-149421355_+,chrX:149421155-149421355_-,
TCGCCTTCGATCGA chr1:145044200-145044400_+,chr1:145044200-145044400_-,
TCGCCGAGGTTCGG chr1:54767375-54767575_+,chr1:54767375-54767575_-,
TCGCCCATCAACGG chr10:11483661-11483861_+,chr10:11483661-11483861_-,
TCGCCCGACGCACA chr10:133147605-133147805_+,chr10:133147605-133147805_-,
TCGCCACGATCGCC chr10:22364425-22364625_+,chr10:22364425-22364625_-,
TCGCCCGCACGACT chr10:317671-317871_+,chr10:317671-317871_-,
TCGCCTACGGACGA chr10:53732984-53733184_+,chr10:53732984-53733184_-,
TCGCCTACGGACGA chr10:53732984-53733184_+,chr10:53732984-53733184_-,
TCGCCTACGGACGA chr10:53732984-53733184_+,chr10:53732984-

CGTTAAGCGCGGGA chr14:48934353-48934553_+,chr14:48934353-48934553_-,
CGTTAGTAAGTCGC chr14:49011353-49011553_+,chr14:49011353-49011553_-,
CGTTACTGCGGTCT chr15:87172399-87172599_+,chr15:87172412-87172612_+,chr15:87172399-87172599_-,chr15:87172412-87172612_-,
CGTTAGGGGTAAAG chr16:764721-764921_+,chr16:764721-764921_-,
CGTTAAGCCGGACG chr16:92565821-92566021_+,chr16:92565821-92566021_-,
CGTTAACGGAGCGC chr17:46446785-46446985_+,chr17:46446785-46446985_-,
CGTTAATCGGCCAA chr17:50942137-50942337_+,chr17:50942137-50942337_-,
CGTTACACGAAACG chr18:45861596-45861796_+,chr18:45861596-45861796_-,
CGTTACGCTACCGT chr18:45966153-45966353_+,chr18:45966153-45966353_-,
CGTTACGCTACCGT chr18:45966153-45966353_+,chr18:45966153-45966353_-,
CGTTAATTGTCTAG chr18:58064045-58064245_+,chr18:58064045-58064245_-,
CGTTACGCAGCGCG chr19:12323091-12323291_+,chr19:12323091-12323291_-,
CGTTACGCAGCGCG chr19:12323091-12323291_+,chr19:12323091-12323291_-,
CGTTACCCGCTAGA chr19:20097012-20097212_+,chr19:20097012-20097212_-,
CGTT

GCGAAGACGTACGA chr15:60994263-60994463_+,chr15:60994263-60994463_-,
GCGAATCGGTCCAA chr17:3620840-3621040_+,chr17:3620840-3621040_-,
GCGAAAGCGGTCCG chr2:143152537-143152737_+,chr2:143152537-143152737_-,
GCGAACCGAGCCGA chr3:120717369-120717569_+,chr3:120717369-120717569_-,
GCGAAACTAGCCGA chr3:13453279-13453479_+,chr3:13453279-13453479_-,
GCGAACGACAGGTA chr3:141070276-141070476_+,chr3:141070276-141070476_-,
GCGAACCTCACACG chr3:176181287-176181487_+,chr3:176181287-176181487_-,
GCGAATTAGACTGT chr3:195140461-195140661_+,chr3:195140465-195140665_+,chr3:195140461-195140661_-,chr3:195140465-195140665_-,
GCGAAATACGTCCG chr3:58218239-58218439_+,chr3:58218239-58218439_-,
GCGAAATACGTCCG chr3:58218239-58218439_+,chr3:58218239-58218439_-,
GCGAATGATCAAAG chr4:158671670-158671870_+,chr4:158671670-158671870_-,
GCGAATCGCGCCAA chr7:480116-480316_+,chr7:480116-480316_-,
GCGAACCTCACGGG chr7:6442480-6442680_+,chr7:6442480-6442680_-,
GCGAATAACCGCGC chrX:45259785-45259985_+,chrX:45259785-45259985_-,
CGAACGCCAC

TACGACCAGACGGA chr15:37876026-37876226_+,chr15:37876029-37876229_+,chr15:37876026-37876226_-,chr15:37876029-37876229_-,
TACGACATACGCTG chr16:2684463-2684663_+,chr16:2684463-2684663_-,
TACGACCGAGGCCA chr17:16978616-16978816_+,chr17:16978616-16978816_-,
TACGATTACGCGGG chr17:29660225-29660425_+,chr17:29660225-29660425_-,
TACGATTACGCGGG chr17:29660225-29660425_+,chr17:29660225-29660425_-,
TACGATTACGCGGG chr17:29660225-29660425_+,chr17:29660225-29660425_-,
TACGATTACGCGGG chr17:29660225-29660425_+,chr17:29660225-29660425_-,
TACGATTACGCGGG chr17:29660225-29660425_+,chr17:29660225-29660425_-,
TACGACGTCGCTTT chr17:39716768-39716968_+,chr17:39716768-39716968_-,
TACGAGCCATGTGC chr17:47805138-47805338_+,chr17:47805138-47805338_-,
TACGAATGCCGCGG chr18:2320886-2321086_+,chr18:2320886-2321086_-,
TACGAGTGCCGCGT chr19:32055451-32055651_+,chr19:32055451-32055651_-,
TACGATGCGGAATG chr2:227468099-227468299_+,chr2:227468099-227468299_-,
TACGACGTATCAGG chr2:55279942-55280142_+,chr2:55279942-55280142_-,
TACG

TACGCGTCGCGTAT chr7:141793480-141793680_+,chr7:141793480-141793680_-,
TACGCGTCGCGTAT chr7:141793480-141793680_+,chr7:141793480-141793680_-,
TACGCGTCGCGTAT chr7:141793480-141793680_+,chr7:141793480-141793680_-,
TACGCGCAACTGCC chr7:41854911-41855111_+,chr7:41854911-41855111_-,
TACGCGCGCTGTAC chr7:5091691-5091891_+,chr7:5091691-5091891_-,
TACGCTTGCGCGAG chr7:5091691-5091891_+,chr7:5091691-5091891_-,
TACGCTTGCGCGAG chr7:5091691-5091891_+,chr7:5091691-5091891_-,
TACGCCCTCGTGTG chr8:24690231-24690431_+,chr8:24690231-24690431_-,
TACGCTCGTTCAGG chr8:61409124-61409324_+,chr8:61409124-61409324_-,
TACGCGAACCAGCG chr9:106128300-106128500_+,chr9:106128300-106128500_-,
TACGCGCCGCAAAT chrX:112990172-112990372_+,chrX:112990172-112990372_-,
TACGCTAGCGCTGG chrX:39569120-39569320_+,chrX:39569120-39569320_-,
TACGGCCGCGGCGA chr1:159221239-159221439_+,chr1:159221239-159221439_-,
TACGGCCGCGGCGA chr1:159221239-159221439_+,chr1:159221239-159221439_-,
TACGGTGGTCGTGC chr1:38974845-38975045_+,chr1:38974845-389750

In [64]:
tsv.head()

Unnamed: 0,kmer,nKmer,gcKmer,null,nNull,gcNull,pretty,coor
0,CTTGGCGTAGTCCG,2,0.64,CGTAGCGTAGTCCG,1,0.64,.G.A..........,"chr15:87114925-87115125_+,chr15:87114925-87115..."
1,CTTGGCGAATATAG,2,0.43,CGTCGCGAATATAG,1,0.5,.G.C..........,"chr4:97936775-97936975_+,chr4:97936775-9793697..."
2,AAATTGCGCGTAAC,4,0.43,GAATCGCGCGTAAC,1,0.57,G...C.........,"chr3:100743096-100743296_+,chr3:100743099-1007..."
3,TTGGGCGCCGCAAT,2,0.64,TTGCGCGCCGTAAT,1,0.57,...C......T...,"chr11:2239158-2239358_+,chr11:2239158-2239358_-,"
4,TTGGGTTCGGCGAC,2,0.64,ATGCGTTCGGCGAC,1,0.64,A..C..........,"chr19:11489403-11489603_+,chr19:11489403-11489..."


## format kmer coordinates.  

In [77]:
explode_cols = ["coor"]
for col in explode_cols:
    tsv[col]=tsv[col].apply(lambda x: x.split(","))
    
# explode columns
tsv = tsv.explode(explode_cols)
# drop empty columns
tsv = tsv.loc[tsv.coor!= ""]

# drop strand annotation. Not useful here. 
tsv[col] = tsv[col].apply(lambda x: x.split("_")[0])

tsv = tsv.drop_duplicates()

In [78]:
tsv.head()

Unnamed: 0,kmer,nKmer,gcKmer,null,nNull,gcNull,pretty,coor
0,CTTGGCGTAGTCCG,2,0.64,CGTAGCGTAGTCCG,1,0.64,.G.A..........,chr15:87114925-87115125
1,CTTGGCGAATATAG,2,0.43,CGTCGCGAATATAG,1,0.5,.G.C..........,chr4:97936775-97936975
2,AAATTGCGCGTAAC,4,0.43,GAATCGCGCGTAAC,1,0.57,G...C.........,chr3:100743096-100743296
2,AAATTGCGCGTAAC,4,0.43,GAATCGCGCGTAAC,1,0.57,G...C.........,chr3:100743099-100743299
3,TTGGGCGCCGCAAT,2,0.64,TTGCGCGCCGTAAT,1,0.57,...C......T...,chr11:2239158-2239358


In [79]:
tsv.to_csv(TSV_MUT, sep='\t', index=False)