# Generate and visualize filter strengths

In [1]:
# Enable IPython's autoreload extension; mode 2 reloads imported modules
# before each cell executes, so edits to project code are picked up
# without restarting the kernel.
%load_ext autoreload
%autoreload 2

import sys
# Add "../" to the module search path (presumably so the `src` package can be
# imported — TODO confirm; the entry is relative, not an absolute path).
sys.path.append("../")
import os
# Move the working directory up one level. The relative "data/..." paths
# passed to get_vis_data in later cells are resolved against this directory.
# NOTE(review): this is a relative chdir, so re-running this cell without
# restarting the kernel moves up one more directory each time.
os.chdir("..")
import pandas as pd
import matplotlib.pyplot as plt
from src.vis_data import get_vis_data

  from .autonotebook import tqdm as notebook_tqdm


## 1. Generate and save filter strengths

In [2]:
def sum_strength(d):
    """Return the total strength stored in a nested activation tree.

    A node that has a "strength" key is treated as a leaf and its value is
    returned as-is (any "children" it may also have are ignored). Otherwise
    the strengths of all entries in the node's "children" are summed
    recursively, in order.

    Args:
        d: Mapping with either a "strength" entry or a "children" iterable
            of mappings of the same form.

    Returns:
        The node's own strength, or the sum over its children (0 when the
        children collection is empty).

    Raises:
        KeyError: If a node has neither "strength" nor "children".
    """
    # Membership test directly on the mapping; no need to build a keys view.
    if "strength" in d:
        return d["strength"]
    # Generator expression: same left-to-right summation, no temporary list.
    return sum(sum_strength(child) for child in d["children"])

In [2]:
# (exon sequence, json_file) pairs, processed in the order listed.
# Each call rebinds json_data, so only the result for the last pair
# remains available after this cell.
exon_json_pairs = [
    ("GCGGCACCTACTACAATGTCCCCCGCTGCATACACTCGGAGCCAATAGGGCGCCTATAGAGTGTAGTCCT", "data/teaser.json"),
    ("GAGTCCCGCTTACCATTGCATTTAAGAAAGCGGCCATACGCCGCTAAGACCCTACTCTTCAGAATACCAG", "data/exon_s1.json"),
    ("CCTTCCACGCCTCTCCCACTCGTTACACTCAGTTGCAGTATGGTTAACACTCCACTAGGCCCCAGGAATC", "data/exon_s1_comp1.json"),
    ("GTCTGACAGTACTACGCTAATACTACGTAAACCAAAGCCATAATCCAATTGACCTCCTTTTCAGGAATTC", "data/exon_s1_comp2.json"),
    ("GAGTCCCGCTTACCATTGCATTTAAGAAAGAGGCCATACGCCGCTAAGACCCTACTCTTCAGAATACCAG", "data/exon_s1_34c>a.json"),
    ("GAGTCCCGCTTACCATTGCATTTAAGAAAGAGGCCATACGCCTCTAAGACCCTACTCTTCAGAATACCAG", "data/exon_s1_34c>a_46g>u.json"),
    ("GACTATGAGCCCCAACGAACAAGCTCCTATCTGGGAACTCTTTTCTGCAGACTTTAACCCTACCCCCAGA", "data/exon_d1.json"),
]
for exon, json_file in exon_json_pairs:
    json_data = get_vis_data(exon=exon, json_file=json_file, threshold=0.001)



In [3]:
# json_data from this call is what the following cells inspect.
json_data = get_vis_data(
    exon="GCGGCACCTACTACAATGTCCCCCGCTGCATACACTCGGAGCCAATAGGGCGCCTATAGAGTGTAGTCCT",
    json_file="data/exon.json",
    threshold=0.001,
)



In [5]:
# Display the "delta_force" entry of the most recently computed json_data.
json_data["delta_force"]

-16.2321506754854

In [6]:
# Total strength of the first child of "nucleotide_activations" minus that of
# the second child, plus "incl_bias" (presumably a cross-check against
# json_data["delta_force"] — confirm).
nucleotide_children = json_data["nucleotide_activations"]["children"]
(
    sum_strength(nucleotide_children[0])
    - sum_strength(nucleotide_children[1])
    + json_data["incl_bias"]
)

-16.2142274712114

In [7]:
# Total strength of the first child of "feature_activations" minus that of
# the second child (no bias term is added here).
feature_children = json_data["feature_activations"]["children"]
(
    sum_strength(feature_children[0])
    - sum_strength(feature_children[1])
)

-16.214227471211387

## 2. New groupings

In [11]:
# Same seven exon sequences as in section 1, now with use_new_grouping=True
# and "data/correct_*.json" as json_file. Processed in the order listed;
# json_data ends up holding the result for the last pair.
new_grouping_pairs = [
    ("GCGGCACCTACTACAATGTCCCCCGCTGCATACACTCGGAGCCAATAGGGCGCCTATAGAGTGTAGTCCT", "data/correct_teaser.json"),
    ("GAGTCCCGCTTACCATTGCATTTAAGAAAGCGGCCATACGCCGCTAAGACCCTACTCTTCAGAATACCAG", "data/correct_exon_s1.json"),
    ("CCTTCCACGCCTCTCCCACTCGTTACACTCAGTTGCAGTATGGTTAACACTCCACTAGGCCCCAGGAATC", "data/correct_exon_s1_comp1.json"),
    ("GTCTGACAGTACTACGCTAATACTACGTAAACCAAAGCCATAATCCAATTGACCTCCTTTTCAGGAATTC", "data/correct_exon_s1_comp2.json"),
    ("GAGTCCCGCTTACCATTGCATTTAAGAAAGAGGCCATACGCCGCTAAGACCCTACTCTTCAGAATACCAG", "data/correct_exon_s1_34c>a.json"),
    ("GAGTCCCGCTTACCATTGCATTTAAGAAAGAGGCCATACGCCTCTAAGACCCTACTCTTCAGAATACCAG", "data/correct_exon_s1_34c>a_46g>u.json"),
    ("GACTATGAGCCCCAACGAACAAGCTCCTATCTGGGAACTCTTTTCTGCAGACTTTAACCCTACCCCCAGA", "data/correct_exon_d1.json"),
]
for exon, json_file in new_grouping_pairs:
    json_data = get_vis_data(
        exon=exon,
        json_file=json_file,
        threshold=0.001,
        use_new_grouping=True,
    )

In [2]:
# Note: this sequence is written with U rather than T.
json_data = get_vis_data(
    exon="GCGGCACCUACUACAAUGUCCCCCGCUGCAUACACUCGGAGCCAAUAGGGCGCCUAUAGAGUGUAGUCCU",
    json_file="data/teaser_18.json",
    threshold=0.001,
    use_new_grouping=True,
)



In [2]:
# Two exons targeting "data/max_incl_class.json" and "data/max_skip_class.json";
# json_data keeps the result of the second call.
max_class_pairs = [
    ("CCGCGACCGGAUUAAGAUGAAGGAACGAAGCAAUUGUCGAAUCUACUCUAAUCUGCUCGAAGAUCAGAAC", "data/max_incl_class.json"),
    ("AGAUGUCGAUCCCCAUUAAUCAACCCCUCUCCUUAUAUUAUCCCCAUAUUCACAAAACUGUUUGCUAAAA", "data/max_skip_class.json"),
]
for exon, json_file in max_class_pairs:
    json_data = get_vis_data(
        exon=exon,
        json_file=json_file,
        threshold=0.001,
        use_new_grouping=True,
    )

In [3]:
# Two exons targeting "data/max_incl_feature.json" and
# "data/max_skip_feature.json"; json_data keeps the result of the second call.
max_feature_pairs = [
    ("CCGCGACCGGAUUAAGAUGAAGGAACGAAGCAAUUGUCGAAUCUACUCUAAUCUGCUCGAAGAUCAGAAC", "data/max_incl_feature.json"),
    ("CCACUCACCGCCGCCGGUGUCCUGGCAUACUCAUUAUCGCAACCCCGACGCGGCCCACUUGGGUCGCGGC", "data/max_skip_feature.json"),
]
for exon, json_file in max_feature_pairs:
    json_data = get_vis_data(
        exon=exon,
        json_file=json_file,
        threshold=0.001,
        use_new_grouping=True,
    )



In [4]:
# Two exons targeting "data/max_incl_feature_pos.json" and
# "data/max_skip_feature_pos.json"; json_data keeps the result of the second call.
max_feature_pos_pairs = [
    ("AGUCUCUUGGAAUCGCGCCCGACAUCUUACCAGUAAAAUCGGUGCUCCAGGGCCACGAUCUUCGACACCA", "data/max_incl_feature_pos.json"),
    ("GCUCGCAACCAGCCGCCUACCUAUUAAUUGUCUGUGCUCCAAGAAUUACAGCUAGCAAUUUAGGUACCAA", "data/max_skip_feature_pos.json"),
]
for exon, json_file in max_feature_pos_pairs:
    json_data = get_vis_data(
        exon=exon,
        json_file=json_file,
        threshold=0.001,
        use_new_grouping=True,
    )

In [2]:
# Single exon with the new grouping, json_file "data/exon_d1_18.json".
json_data = get_vis_data(
    exon="GACTATGAGCCCCAACGAACAAGCTCCTATCTGGGAACTCTTTTCTGCAGACTTTAACCCTACCCCCAGA",
    json_file="data/exon_d1_18.json",
    threshold=0.001,
    use_new_grouping=True,
)

## 3. Different exon lengths

In [5]:
# Exons of 140, 83 and 20 nucleotides, all run with dataset="ES7" and the new
# grouping. Processed in the order listed; json_data keeps the last result.
length_variant_pairs = [
    ("ATATTGTTGACGGTCAATTATATGGGCTCATATGATAGCACCTGTCGAGATGTTTAAGGCATAAGGAGCTGACGTTGGCCTCAGTATTATAGTGCAGCAACGGATTGTGCATAATCGTGTATGAATCCGAGGATTTGGCG", "data/exon_length_140.json"),
    ("TCAAACAGGCGTAACATATTCATTAAAGCCGTTGCACATGGAGCTGAGATATACACAGGAACGAACCGTTTACGTTAATGGGA", "data/exon_length_83.json"),
    ("ATGAAATCCATTCCACAGCA", "data/exon_length_20.json"),
]
for exon, json_file in length_variant_pairs:
    json_data = get_vis_data(
        exon=exon,
        json_file=json_file,
        threshold=0.001,
        use_new_grouping=True,
        dataset="ES7",
    )

