#Imports and functions

In [1]:
"""
from google.colab import drive
drive.mount('/content/drive')
"""

Mounted at /content/drive


In [2]:
!pip install captum
!pip install transformers
!pip install pybedtools

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting captum
  Downloading captum-0.6.0-py3-none-any.whl (1.3 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m1.3/1.3 MB[0m [31m19.5 MB/s[0m eta [36m0:00:00[0m
Installing collected packages: captum
Successfully installed captum-0.6.0
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting transformers
  Downloading transformers-4.30.1-py3-none-any.whl (7.2 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m7.2/7.2 MB[0m [31m56.0 MB/s[0m eta [36m0:00:00[0m
Collecting huggingface-hub<1.0,>=0.14.1 (from transformers)
  Downloading huggingface_hub-0.15.1-py3-none-any.whl (236 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m236.8/236.8 kB[0m [31m22.0 MB/s[0m eta [36m0:00:00[0m
Collecting tokenizers!=0.11.3,<0.14,>=0.11.1 (from transformers)
  Downloading tokenizers-0

In [3]:
import numpy as np
import pandas as pd
import pybedtools
from transformers import BertTokenizer, BertForSequenceClassification, BertConfig
from captum.attr import visualization as viz
from captum.attr import IntegratedGradients, LayerConductance, LayerIntegratedGradients
from captum.attr import configure_interpretable_embedding_layer, remove_interpretable_embedding_layer
import torch
import matplotlib.pyplot as plt

In [4]:
from transformers import AutoTokenizer, BigBirdForSequenceClassification, AutoModelForSequenceClassification, AutoModel

tokenizer = AutoTokenizer.from_pretrained('/content/drive/MyDrive/SE_annotation_project/bulk/results_bert/bigbird_base')
model = AutoModelForSequenceClassification.from_pretrained('/content/drive/MyDrive/SE_annotation_project/bulk/results_bert/bigbird_base')

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
model.to(device)
model.eval()
model.zero_grad()

In [5]:
def predict(inputs):
    return model(inputs)[0]

def construct_input_ref_pair(text, ref_token_id, sep_token_id, cls_token_id):

    text_ids = tokenizer.encode(text, add_special_tokens=False)
    # construct input token ids
    input_ids = [cls_token_id] + text_ids + [sep_token_id]
    # construct reference token ids
    ref_input_ids = [cls_token_id] + [ref_token_id] * len(text_ids) + [sep_token_id]

    return torch.tensor([input_ids], device=device), torch.tensor([ref_input_ids], device=device), len(text_ids)

def construct_input_ref_token_type_pair(input_ids, sep_ind=0):
    seq_len = input_ids.size(1)
    token_type_ids = torch.tensor([[0 if i <= sep_ind else 1 for i in range(seq_len)]], device=device)
    ref_token_type_ids = torch.zeros_like(token_type_ids, device=device)# * -1
    return token_type_ids, ref_token_type_ids

def construct_input_ref_pos_id_pair(input_ids):
    seq_length = input_ids.size(1)
    position_ids = torch.arange(seq_length, dtype=torch.long, device=device)
    # we could potentially also use random permutation with `torch.randperm(seq_length, device=device)`
    ref_position_ids = torch.zeros(seq_length, dtype=torch.long, device=device)

    position_ids = position_ids.unsqueeze(0).expand_as(input_ids)
    ref_position_ids = ref_position_ids.unsqueeze(0).expand_as(input_ids)
    return position_ids, ref_position_ids

def construct_attention_mask(input_ids):
    return torch.ones_like(input_ids)

def custom_forward(inputs):
    preds = predict(inputs)
    return torch.softmax(preds, dim = 1)[0][1].unsqueeze(-1)

def summarize_attributions(attributions):
    attributions = attributions.sum(dim=-1).squeeze(0)
    attributions = attributions / torch.norm(attributions)
    return attributions

In [6]:
def dataframe_creation(attributions_sum, all_tokens, start, chrom):
  short_a_s = attributions_sum[0:len(all_tokens)]
  df = {'tokens':all_tokens, 'score':short_a_s}
  df = pd.DataFrame.from_dict(df)
  df = df[1:len(df)-1]
  starts = [start]
  ends = []
  l=list(df.tokens)
  for i in range(len(l))[1:]:
    starts.append(starts[i-1]+len(l[i-1]))
    ends.append(starts[i])
  ends.append(starts[-1]+len(l[-1]))
  df['chromStart'] = starts
  df['chromEnd']= ends
  df['chrom'] = [chrom]*len(df)
  return df

def bed_file_creation(df, filename):
  df_pos = df[df['score']>=0]
  df_neg = df[df['score']<0]
  mult = 1000/max(max(df_pos['score']), abs(min(df_neg['score'])))
  df_neg['score']= df_neg['score']*mult*(-1)
  df_pos['score']= df_pos['score']*mult
  pos_data = pd.DataFrame()
  pos_data['chrom'] = df_pos['chrom']
  pos_data['chromStart'] = df_pos['chromStart']
  pos_data['chromEnd'] = df_pos['chromEnd']
  pos_data['name'] = df_pos['tokens']
  pos_data['score']  = df_pos['score'].astype(int)
  pos = pybedtools.BedTool.from_dataframe(pos_data)
  pos.saveas(filename+'_pos.bed')
  neg_data = pd.DataFrame()
  neg_data['chrom'] = df_neg['chrom']
  neg_data['chromStart'] = df_neg['chromStart']
  neg_data['chromEnd'] = df_neg['chromEnd']
  neg_data['name'] = df_neg['tokens']
  neg_data['score']  = df_neg['score'].astype(int)
  neg = pybedtools.BedTool.from_dataframe(neg_data)
  neg.saveas(filename + '_neg.bed')

#SE_67479

The text is SE_67479 from SEdb v2.0, 11.06.2023 18:00

In [None]:
text = 'AAAGGTTTGGAGAGGGAGGTCCTAGTGAGGCTGAACAGAGGTAAAATAAACAGAAAGTTCCAGGCTCTCCTTGCTTCTACTTAAGAAAAATCAGAGCAGTAAATCCCAAACCAGTTCTGCCCACAACTCAAATGCAGATGAGCATCCCTTGCTCCATCTATGCAGGAAAGCCATAGTGTGGGGCTGTAGGACTATGGAGTCAGCCTCTGCAAGCAACAAGGCTCAGAGGCTGAGGGGCTTCAGGCCCCAGCAAAACCCAGTGATCCTGTTGTCAAATCTGAATGTCATCATCTGCCTCCAGGGCGACCAGCTCTGGATGGGGGTGTCAGGGTCAGGATCCTGTTCCATGTGGCAAGAGCTTGGGGAAGCTGCTGCAGGCCTACTGATGACCTTCTTTCCTGGCCCAGACACTCTTAAAAACTTCCTGGCGAGGGAGGCAACACACCTTATTGTGCAGCCCTCATCGAACGCATCAGCTGCACTAAGTGCTGAAGAAAAGTTCCCATAATAACCATGTGTGATAATAAAAAGATAAAGAGGCAAATAGGTATGTAGGTCAGCTCAAAAATAGCCACCCACCCGCCTGGCCTGGGTAGCCCTTTGTGCCAAGTGGGTAGAAAGGTTTTCCTTGCTTCCCTTCCCAAGCTGATGCCCCCTGCACTTTTCAAGGTTGCCTTAAATACAACTCCTTCCTGCACTAGCTGGGGTAGCCAGGGCAGTAGGGACTGCAGCCCTACAGGGGCAGCCCTGCGCTCCCTCCACCAAATCAATCCTGGGGTCAGAGGGCACAAAGGCTTGGCCTCTCTGACGTGAGTTCTCGGGGCTAAGTCAGGGTTTAGGGTAGTGAGTCACAGACATTCTTTCCCCCATCCCTTAGGGTTTGCGCACACCCAGGAAGCCTTCCCCTCCCCAACAGAGACCGCTTTGTTAGCACGACCCACCCGGTTGGAGAAGAGTTACAGCCTCAGGGGTGTGAGGGCCTCCTCGGCCTCTCCCTCCCTCCCCCTCTCTCCTCTCTAGGGCTCTCACCAGAAAGGCGCCAACCCTGCGCCCTGCCCCCACCCAGCCGCCGGGGCCCCAAATGCTGAGCTCAGCATCTCTGTGGCCTGGCTGCCCTCCTCCCGGGCAGTGGGAGGAGCCTCCTTCCTCCCGAGGGTGGGCGGGGCCAGGGCCAGCCCCGCCCTCCTCCCCGTTCCCCCTCTCCCTCCATCCCCCTCCCGTTCCTCAGTCGCACGTTCTCCAAGTCACGTCCCCCGCTTCCCCTAGTAGGGGGTCGACGGAGATTGGACCCTTCCCCCAGTCAGCTGCTCTGCATCTGTCACCTCGGCGGCAGCGCTCCCTTGAGGTCGCACCTCCGCTGTGGAGGGAGGCGAGAGCGAGCTGAGTGGGGGGTCTTCCCTTCCCCCATCCCGCTGGCCCCAGACAAGCCACCGCAGACCGCGGCGAAATCAGTTAAGCTCTTGCGTGCACCAGTTCCCGGAGCAGAGTCTGAAAGTTTTTGTGTTTCTGTGCGGCTACTTTTAAGTATAAAAAATTCAGCAGTGGCTCCTGGGTGCCTATGTCAGCGTCTGGCCCTTTGTGGATTACGTACGGGACAACTGGGGTGGGGAAGGGCCCCTCTTCACAGGCAGCAATTCCCAGAGTGGCCTTCCTATGGGACCCCAGAGCTCCCAGGGGGAGGATCCCAGAGGGGGATATGGTAACAGAATCACTGTCACTTCTGGGATTGAGGGTGGCAGCTAAAGGGAAACCCCTCGAGTGTCAGTCGGACTTGCCATTTGAGTCAGCACTGCTAGGTGCTGCTGAATTCTGCAGGGGGAGGAAGAACCTGATCAGATAAAACAAGGGCTGACCTAGAGAAAGTCTCTTGGGTCAACATATTCTTAGCGATAACAGAAGATCACTCCAACTGTTCTACACCCCACCCTACAACATTGACCCCCCGCTTTCCAGCATTTACAGTCCCTTTTAGTTTACAACTAAGAGTATGGGTTGCCTGGGATCAGGAAATGAGCCTAGATGTAGAGTCCTGGCTCCAGCCTTGCTGACACTATGTGACTCACTGCACCTATCTGAATCTCAGTTTTCTCACCTGTGCAGTGACATTGATGAGGTCTGTCCTGCCTACAAACTCTACACACATATATTAGTTGTTGTTTTTTAATTTTTAGTAGAGATGGGGTTCTCACAACTTGCCCCAGGCTGGTTTGAACTCCTGGATTCAAGCAATCCTCCCATCTCCACCTCCCAAATGCTGGGATTACAGGTGTGAGCCAGTGTACCAGGCCAGTATTATGCTGGGATTACAGGTGTGAGCCACCATACCAGGCCTTTATTTTTGTTTTGTTGGTTTGTTTCGTTTTTGTTTGAGATAGCGTCTCACTCTATCACCCAGGCTGGAGTGCAGTGGAACGATCTTGGCTCACCGCAACCTCCGCTTCCCGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCAGGTAGCTGGGATTACAGGTGCATGCCACCAAACCTGGGTAAATTTTGTATTTTTAGTAGAGACAGGGTTTCACTATGTTGGCCATGCTGGTCTCAAACTCCTGGCCTCAAGTGATCCACTCGCCTCAGCTTCCCAAATCATGTGCTGGAATTACAGGTGTGAGCCACTGCCCAGCCTAAGTCTTTTTTTTTTTTTTTTTTTTTTTTGAGACAGAGTCTTGCTTTTTGACCCAGGCTGGAGTGCAGTGGCACAATCTCAGCTCACTGTAACCTCAGCCCCCTGGGCTCAAGTGATTTTCCCACCTCAGCCTCCCAAGAAGCTGGGAATACAGATACACTCTACCATGTCCAGCTAACTTTTTGTCTCTTTAGTAGAGATGGGATTTCACCATGTTGGCCAGGCTGGTCTTGACCTCCTTGACTCAAGTGATCTGCCCACCTTGGCCTCCCAAAGTGCTGAGATTACAGGCATGAGCCACCATGCCCAGCCTCCAGTTGTTATTTTTATTAACAAAGTTATGAAAATCCTTTAGAACATGTGGAAAAAGACAAAAAGTTATAAGGCTGGGTGCAGTGCCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGAGGTGAGCAGATCGCCTGAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGTGAAACCCTGTCTTTACTAAAAATACAAATATTAGCCAGGCATGGTGGCGGGCACCTGTAATCCCAGCTACTTAGGAGGCGGAGGCAGGAGAATCGCTTAAATCCAGGAGACAGGTTGCAGTGAGCCACGATCGTGTCCAGCCTGGGCAACACAAGACTCCATCTCAAAATTAAAAAAAAAAAAAGTTATGAAAGCCCTAAAAAATATGGAAGTGTGTTTTTTTGTTTGTTTTGGTTTTTTTGAGACGGAATTTCACACTGTTGCCCAGGCTGGAGTCTAGTGGCGCGATCTAGGCTCACTGCAACCTCTACCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACCGGCGCCCGCCAGCACGCACGGCTAACTTTTTCTATTTTTAGTAGAGATGGGGTTTTACTATTTTGGCCAGGCTGGTCTCAAACTCCTGACCTCATGATCCGCCTGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTGCCAGGCCTGTGCAAGTGTTTTTAGAATCCTGAAGCGCTCCATAAGGGTCAATGATCTTTGTGAGGAGGCTGGTGCGGTGGTTCACGCCTGTAATCCCAGCACTTTGGGAGGCTGAAGGGGGCAGATCACCTGAGGTCAAGAGTTTGAGACCAGCCTGGCCAACGTAGTGAAACCCTGTCTCTGTTGAAAATACAAAAATAAACCGGGCGTGGTAGTGCATTCCTGTAATCTCAGCTACTCGGGAGGCTGAGGCAGGTGAATCCCTTGAAGCCGGGAGGCAGAGGTTGCAGTAAGCTGAGATTGCACCACTTGTACTCCAGCCTGGGTGACAGAGTGAGACTCCACCTCAAAAAAAAAAAAAGATCTTTGTGAAGAGATGGCAAATTGCCAGGTGGGCTGGCAGCTTCCATTTCCTGCCAGCCCAGGTGTTCCAGAGAAAGGCTCAGCATGCAGACCTGGGCAGCTGCCTTTTGCCTAGACTTGAGTTTCCCAAGCCTTTGACTATTAAGGCCACTGGAGATAAAATGCACTTCTGAGTGAGGTTAGAGGCATCGCAGAAGGGTGATGAAGGAGACCAAAGCCAGGGAGAAGAAAGTTCCAGAGGATTGAGTGGGGCCTAACTGCCAGGAGAGAGGGAGATCCTGGAACCTCCTAAGGCTCCCTGCCCTGTCAGTTCCTTGTCCATAAAGTGGGGGAGGTTGGGGGCTGGAAGGAGTACTCTCTTAGGACCTGCTTATCTTAACATTAAAAGATTTTAGCCGGGCATGGTAGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCTGAGGCGGGCAGATCACCTGAGGTTGGGAGTTTGAGACCAGGCTGACCAACATGGAGAAACCCCATCTCTACTAAAAATACAAAAAAGTTAGCCAGGTGTGGTGGCACATGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCGCTTGAACCTGGGAGGCGGAGGTTGCGGTGAGCCAAGATTGCGCCATTGCACTCCAGCCTGGGCGACAAGAGCGAAACTCCATCTCAAAAGAAAAGAAAAAAAGAAAGATTTTAAGGTTCATTCTACTGACAGAAGAATCCTGACAGTGAGAAGGCTGACCCTTCTCTCTGCTGATCTAGCTCTACTCACCCCAGCCCTTTGGGAAACGCAGAGGCTAGACAGGTCCTCCTGGTCTCCTTTCTTCTCTAGAAGGAAAAACAACAACAATAGAGTGAGCTCATTTTGCTGTCCAGACAAATGATGAGCCTGGGTTTGGGCTTTCCCAACTGTGGCAGGTCCTGATCATCTCTGTCATCCCCTGTCATATACTCCCTAGGCTGGTGGAAAAACCCCCATCCCTGCTTCCCCCTTTGTTATATGGATATCAACAATATTTCCATATTGTAAACCAATTGGAAGCCCTCAAAAGGCAAAAGCACTGAAATGGCTGAAATGCCTATTTCTACCTTCTCTGGCAGGCCTCCTGCAGAGAGTCCTATGGGCTAGGACTGGGGTTTGGGGGAAAGCAGCTCCATGGAATGTATTATATCTTTCTCCTTTGCTATGATCCTTGTAGAGGTTGAAGAGGTCTTTGAGATTCTCTAGTTCCGTGTTTTCAAAACTGAGGTATGAAGGCCGGGCTTGGTTACTCACGCTTGTAATCCCAGCACTTTGGGAGGCCGAGGCAGGCAGATTACTTGAGGCTAGGAGATAGAGACCAGCCTGGCCAACATGGCAAAACCCCGTCTCTACTAAAAATAAAAAAATTAGCCAGGCGTGGTGGCGCATGCCTGTAATCCCAGCTACCCGTGAGGCTGCGGCAGGAGAATCTCTTGAACCTGGGAGGCAGAGGTTGCAGTGAGCTGAGATATCGGCACTGCACTCCAGCCAGGAGGACAGAGCGAGACTCTGTCTCAAAAAAGAAAAAAAAAGTTTTTTTCTTTTTTTGGAGGGAGAAATTAAGTAATTTAACTAGTAAGTAATCTAAACATTTGCTACTGAAATTAACACAGATAAAATATATAATAAAATGCAAAATTGTGTTATTTGTAATAAAAATTCTGGGCTTCAAAGACATGGTATGCTTCCTGGGGGCTGCTTCTGGGCCACAGCCCAGACTCCGATCCATCCTTAGTGGCCAAACAGCCTGCAACTAAGGTCTGCTGACTCCTATCCTCTCACTCCACAGGGCCTGAGCTAGCCGAGGTTTAAGAGACTCACTAGAGAGAGGGGGTTGCCTAGCCCTCCCTGCACTTCATTGCTTTCTCTCCTCATAAGGATTCAGAACCTAGGATTGGAGAGGGATCTTAGTAATGGCTGGCAGAAACCTGGCCTCTAAGTGGATGGGATTCCTTACTGACAGTCAGTGGGACAGGTGAGGAGAAAAGAGACAGTGCCGGAGTCAGAAGGACGAGGTTCCAGGCCTGGCTGGGTCCCTAGGACAACTCATTTGACCACGCGGGCTGGAGACGGGTGGGCTGCATGAAGTCTGGTAGGCTGTCTGTGCCTTTGCTACTGCTGGGATACAGAGGTCTGCCAGAATCCTCAGGCTACTCTCTCAGCTCTCAAAACCCTTATCCCTTGGCATGGGTGGTTTATCAACCTAGCCCTTTGTGGGGTTCCCACTGCCCTGCCCTCTCCCCAGAGGAAATGACTTCTTGGGAAACCTAGGACCCCAGGCAGAACCAGGCAGAACTGGTTGTCTGTGAGCTCACCTTTGTCACGTGTGAGCCCTGTCTACACAGCTGCAAGCTCTCACCCACCCCTAACCCAACCAGGCCTATCTTTCTTTCCTAGAGGTCAATAAGCACCCCAACTAAAGATAAGCATCAGAATCGCCTGGAGAATTTTGCTCCTAAGGACCCCACCCAGACCTACCCAATCAGAATGGGGGTTGAGGAGATGAGAATCTCGGTTTTACAAGCTCCTCAGCTGATTCTAATTTTTTTTTTTTTGAGATGGAGTCACACTCTGTTGCCCAGGCTGGAGTGCAATGGCGTGATCTCAGCTCACTGCAATATCTGCTTCCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCTGAATAGCTGGGGCTACAGGGGTGTCCCACCACACCCAGCTAATTTTTGTATTTTTAGTAGAGATCAGGTTTCACCATGTTGGCCAGGCTGGTCTTGAACTCCTGACCTCGTGATCCGACCGCCTTGGCCTCCCAAAGTGCTGGGATTATAGGCATGAGCCACCACACCCAGCCTGATTCTAATTATTAATCAGACTTGAAATGAAAGCCACTGGTTCACGGAGGGATTACGGGACTCTCACTTTGAGCCTCAATGTCCACATCTGTAGAATGGCACTATATTTGTTCCTTGGGGCATACTTGGACAACAGATTTTTTTTTTTTTTTTTTGAGATGGAGTTTCACTCTTGTTGCCCAGGCTCGAGTGCAATGGCACAATCTCGGCTCACCACAACCTCTGCCTCCCAGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCTAGTAGCTGGGATTACAGGCATGTGCCACCACGCCCGGCTAATTTTCTATTTTTAGTAGAGATGGGGGTTTCTCCATGTTGGTCAGGCTGGTCTCGAACTCCCGACCTCAGGTGATCTGCCCGCCTCAGCCTCCCAAAGTGCTGGGATTACAGGCATGAGCCACCGCGCCCGGTCTGGACAACAGATTTTTAAAAGCTACTTTGAAAGACTGCTCAATACCGTCCAGGCCCGGTGGCCCATGCCTGTAATCCTAGCACTTTGGGAGGCTGAGGCAGGCGGATCACTTGATGTTAGGAGTTCAAGACCAGCCTGGCCAACATGGTGAAACCCCGTCTCTACTAAAAATACAAAAATTAGCCAGGCGTGGTGGCACGTGCCTGCAGTGCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCACTTGAACCTGGGAGGCAGAGGTTGCAGTGAGCAGAGATCGTGCCACTGCATTCTAATCTGGGTGACAGAGTGAGACTCCATCTCAAAAAAAAAAAAAAAAAGACTGCTCAATACATTGTATTGTTAGTATTTCCATTTCAAAAAGCAGCCTTATTTGCAAAGACTCCTCACTGAGTTTTTAACTCTCCCTCCAGTAGGATAGACAAAATCCTCCTTGAGGCCCTCACTTCAGCTTTTCACAAGCCTCCTAAACCAGGTGCATTTATAATCGTGCTATTTTGACCAAGCTGTTTGTTGTTTTTCAAGAAAGCCACAGAATCCTGGGAACGCTTCTGCTGGCTTCTCATCTCCACCTCCTCCCAATGCTCCACCTTCTCCTTCATGCCTCGACCCACGGGCTCCTCCACCAGCTACTTCCACCAGCCGCAATGAGAAATTTCCAAAGGGCTGCAGAGGCGCCCCAAGCAGAGGCATGCGAGCGAGCTGGCTGGCCTTCAGGGGTTTCCATCCTGAATTCTGGGGTTCTTGGAATCATACCCCCACCCCAAGATCTGGTTCAACTTCCCAAACCCGACCAGGGTGACTTGCCAGACCGAGGCCCTGGGAACCGGTGCTCCAGACGGAACCGCCTGAACGGGGAGGGGCAGGTGGCCGGGAGTGAGTGCTCATTGACTTTAAATTGCAGGTTGCGGCATTGCGCTCTATTCTGATGGAGTGCAGTCCTGGAAGAGGCAGGGTTTATGCACGGTCAGGGCCCTGGCCACAGACACTGGGACATGGGGCCTGATCACCAACTCCAGAGGCCTGAGTCACCTGGGACATGACACCAGCCCACTCCTGCTCAGAGGTCGGCCAGTCTCCCCACCAGGGTTGTCTTGCGGCTGCCGTGTTGCACATTGTGTCTATGTGATGAGTGCTCCCTGGAGCACTACTCTCCAGAAGACACATGTTCATGCAGACTCTAATGGTAGCAGCATCCTCTGGAGTTGTGCAAAGAGGCAGCCCTGCTTCTTCTTCTTTTTTTTTTAATTAAAAAAAAATAGGCCAGGTGTGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCAAGGCGGGTGGATCATGAGGTCAGGAGATCGAGACCATCCTGGCCAAAATGGTGAAACCCCATCTCTACTAAAATATGAAAAAATTATCTGGGCATGGTGGTGTGCACCTGTAGTCCCAGCTACTTGGAAGGCGGAGGTTGCAGTGAGCTGAGATCACTCCAGCTTGGCAACAGAACAAGACTCCGTCTCAAAAAAAAAAAATAGAGATGGGGGTCTCACTATGTTGGCCAGGTTGGTCTTGAACTCTTGGCTTCAGTCAGTCCTCCCACATTGTCCTCCCAAAGTGCTAGGATTACAGGCATGAGCCACCACACCCAGCCCTACTTCTACCAACAAGGGAACACTTCAAAGCATTTTGAGGGGAGTGACTGCTTCATGGGTAAAGGACCTCCATGGGAGTTAGGAAAGGTGTTTTGGAACCAGATAGAGGTAGTGGTTGCACAACATTGTGAGTGTACTAAATGCCACTGAACTAACTGTTCACTTTGAAATGGTTAATTTCTCTCCCTCCCTTCCTTCCTTCCTTCCTTCCTTCCTTCCTTCCTTCCCTCCTTCCTTCCTTCTTTCCTTCCTTCCCTCCTTCCTTCCCTCCTTCCTTCCTGTAATCCCAGCTACTCAGGAGGCTGAGACCTGGGCAACAAGAGTGAAACTCTGTTTCCAAAAAAAAAAAAAAAAGGCCAGGTGCGGTGGCTCACGCCTATAATCCCAACACTTTGGGAGGCCTAGGCGGGTGGATCACCTGAGGTTGGGAGTTCAAGACCAGCCTGACCAACATGGAGAAACCCTGTCTCTACTCAAAATACAAAATAAGCTGGGCATGGTGGCGCATGTCTGTAATCCCAGCTACTGAGGAGGCTGAGGCAGGAGAATCACTTGAACCCAGGAAGCAGAGGTTGCAGTGAGCCGAGATCGTGCCATTGCACTCCAGCCTGGGCAACAAGAGCGAAACAGCGAAACTCCGTCTCAAAAAAAAAAAAAAAAAAAAATTCCCTACAACAGATCAGCCCTCTGCAAGATTTCACGTCTCTCCCCAGTTTCCTGGGCTAGGTCGCTGACTATATTCCAGAGGAAGAACTGGATTGGCTTAGAAGCCCCATTCCCAGACCCCAGCTGAGGAGGAAGGGAAATGGTCAGATCTGTCCAAGGCTCTTGGCAGCACTTGCCATAAAGAGGATGGAAAGGTAGCATCAGGGTCCTCTTGAAGGCACCCCATAGGCCCCACTAGATCCTGGGAATCTAGATGCGGGTGTCTGCAATTCTGGAAAAAGCCATGTGCTTTTTGTTTTTGTCTCACTATGTCACCCAAGCTGTAGTGCAGTGGTACCATCATAGCTCACTGTCCCTGGCCAGGCTCCAGCGATTCTCCTACCTCAGCTTCCTGAGTACCTGGGACTAAAGATGTGTGCTACCATGCCCAGTTAATTTTTATTATTTATTTATTTATTTATTTATTTATTTGAGACAGAGTCTCGCTCTGTCACCCAGGCTCGAGTGCAGTGGCAAGATCACGGCTCACTGCAACCTCCGCCTCCCGGGTTCAAGCAATTCTCCTGCCTCAGCCTCCCAACTAGCTGGGACTACAGGCACGCGACACCACGCCCAGCTAATTTTTGTACTTTTAGTAGAGATGGGGTTTCACCATGTTGGCCAGGATCGTCTGGATCTCTTGACCTCGTGATCCACCTGCCTCAGCCTCCCAAAACGCTGGCGTGAACCACTGCATCTGGCCAATTTTCTGTATTTTAGTAGAGACGGGGTTTCACCATGTTGCCCAGGGTGGTCTCAAACTCCTGAGCTCAGGTGATCTGCCCACCTCAGCCTCCCAAAGTGCTGGGGTTACAGGCATCAGCCACCATGCCTGGCTAATTTTTAAATTTTTTGTAGACACGGGGTCTCACTATGTTGCCTAGGCTGGTCCTAAACTCCTGGCTTCAAGTAATCCTCTCACCTCCAAAGTGTGTGGGTTAAAAGTGTGAGCTGCCACAGCCAGAGAAGCCACGTTCTTGCCTCATCTAGCCATTCATTCATCCATCCATTCATTCATGTATTTATCCAAGGAACATTTGCTGAGCCTTTTCTATGTACTGGGCACAGTGCTGGCTACTTGAAGTTAGGATGTGTAGAACGCCATCCTCAAGTAGCTTACTGTCTAGTGGGAAGACCAAAGTGGAAAGAATTATTAACAACAAAGATATGCACTGGCTGGAAAGATGCCCTGAGGAAGGCACCTAAGGGATGGAGTGTCGGGATGAGGGTGCTAGGGGAGGCTTCCTGGAGGAAGGGATGCCAGAGTTGGGTGGCCAAGGCTGCTGGTGGAAGCATGTCTAGGCAAGCCCACCTTGGCCTGAGGGGAGGAGGAGCGGGTGGGTGGACACCAAATGCAGGGTTTCTAGGTTTTGTGAGAGCTCCAATGAGGTCTGGTTCAGAGGCCAGGAGATGGAGCGTCCTCCTGACCAGAAGGGCCCCATTTGCAGAGCTGTGGAGTGAGGGGGTGTTCGGTGTAGGGAGGGTGGTTACAAAGTCTTTCCAGCTCCAGCCAGATGGAAGGGAATCTACCCTCCACCTCAGGACAGGATGGACCAAGGCCCTGCACTCTGGCTCCTGGGAGAGGCTAGCAGTTAAGAACCCCCACTTTACCCTCCTCCCGACCTTTGAGATTCTCCTGGCATACAGGCCTTTTCTCTATCAGGGGTTTTAGCAGTTGTCACAGGGGAAGACACTGACCACTCCCAACTCCCCCAGGCCTCTGCCAGGCCTCCTTGCAGGAGACTTTACCCTGGAACCCACTCCCTCCTACTTTAGGAAACACTTCCAACAATAGGACTGCCTTCTTTTTTTTTTTTAATCGCTTTTTAGAAACACAATGAGACAATAACACTAATAGATTTCTTTTGAAAAGAAACAAAATTACTCAGTGCGCATTAACCAGCCCTTCCCATTTGAGACAAGTTGTTTTATTAACAGAAGGAGACAGTGAATGAAAAAAAGGTGCTTGGAACACTGTTGGGCAGTCTTGATGGTGTTTGTTGAATGAATAAATGATTCCTAATAACTGACCTTTCCAAACCGGACCCGGATTCTTTTCCTTATGAATATCTACTTAAAAGGAAAAAAAAAAAAAGCCTGTGCTTTCTTTAGGTCAGTGTTCCACATTTTCCTGAATTTTTTTTCTGTCCAAAAAAAAAAAAAAAAAGGCCAGGCGTGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCCCAGGCTGGTGGATCACCTGAGTTCAGGAATTTGAGACCAGCTTGGCCAACATGGTGAAACCGTCTCTCTACTAAAAATACAAAAATTAGGCCGGGCGCGGTGGCTCACGCCTGTAATCCTAGCACTTTGGGAGGCCGAGGCAGGCGGATCACGAGGTCAGGAGATCGAGACCATCCTGGCTAACACGGTGAAACCCTCTCTCTATTAAAAATACAAAAGATTAGCCGGACGTGGTGGTGGGCACCTGCAGTTCCAGCTTCTCGGGAGGCTGAGGTAGGAGAATGGTGTGAACCCGGGAGGCGGAGCTTGCAGTGAGCCAAGATCGCACCACTGCACTCCAGCCTGGGTGAAAGAGTGAGACCCCATCTCAAAAAAAAAAAAAAAAAGAAGAAGAAGAAGAAAAAACATCGTAACTCTTGTTTCCTTAGGGTGTTTAGGTGTCCCGCCCAAATCAGCCTGGAGGAAATGTGAATGTTCCTGATGGATTAATTCAGATCTTCTCTCTGGCCAGCAGGAAGACACACCCATGCAGGTCACCTCTGTAAGAGTGATTTCAAGAGTATGTCATCTACTCCAGCCCTCCAAGAACAACTAGCCGCCTTGATCCAGTGTCTTTTATTATTTTTAATTTTTATATCCCCATTGTTAAGCAATCTGGTGTCTTTAAGGCTCCAACAAGCGACAGAGCTTGAAGAATGGGAAGAGAAGGCCTTGAAAGTCCCAGTGGCTCACAAACTATTCCATTCTGCAGCTGTCTTTAAGATGTCTCCTGGATCCCCTGATTTCTTTTTTTAATCCATAAATTTGTCTCCATAAGTGGGTCTCCCACCTGTCAAATGAGAGTAGGGTGCAGAGCTTGGATTCTGGTTCTTTCAGGTTCTAAGTCTTGGCCCAAGTGTCAGCTTTTTCTTTTTTCTAAGTTGGGGTGGGGATGGGGGTTGCGGAGGGCAGTGGCCTGACATCTCCTGCAAGTGTCATTTGTCACGCGAAAGCAAGCCTGACCCGAGGCAAGGCCCGCCTATCTGGTTAGGTTCCTTGCCCGCCCCCGGGGCCCTGGGCATCTGATGTAAGTTTGGCTCCCTCTTCCATCAGGGTCCTCCTGTCCCAGACTGATAAACCTTTAGAGCAATAAAGGTCGAGTCCGTCTCAACCTCCACCCACCCTCAGCAACCACTGTTAGCCTCTGAGCACTGCTGCCAGGCCAGATTTCCTGTGGCCCCGCCTGAATGATGAAACACGGGATGGCCATTGCACTCCCTGGCTTTTCCAGAGATCTCGGTCCTCGGTCCTGATGCAACCGTCTGGATCTTTTACACAAAGCGCTAGGCGAGCGCTGGGTGCTAGGACCCGGGGGGCGCCCGGGCAGGGAGGTCCGGCTGCGCTGCCTGCAGTCCGCGGGGAGGGCGGATGGGTCTGTGAGTCCGACTGCTGTGAATCCTCGCTTCCATCCCTGCACTGGGCGCTATGAACCCGGGCCCATCCACACTCCTCTAACCACTCTCCTCAAGCCCTCTCCTTGGGAGCAGTTGGAAGTGGAAGCAGATAGGGTTTGGGAGGAGGCAGGGATCCCCATTAACCTATGTCCTGGGCTGTAGAGTAACAGCCAGGATGGGCAGGTGGGGCCTTGGGGAAGGGGCAGCATGGTGCCCGGAGCTTCCCAGTCTGTGGACCCCACCCCCATATCCCGAGCCTTTGCAAAGCAGGGATAGAGGGGGTAAGGGCGCGAGGGCAGGCCGGGCTAACGTCTGCTCCTGCGCCGCCGTCCCACGGGCATCCCCCCCGTGTGTGCCCAGTTGTTCCCGAAGCTTTAGGATCCAAGACGCTGGGGGCAACCATTTTCCTTGCCCGCCGCCCCCTCACGCTTCCCTGCCTCTCCTCCTAGCCTGGTCACGGGCTGTCCCCTCCTCCAGCAATGCAACCCTATAATAAACAAGTCTTTCCTTGATCCTCCCCTGCCGCGAGCGCCCTCGGGGACCTTGGCAGCTGCAGCCGCCGCGGATCCTTTCCAGAAAGGGGGCGTGGCGGTGGGTCGGGGTTCGACTGCGAGCTTTCTGGGGCTCAATGGAGGCGGGGCCCGGCCGCTGTCACCGGGCAGGAGAGAACGTTGCTTACGTGCGCCCGGAGTCCATTGGCCAAGGCGGGCCACACTCCCGGGTCTGGATTGGGTCGTGGCGCAGAGAAGGCGTGGCCTCGCCGCGCTAGTCCTTATAGGCTGCTCCGCGCTGGTGCTAGGGCGCAGCAGGCCAAGGGGGAGGTGCGAGCGTGGACCTGGGACGGGTCTGGGCGGCTCTCGGTGGTTGGCACGGGTTCGCACACCCATTCAAGCGGCAGGACGCACTTGTCTTAGCGTTCTCGCTGACCGCGCTAGCTGGTGAGTGTCCCTTCTGTGTGTGGGTCCTAGAGCTCGCGGTCTGGTCTGGTCTGGTCCCCAGACTGACGCCTGGTCGGTCCCCCTCTTGTCTTACAGCGGCTTCTACGCTCCGGCACTCTGAGTTCATCAGCAAACGCCCTGGCGTCTGTCCTCACCATGCCTAGCCTTTGGGACCGCTTCTCGTCGTCGTCCACCTCCTCTTCGCCCTCGTCCTTGCCCCGAACTCCCACCCCAGATCGGCCGCCGCGCTCAGCCTGGGGGTCGGCGACCCGGGAGGAGGGGTTTGACCGCTCCACGAGCCTGGAGAGCTCGGACTGCGAGTCCCTGGACAGCAGCAACAGTGGCTTCGGGCCGGAGGAAGGTGAGCGGTGGGCGGGTGCCGACGCGACTCGAGGGGCCGGGAAGGTGGGGAAGCCCCGGTGCTGGAAGGGGTCAGAGCCGCCTTGGCTTCCTATCCCATCGGGACCCAGATTGCTTGGGGGCAGGGGGAATTGGAGTATAAGGTGAGTGAGGCGGAAACTGAGGCACGGAGTGGGAAGGAGCGTTGGTTTCTTAAGGAAACAGCACCTCCCCCGCCTGTGCGTTTCGTTTTGAAGCCGCTCTAATACCCCTTCCTGTGTGCTCTCCTTTCCAGACACGGCTTACCTGGATGGGGTGTCGTTGCCCGACTTCGAGCTGCTCAGTGACCCTGAGGATGAACACTTGTGTGCCAACCTGATGCAGCTGCTGCAGGAGAGCCTGGCCCAGGCGCGGCTGGGCTCTCGACGCCCTGCGCGCCTGCTGATGCCTAGCCAGTTGGTAAGCCAGGTGGGCAAAGAACTACTGCGCCTGGCCTACAGCGAGCCGTGCGGCCTGCGGGGGGCGCTGCTGGACGTCTGCGTGGAGCAGGGCAAGAGCTGCCACAGCGTGGGCCAGCTGGCACTCGACCCCAGCCTGGTGCCCACCTTCCAGCTGACCCTCGTGCTGCGCCTGGACTCACGACTCTGGCCCAAGATCCAGGGGCTGTTTAGCTCCGCCAACTCTCCCTTCCTCCCTGGCTTCAGCCAGTCCCTGACGCTGAGCACTGGCTTCCGAGTCATCAAGAAGAAGCTGTACAGCTCGGAACAGCTGCTCATTGAGGAGTGTTGAACTTCAACCTGAGGGGGCCGACAGTGCCCTCCAAGACAGAGACGACTGAACTTTTGGGGTGGAGACTAGAGGCAGGAGCTGAGGGACTGATTCCTGTGGTTGGAAAACTGAGGCAGCCACCTAAGGTGGAGGTGGGGGAATAGTGTTTCCCAGGAAGCTCATTGAGTTGTGTGCGGGTGGCTGTGCATTGGGGACACATACCCCTCAGTACTGTAGCATGAAACAAAGGCTTAGGGGCCAACAAGGCTTCCAGCTGGATGTGTGTGTAGCATGTACCTTATTATTTTTGTTACTGACAGTTAACAGTGGTGTGACATCCAGAGAGCAGCTGGGCTGCTCCCGCCCCAGCCCGGCCCAGGGTGAAGGAAGAGGCACGTGCTCCTCAGAGCAGCCGGAGGGAGGGGGGAGGTCGGAGGTCGTGGAGGTGGTTTGTGTATCTTACTGGTCTGAAGGGACCAAGTGTGTTTGTTGTTTGTTTTGTATCTTGTTTTTCTGATCGGAGCATCACTACTGACCTGTTGTAGGCAGCTATCTTACAGACGCATGAATGTAAGAGTAGGAAGGGGTGGGTGTCAGGGATCACTTGGGATCTTTGACACTTGAAAAATTACACCTGGCAGCTGCGTTTAAGCCTTCCCCCATCGTGTACTGCAGAGTTGAGCTGGCAGGGGAGGGGCTGAGAGGGTGGGGGCTGGAACCCCTCCCCGGGAGGAGTGCCATCTGGGTCTTCCATCTAGAACTGTTTACATGAAGATAAGATACTCACTGTTCATGAATACACTTGATGTTCAAGTATTAAGACCTATGCAATATTTTTTACTTTTCTAATAAACATGTTTGTTAAAACAGTTGGTTGAGTCTCTCATCAGTACCATGAAGTGAAAAGGAGGGAGATGGGTGCTAGTGAAAGGCAGGTCTCATCAGGCCCTGGGGTCCACCTGTGTGTTCCTCCATCCCTTTCCGGGACTGCCTGCCAGCCTGGTGACAGAGGTATGTGTACCGTGTGCCATCTGTGCCAAGAACCCTTGGCCCTGTGCTGGCTGAAGCTACTAGGAGAACACACTGGAAACCCCTGAAGGTAGGGGGTGAGTCAGACCTCCCACCGAGCCAGAGTCTCCAGAGGGAGAGCTCACCTGGCTGCCCCGGTTAGAAGGCCCAGACAGGAGGGCCCACTGAGCCCAAGGTCTTTAATAAACAGTGAAAGAACTAGAAAATACCTTTTTTCTTTCTGGGAGAAAAAAATCAGTTGTTCTACCATCATGAAAATTACAAATCTTATCTCTGGATTTAAAAAGACTAAGAGGGGGAGTTTGAAAAATGCTACTTAGCTCATGCCTCTCACTGGACAAGGAACCAAGAGGGGCATGAGCTGCCACTGGAAGGAAGTCTGGACCAGGCAGGTGCAGAACTCCTTGCACACACACAGGTGAGGGAAGGAGTGCTAAGGGCTTAGAGAGCAAGGAAATAGCAGGCCTACCTTAACGATACCTTGGGTCACCCAGACGTCCTCTGTGACCTGTTGTCCCAGCCACTTGGGATGCTGAAGCCAGAGGATTGCTTGAGTCCAGGAGTTCAAGGCTGCAGCCTGGGTGACAGCAAGACCCTGTCTCTAAAAACAAAAGATGCATTGTGCATTCTGGGCCCTAAGTTCCTTGTCAGAAAAATTGGCAAATTGGAGTTGGGCCAGATGAAGCCCAGGGCCTTTCCCCCTTCTTCCCTGGAATTACATCCACCCACACCAACTGGCATTTGGAGAGTTTTTATCTCCCTTGTTTCTCTTCCTGGTCCCAGACAGGCCTTGTTTGCTCAAGACTAAAACAGTGGCTCTTGCACTTGAGCGTGTGTAATCAGATCACATGGGCCCTCCTGGAGATTCTCAGTGCATCCGGGCCAGGGCCCCAGGAATCTGCATTTACATCAGGGATTCCAATAGAGGGTCCTAAACTTTACGATGACTTGGAAGACCCATCTCTCTTTGGTAGAACTGAGTGATTTGTTCCCCAAAATGGATAAACTTGGATTAGAAGTGCATTTGGAAATGGATAGTGAGAACAGTGAAGAAGGTGCCCAGACCAGTGTGAGGAAAGCCCTCACACCCATTTTCTTAGCACATCCTCCTAATAGCCACCCTGTGAGGGGTGGGTGGCGGCAGGGGTTTTTAATGTTTTACAGATTAGTAAATGGAGGCCCAAGCCCTGGAATGGTCATCTTCTTGGATAAGGGCTGACTTTGTCCACTCCCAGCCTATTGAGATTCAGGGCTGGGAGTAAAGCAAGCTTGACACCTGGGCTGAGTCTGAAGGGCACTTTCCCGGGAACTGAGATCTGTGCCAATGCTCACGACCCTGCCTCCCCAGTCTCAAAAGAGAAGCAAGGAAACAATTGTCTTCAGAGTACAGAGTCTTGTTGGTATTTGGGGGCCTGAGCTGGATGGATTGGTCAGCATTAGCCCTTCTCCAAGCCAAGGAGGCAGCTGAGCCCAGCACCGTACCTTTTCTTAGATAGTCAGACTGAGGCCAAATCAAAGCTTGGGTTCCCAAGCTAGCTCAGCTGAGATGCCCTCTCCCAGAGCCAAACTGGCTTCCCTCATTCTCACAGGGCCTGAAAATCCTCCTGCAGCAGGACAGAAGGGTCCGCAAGTGGGAGCCCTGAGCTTGAGTCTCACAGTAAAGGGAAGAGGGTTGCTGAGGCCCAAGACAGTTCTGGGTCCTGAGGTCTGCTAAGACATGGCAGGGAGCTTTGCCCCAGGTACCGGACTTGCTAAGAAAAAATGGGGCAGGCTTCTTTGTTGCTAAGCAGGAAAGCTAAGAAAGCTTATAAAGACCTACACATAAAATCAACTTTGGTAAATGCTTTCAGAAATTGTCCTATTTAGTGAGACCCTATCTGATAAAGAAAGGAAGGAAAGAAAAAAAAGAAAGGAAAGGAAAGGGGAAAGGAAAAAGGAAAGGAAAGGAAAAAGATTGCCCTATTTGGCCTGGAAAATATGTACTGATTACCTCCCTTCCTACAGGATTCCCTCTCTTATTCCTATTTCCCACCTCATCGGGTCAATGCTCTAGAACCTGCAATGGTTCCCTATTGCCAGATTCCACTGCTGGTCTTTTAGGACATTTGGTGTTGGGCCCTATACTCCCTACTGAGGCTTACCTCCCACCATTCCCCTTAACTGGGGGCAAGTCAATCTGGACTGCCCTTTTCTCTAGCCGCAGACTCCGCTCATTCTAGTGCCTTCCACCAAGGATATCTTCCTGAGTTTTGCTGGCAAGCCCTGTCCTTCCTTTAAGGCCTAGAGCAAGTTCCAGCCTTTTTATGGCTCTTTTCTGCTTTCCCTCCCCCCATCTTTCACAATTGCAGTGTGAAAACATGGCATACAATGATCTCATTGTATGCACTTGTTTTATATCCCCCTAGCTCTATAGAACACCCCTAGGTTCTCCTGAGGCCTGGCACATAGTGGTTAACTAAGCATTGGCTGTCCGAGCCTTGGGTCATGCCCTCTCTCTAAGCTCAGAGAACATAAGATTCCCTCACTAGCCTCAGACTCTCAGGCTACGAGGAGAGGAGGGCAGGGTTAGAAAGAGTTGTTGTTGTTTTTTTGTTTGTTTGTTTTTTGTTTTTTTCATTAGCCTACCACCTAGTTTAGAGGAATATTAAAGGCTAAGGTCCTGGAAGGGAGGTAGTGTCATTAGTGGCTAAAGCCACCTGCATTAGTGAAATCTGGATTCAGATCCCAGCTCAGCCATTTCCTAGCCAATGACCTGGGGCCAGTAACTTTACCTTCCTAAGCTTCAGTTTCCTCATCCGTAA'

In [None]:
text = text[0:7000]

In [None]:
ref_token_id = tokenizer.pad_token_id # A token used for generating token reference
sep_token_id = tokenizer.sep_token_id # A token used as a separator between question and text and it is also added to the end of the text.
cls_token_id = tokenizer.cls_token_id # A token used for prepending to the concatenated question-text word sequence

In [None]:
lig = LayerIntegratedGradients(custom_forward, model.bert.embeddings)

input_ids, ref_input_ids, sep_id = construct_input_ref_pair(text, ref_token_id, sep_token_id, cls_token_id)
token_type_ids, ref_token_type_ids = construct_input_ref_token_type_pair(input_ids, sep_id)
position_ids, ref_position_ids = construct_input_ref_pos_id_pair(input_ids)
attention_mask = construct_attention_mask(input_ids)

indices = input_ids[0].detach().tolist()
all_tokens = tokenizer.convert_ids_to_tokens(indices)

In [None]:
# Check predict output
predict(input_ids)

tensor([[-0.6619,  0.5897]], grad_fn=<AddmmBackward0>)

In [None]:
# Check output of custom_forward
custom_forward(input_ids)

tensor([0.7776], grad_fn=<UnsqueezeBackward0>)

In [None]:
torch.cuda.empty_cache()

In [None]:
attributions, delta = lig.attribute(inputs=input_ids,
                                    baselines=ref_input_ids,
                                    n_steps=700,
                                    internal_batch_size=1,
                                    return_convergence_delta=True)

In [None]:
score = predict(input_ids)

print('Sentence: ', text)
print('Sentiment: ' + str(torch.argmax(score[0]).cpu().numpy()) + \
      ', Probability positive: ' + str(torch.softmax(score, dim = 1)[0][1].cpu().detach().numpy()))

Sentence:  AAAGGTTTGGAGAGGGAGGTCCTAGTGAGGCTGAACAGAGGTAAAATAAACAGAAAGTTCCAGGCTCTCCTTGCTTCTACTTAAGAAAAATCAGAGCAGTAAATCCCAAACCAGTTCTGCCCACAACTCAAATGCAGATGAGCATCCCTTGCTCCATCTATGCAGGAAAGCCATAGTGTGGGGCTGTAGGACTATGGAGTCAGCCTCTGCAAGCAACAAGGCTCAGAGGCTGAGGGGCTTCAGGCCCCAGCAAAACCCAGTGATCCTGTTGTCAAATCTGAATGTCATCATCTGCCTCCAGGGCGACCAGCTCTGGATGGGGGTGTCAGGGTCAGGATCCTGTTCCATGTGGCAAGAGCTTGGGGAAGCTGCTGCAGGCCTACTGATGACCTTCTTTCCTGGCCCAGACACTCTTAAAAACTTCCTGGCGAGGGAGGCAACACACCTTATTGTGCAGCCCTCATCGAACGCATCAGCTGCACTAAGTGCTGAAGAAAAGTTCCCATAATAACCATGTGTGATAATAAAAAGATAAAGAGGCAAATAGGTATGTAGGTCAGCTCAAAAATAGCCACCCACCCGCCTGGCCTGGGTAGCCCTTTGTGCCAAGTGGGTAGAAAGGTTTTCCTTGCTTCCCTTCCCAAGCTGATGCCCCCTGCACTTTTCAAGGTTGCCTTAAATACAACTCCTTCCTGCACTAGCTGGGGTAGCCAGGGCAGTAGGGACTGCAGCCCTACAGGGGCAGCCCTGCGCTCCCTCCACCAAATCAATCCTGGGGTCAGAGGGCACAAAGGCTTGGCCTCTCTGACGTGAGTTCTCGGGGCTAAGTCAGGGTTTAGGGTAGTGAGTCACAGACATTCTTTCCCCCATCCCTTAGGGTTTGCGCACACCCAGGAAGCCTTCCCCTCCCCAACAGAGACCGCTTTGTTAGCACGACCCACCCGGTTGGAGAAGAGTTACAGCCTCAGGGGTGTGAGGGCCTCCTCGGC

In [None]:
attributions_sum = summarize_attributions(attributions)

In [None]:
# storing couple samples in an array for visualization purposes
score_vis = viz.VisualizationDataRecord(attributions_sum,
                                        torch.softmax(score, dim = 1)[0][1],
                                        torch.argmax(torch.softmax(score, dim = 0)[0]),
                                        1,
                                        text,
                                        attributions_sum.sum(),
                                        all_tokens,
                                        delta)

In [None]:
print('\033[1m', 'Visualization For Score', '\033[0m')
viz.visualize_text([score_vis])

[1m Visualization For Score [0m


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
1.0,0 (0.78),AAAGGTTTGGAGAGGGAGGTCCTAGTGAGGCTGAACAGAGGTAAAATAAACAGAAAGTTCCAGGCTCTCCTTGCTTCTACTTAAGAAAAATCAGAGCAGTAAATCCCAAACCAGTTCTGCCCACAACTCAAATGCAGATGAGCATCCCTTGCTCCATCTATGCAGGAAAGCCATAGTGTGGGGCTGTAGGACTATGGAGTCAGCCTCTGCAAGCAACAAGGCTCAGAGGCTGAGGGGCTTCAGGCCCCAGCAAAACCCAGTGATCCTGTTGTCAAATCTGAATGTCATCATCTGCCTCCAGGGCGACCAGCTCTGGATGGGGGTGTCAGGGTCAGGATCCTGTTCCATGTGGCAAGAGCTTGGGGAAGCTGCTGCAGGCCTACTGATGACCTTCTTTCCTGGCCCAGACACTCTTAAAAACTTCCTGGCGAGGGAGGCAACACACCTTATTGTGCAGCCCTCATCGAACGCATCAGCTGCACTAAGTGCTGAAGAAAAGTTCCCATAATAACCATGTGTGATAATAAAAAGATAAAGAGGCAAATAGGTATGTAGGTCAGCTCAAAAATAGCCACCCACCCGCCTGGCCTGGGTAGCCCTTTGTGCCAAGTGGGTAGAAAGGTTTTCCTTGCTTCCCTTCCCAAGCTGATGCCCCCTGCACTTTTCAAGGTTGCCTTAAATACAACTCCTTCCTGCACTAGCTGGGGTAGCCAGGGCAGTAGGGACTGCAGCCCTACAGGGGCAGCCCTGCGCTCCCTCCACCAAATCAATCCTGGGGTCAGAGGGCACAAAGGCTTGGCCTCTCTGACGTGAGTTCTCGGGGCTAAGTCAGGGTTTAGGGTAGTGAGTCACAGACATTCTTTCCCCCATCCCTTAGGGTTTGCGCACACCCAGGAAGCCTTCCCCTCCCCAACAGAGACCGCTTTGTTAGCACGACCCACCCGGTTGGAGAAGAGTTACAGCCTCAGGGGTGTGAGGGCCTCCTCGGCCTCTCCCTCCCTCCCCCTCTCTCCTCTCTAGGGCTCTCACCAGAAAGGCGCCAACCCTGCGCCCTGCCCCCACCCAGCCGCCGGGGCCCCAAATGCTGAGCTCAGCATCTCTGTGGCCTGGCTGCCCTCCTCCCGGGCAGTGGGAGGAGCCTCCTTCCTCCCGAGGGTGGGCGGGGCCAGGGCCAGCCCCGCCCTCCTCCCCGTTCCCCCTCTCCCTCCATCCCCCTCCCGTTCCTCAGTCGCACGTTCTCCAAGTCACGTCCCCCGCTTCCCCTAGTAGGGGGTCGACGGAGATTGGACCCTTCCCCCAGTCAGCTGCTCTGCATCTGTCACCTCGGCGGCAGCGCTCCCTTGAGGTCGCACCTCCGCTGTGGAGGGAGGCGAGAGCGAGCTGAGTGGGGGGTCTTCCCTTCCCCCATCCCGCTGGCCCCAGACAAGCCACCGCAGACCGCGGCGAAATCAGTTAAGCTCTTGCGTGCACCAGTTCCCGGAGCAGAGTCTGAAAGTTTTTGTGTTTCTGTGCGGCTACTTTTAAGTATAAAAAATTCAGCAGTGGCTCCTGGGTGCCTATGTCAGCGTCTGGCCCTTTGTGGATTACGTACGGGACAACTGGGGTGGGGAAGGGCCCCTCTTCACAGGCAGCAATTCCCAGAGTGGCCTTCCTATGGGACCCCAGAGCTCCCAGGGGGAGGATCCCAGAGGGGGATATGGTAACAGAATCACTGTCACTTCTGGGATTGAGGGTGGCAGCTAAAGGGAAACCCCTCGAGTGTCAGTCGGACTTGCCATTTGAGTCAGCACTGCTAGGTGCTGCTGAATTCTGCAGGGGGAGGAAGAACCTGATCAGATAAAACAAGGGCTGACCTAGAGAAAGTCTCTTGGGTCAACATATTCTTAGCGATAACAGAAGATCACTCCAACTGTTCTACACCCCACCCTACAACATTGACCCCCCGCTTTCCAGCATTTACAGTCCCTTTTAGTTTACAACTAAGAGTATGGGTTGCCTGGGATCAGGAAATGAGCCTAGATGTAGAGTCCTGGCTCCAGCCTTGCTGACACTATGTGACTCACTGCACCTATCTGAATCTCAGTTTTCTCACCTGTGCAGTGACATTGATGAGGTCTGTCCTGCCTACAAACTCTACACACATATATTAGTTGTTGTTTTTTAATTTTTAGTAGAGATGGGGTTCTCACAACTTGCCCCAGGCTGGTTTGAACTCCTGGATTCAAGCAATCCTCCCATCTCCACCTCCCAAATGCTGGGATTACAGGTGTGAGCCAGTGTACCAGGCCAGTATTATGCTGGGATTACAGGTGTGAGCCACCATACCAGGCCTTTATTTTTGTTTTGTTGGTTTGTTTCGTTTTTGTTTGAGATAGCGTCTCACTCTATCACCCAGGCTGGAGTGCAGTGGAACGATCTTGGCTCACCGCAACCTCCGCTTCCCGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCAGGTAGCTGGGATTACAGGTGCATGCCACCAAACCTGGGTAAATTTTGTATTTTTAGTAGAGACAGGGTTTCACTATGTTGGCCATGCTGGTCTCAAACTCCTGGCCTCAAGTGATCCACTCGCCTCAGCTTCCCAAATCATGTGCTGGAATTACAGGTGTGAGCCACTGCCCAGCCTAAGTCTTTTTTTTTTTTTTTTTTTTTTTTGAGACAGAGTCTTGCTTTTTGACCCAGGCTGGAGTGCAGTGGCACAATCTCAGCTCACTGTAACCTCAGCCCCCTGGGCTCAAGTGATTTTCCCACCTCAGCCTCCCAAGAAGCTGGGAATACAGATACACTCTACCATGTCCAGCTAACTTTTTGTCTCTTTAGTAGAGATGGGATTTCACCATGTTGGCCAGGCTGGTCTTGACCTCCTTGACTCAAGTGATCTGCCCACCTTGGCCTCCCAAAGTGCTGAGATTACAGGCATGAGCCACCATGCCCAGCCTCCAGTTGTTATTTTTATTAACAAAGTTATGAAAATCCTTTAGAACATGTGGAAAAAGACAAAAAGTTATAAGGCTGGGTGCAGTGCCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGAGGTGAGCAGATCGCCTGAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGTGAAACCCTGTCTTTACTAAAAATACAAATATTAGCCAGGCATGGTGGCGGGCACCTGTAATCCCAGCTACTTAGGAGGCGGAGGCAGGAGAATCGCTTAAATCCAGGAGACAGGTTGCAGTGAGCCACGATCGTGTCCAGCCTGGGCAACACAAGACTCCATCTCAAAATTAAAAAAAAAAAAAGTTATGAAAGCCCTAAAAAATATGGAAGTGTGTTTTTTTGTTTGTTTTGGTTTTTTTGAGACGGAATTTCACACTGTTGCCCAGGCTGGAGTCTAGTGGCGCGATCTAGGCTCACTGCAACCTCTACCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACCGGCGCCCGCCAGCACGCACGGCTAACTTTTTCTATTTTTAGTAGAGATGGGGTTTTACTATTTTGGCCAGGCTGGTCTCAAACTCCTGACCTCATGATCCGCCTGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTGCCAGGCCTGTGCAAGTGTTTTTAGAATCCTGAAGCGCTCCATAAGGGTCAATGATCTTTGTGAGGAGGCTGGTGCGGTGGTTCACGCCTGTAATCCCAGCACTTTGGGAGGCTGAAGGGGGCAGATCACCTGAGGTCAAGAGTTTGAGACCAGCCTGGCCAACGTAGTGAAACCCTGTCTCTGTTGAAAATACAAAAATAAACCGGGCGTGGTAGTGCATTCCTGTAATCTCAGCTACTCGGGAGGCTGAGGCAGGTGAATCCCTTGAAGCCGGGAGGCAGAGGTTGCAGTAAGCTGAGATTGCACCACTTGTACTCCAGCCTGGGTGACAGAGTGAGACTCCACCTCAAAAAAAAAAAAAGATCTTTGTGAAGAGATGGCAAATTGCCAGGTGGGCTGGCAGCTTCCATTTCCTGCCAGCCCAGGTGTTCCAGAGAAAGGCTCAGCATGCAGACCTGGGCAGCTGCCTTTTGCCTAGACTTGAGTTTCCCAAGCCTTTGACTATTAAGGCCACTGGAGATAAAATGCACTTCTGAGTGAGGTTAGAGGCATCGCAGAAGGGTGATGAAGGAGACCAAAGCCAGGGAGAAGAAAGTTCCAGAGGATTGAGTGGGGCCTAACTGCCAGGAGAGAGGGAGATCCTGGAACCTCCTAAGGCTCCCTGCCCTGTCAGTTCCTTGTCCATAAAGTGGGGGAGGTTGGGGGCTGGAAGGAGTACTCTCTTAGGACCTGCTTATCTTAACATTAAAAGATTTTAGCCGGGCATGGTAGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCTGAGGCGGGCAGATCACCTGAGGTTGGGAGTTTGAGACCAGGCTGACCAACATGGAGAAACCCCATCTCTACTAAAAATACAAAAAAGTTAGCCAGGTGTGGTGGCACATGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCGCTTGAACCTGGGAGGCGGAGGTTGCGGTGAGCCAAGATTGCGCCATTGCACTCCAGCCTGGGCGACAAGAGCGAAACTCCATCTCAAAAGAAAAGAAAAAAAGAAAGATTTTAAGGTTCATTCTACTGACAGAAGAATCCTGACAGTGAGAAGGCTGACCCTTCTCTCTGCTGATCTAGCTCTACTCACCCCAGCCCTTTGGGAAACGCAGAGGCTAGACAGGTCCTCCTGGTCTCCTTTCTTCTCTAGAAGGAAAAACAACAACAATAGAGTGAGCTCATTTTGCTGTCCAGACAAATGATGAGCCTGGGTTTGGGCTTTCCCAACTGTGGCAGGTCCTGATCATCTCTGTCATCCCCTGTCATATACTCCCTAGGCTGGTGGAAAAACCCCCATCCCTGCTTCCCCCTTTGTTATATGGATATCAACAATATTTCCATATTGTAAACCAATTGGAAGCCCTCAAAAGGCAAAAGCACTGAAATGGCTGAAATGCCTATTTCTACCTTCTCTGGCAGGCCTCCTGCAGAGAGTCCTATGGGCTAGGACTGGGGTTTGGGGGAAAGCAGCTCCATGGAATGTATTATATCTTTCTCCTTTGCTATGATCCTTGTAGAGGTTGAAGAGGTCTTTGAGATTCTCTAGTTCCGTGTTTTCAAAACTGAGGTATGAAGGCCGGGCTTGGTTACTCACGCTTGTAATCCCAGCACTTTGGGAGGCCGAGGCAGGCAGATTACTTGAGGCTAGGAGATAGAGACCAGCCTGGCCAACATGGCAAAACCCCGTCTCTACTAAAAATAAAAAAATTAGCCAGGCGTGGTGGCGCATGCCTGTAATCCCAGCTACCCGTGAGGCTGCGGCAGGAGAATCTCTTGAACCTGGGAGGCAGAGGTTGCAGTGAGCTGAGATATCGGCACTGCACTCCAGCCAGGAGGACAGAGCGAGACTCTGTCTCAAAAAAGAAAAAAAAAGTTTTTTTCTTTTTTTGGAGGGAGAAATTAAGTAATTTAACTAGTAAGTAATCTAAACATTTGCTACTGAAATTAACACAGATAAAATATATAATAAAATGCAAAATTGTGTTATTTGTAATAAAAATTCTGGGCTTCAAAGACATGGTATGCTTCCTGGGGGCTGCTTCTGGGCCACAGCCCAGACTCCGATCCATCCTTAGTGGCCAAACAGCCTGCAACTAAGGTCTGCTGACTCCTATCCTCTCACTCCACAGGGCCTGAGCTAGCCGAGGTTTAAGAGACTCACTAGAGAGAGGGGGTTGCCTAGCCCTCCCTGCACTTCATTGCTTTCTCTCCTCATAAGGATTCAGAACCTAGGATTGGAGAGGGATCTTAGTAATGGCTGGCAGAAACCTGGCCTCTAAGTGGATGGGATTCCTTACTGACAGTCAGTGGGACAGGTGAGGAGAAAAGAGACAGTGCCGGAGTCAGAAGGACGAGGTTCCAGGCCTGGCTGGGTCCCTAGGACAACTCATTTGACCACGCGGGCTGGAGACGGGTGGGCTGCATGAAGTCTGGTAGGCTGTCTGTGCCTTTGCTACTGCTGGGATACAGAGGTCTGCCAGAATCCTCAGGCTACTCTCTCAGCTCTCAAAACCCTTATCCCTTGGCATGGGTGGTTTATCAACCTAGCCCTTTGTGGGGTTCCCACTGCCCTGCCCTCTCCCCAGAGGAAATGACTTCTTGGGAAACCTAGGACCCCAGGCAGAACCAGGCAGAACTGGTTGTCTGTGAGCTCACCTTTGTCACGTGTGAGCCCTGTCTACACAGCTGCAAGCTCTCACCCACCCCTAACCCAACCAGGCCTATCTTTCTTTCCTAGAGGTCAATAAGCACCCCAACTAAAGATAAGCATCAGAATCGCCTGGAGAATTTTGCTCCTAAGGACCCCACCCAGACCTACCCAATCAGAATGGGGGTTGAGGAGATGAGAATCTCGGTTTTACAAGCTCCTCAGCTGATTCTAATTTTTTTTTTTTTGAGATGGAGTCACACTCTGTTGCCCAGGCTGGAGTGCAATGGCGTGATCTCAGCTCACTGCAATATCTGCTTCCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCTGAATAGCTGGGGCTACAGGGGTGTCCCACCACACCCAGCTAATTTTTGTATTTTTAGTAGAGATCAGGTTTCACCATGTTGGCCAGGCTGGTCTTGAACTCCTGACCTCGTGATCCGACCGCCTTGGCCTCCCAAAGTGCTGGGATTATAGGCATGAGCCACCACACCCAGCCTGATTCTAATTATTAATCAGACTTGAAATGAAAGCCACTGGTTCACGGAGGGATTACGGGACTCTCACTTTGAGCCTCAATGTCCACATCTGTAGAATGGCACTATATTTGTTCC,3.23,[CLS] AAAGG TTTGG AGAGGG AGGTCC TAG TGAGGC TGAAC AGAGG TAAAA TAAACAGAA AGTTCC AGGCTCTCC TTGC TTCTAC TTAAG AAAAATC AGAGC AGTAA ATCCC AAACC AGTTCTG CCC ACAAC TCAAATGC AGATG AGCATCCC TTGC TCCATC TATGC AGGAAAGCC ATAGTG TGGGGC TGTAGG ACTATGG AGTCAGCC TCTGC AAGCAAC AAGGC TCAGAGGC TGAGGGGC TTCAGG CCCC AGCAAAA CCC AGTGATCC TGTTG TCAA ATCTGAA TGTC ATCATC TGCCTCC AGGGCG ACCAGC TCTGG ATGGGGG TGTCAGGG TCAGG ATCC TGTTCC ATGTGGC AAGAGC TTGGGG AAGC TGCTGC AGGCC TACTGATG ACCTTC TTTCC TGGCCC AGACAC TCTTAAAA ACTTCC TGGCG AGGG AGGCAAC ACACC TTATTG TGCAGCCC TCATCG AACGC ATCAGC TGCAC TAAGTGC TGAAG AAAAG TTCCC ATAATAACC ATGTGTG ATAATAA AAAGATAA AGAGGC AAATAGG TATGTAGG TCAGC TCAAAA ATAGCC ACCC ACCCGCC TGGCCTGGG TAGCCC TTTGTGCC AAG TGGGTAG AAAGG TTTTCC TTGC TTCCCTTCCC AAGC TGATGCC CCC TGCAC TTTTCAAGG TTGCC TTAAATAC AACTCC TTCC TGCAC TAGC TGGGG TAGCC AGGGC AGTAGGG ACTGC AGCCCTAC AGGGGC AGCCC TGCGC TCCC TCCACC AAATC AATCC TGGGG TCAGAGGGC ACAAAGGC TTGGCCTCTC TGACG TGAGTTCTC GGGGC TAAG TCAGGG TTTAGGG TAG TGAGTCAC AGACATTC TTTCCCCC ATCCC TTAGGG TTTGCGC ACACCC AGGAAGCC TTCCCCTCCCC AACAGAG ACCGC TTTG TTAGC ACGACCC ACCCGG TTGGAGAAG AGTTAC AGCC TCAGGGG TGTG AGGGCC TCCTCGGCC TCTCCC TCCCTCCCCC TCTCTCC TCTC TAGGGC TCTC ACCAGAA AGGCGCC AACCC TGCGCCC TGCCCCC ACCCAGCC GCC GGGGCCCC AAATGC TGAGC TCAGC ATCTCTG TGGCC TGGCTGCCC TCCTCCC GGGC AGTGGG AGGAGCC TCCTTCC TCCCG AGGGTGGGC GGGGCC AGGGCC AGCCCC GCCC TCC TCCCCG TTCCCCC TCTCCC TCCATCC CCC TCCCG TTCC TCAGTC GCACG TTCTCCAAG TCACG TCCCCCGC TTCCCC TAGTAG GGGG TCG ACGG AGATTGG ACCC TTCCCCC AGTC AGCTGC TCTGC ATCTGTC ACCTC GGCGGC AGCGC TCCC TTGAGG TCGC ACCTCCGC TGTGGAGGG AGGCG AGAGCG AGCTGAG TGGGGGG TCTTCCC TTCCCCC ATCCCGC TGGCCCC AGACAAGCC ACCGC AGACCGC GGCG AAATC AGTTAAGC TCTTGC GTGCACC AGTTCCC GG AGCAGAG TCTG AAAGTTTT TGTGTTTC TGTGC GGC TACTTTT AAG TATAAAA AATTC AGCAGTGGC TCCTGGG TGCCTATG TCAGCG TCTGGCCC TTTG TGGATT ACGTAC GGG ACAAC TGGGG TGGGGAAGG GCCCC TCTTC ACAGGC AGC AATTCCC AGAG TGGCCTTCC TATGGG ACCCC AGAGCTCCC AGGGGG AGGATCCC AGAGGGGG ATATGG TAAC AGAATCAC TGTCAC TTCTGGG ATTG AGGGTGGC AGCTAA AGGG AAACCCC TCGAGTG TCAGTCGG ACTTGCC ATTTGAGTC AGCAC TGCTAGG TGCTGC TGAA TTCTGC AGGGGG AGGAAG AACC TGATC AGATAAAAC AAGGGC TGACC TAGAGAA AGTCTC TTGGG TCAAC ATATTC TTAGCG ATAAC AGAAG ATCAC TCCAAC TGTTCTAC ACCCCACCC TACAAC ATTG ACCCCCC GC TTTCC AGCATTTAC AGTCCC TTTT AGTTTAC AACTAAG AGTATGGG TTGCCTGGG ATCAGG AAATG AGCCTAG ATGTAG AGTCCTGGC TCCAGCC TTGC TGACAC TATGTGAC TCACTGC ACCTATC TGAATCTC AGTTTTC TCACC TGTGC AGTG ACATTG ATGAGG TCTG TCCTGCC TACAAAC TCTAC ACAC ATATATT AGTTG TTGTTTT TTAATTTT TAGTAG AGATGGGG TTCTCAC AACTTG CCCC AGGCTGG TTTG AACTCC TGGATTC AAGCAATCC TCCC ATCTCC ACCTCCC AAATGC TGGGATTACAGGTGTGAGCC AGTGTACC AGGCC AGTATT ATGC TGGGATTAC AGGTGTGAGCCACC ATACC AGGCC TTTATT TTTGTTTTG TTGGTTTG TTTCG TTTTTGTTTG AGATAGC GTCTC ACTCTATC ACCC AGGCTGGAGTGCAGTGG AACG ATCTTGGC TCACCGCAACC TCCGC TTCCCGGG TTCAAGTGATTCTCCTGCCTCAGCC TCCCAGG TAGCTGGGATTAC AGGTGCATGCC ACCAAACC TGGGTAA ATTTTGTATT TTTAGTAGAGACAGGGTTTC ACTATGTTGGCC ATGC TGGTCTCAAACTCC TGGCCTCAAGTGATCC ACTCGCC TCAGCTTCCC AAATC ATGTGC TGGAATTAC AGGTGTGAGCC ACTGCCC AGCCTAAG TC TTTTTTTTTTTTTTTTTTTTTTTTG AGACAGAGTCTTGC TTTT TGACCC AGGCTGGAGTGCAGTGGC ACAATCTC AGCTCAC TGTAACC TCAGCCCCC TGGGCTCAAG TGATT TTCCC ACCTCAGCCTCCC AAGAAGC TGGGAATAC AGATACAC TCTACC ATGTCC AGCTAAC TTTT TGTCTC TTTAGTAG AGATGGGATTTC ACCATGTTGGCCAGGCTGG TCTTG ACCTCC TTG ACTCAAG TGATCTGCCC ACC TTGGCCTCCCAAAGTGC TGAGATTACAGGCATGAGCC ACCATGCCC AGCCTCC AGTTG TTATTTTTATT AACAAAG TTATG AAAATCC TTTAGAAC ATGTGG AAAA AGACAAAA AGTT ATAAGGC TGGGTGC AGTGCC TCACACC TGTAATCCCAGCACTTTGGGAGGCCG AGGTGAGC AGATC GCC TGAGGTCAGGAGTTCAAGACCAGCC TGGCCAACATGGTGAAACCC TGTCTTTAC TAAAAATAC AAATATT AGCCAGGCATGGTGGC GGGCACC TGTAATCCCAGCTAC TTAGG AGGCGG AGGCAGGAGAA TCGC TTAAATCC AGGAGAC AGG TTGCAGTGAGCC ACG ATCGTG TCCAGCCTGGGCAAC ACAAG ACTCCATCTC AAAA TTAAAAAAAAAAAA AGTTATG AAAGCCC TAAAAAA TATGGAAG TGTGTTTT TTTGTTTG TTTTGG TTTTTTTG AGACGG AATTTC ACAC TGTTGCCC AGGCTGG AGTCTAG TGGC GCG ATCTAGGC TCACTGCAACCTCTACC TCCCGGGTTCAAGCG ATTCTCCTGCCTCAGCCTCCCGAGTAGC TGGG ATTACC GGC GCCCGCC AGCACGC ACGGC TAAC TTTTTCTATT TTTAGTAGAGATGGGG TTTT ACTATT TTGGCCAGGCTGG TCTCAAACTCCTGACCTC ATGATCC GCCTGCC TTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCC ACCGTGCC AGGCC TGTGC AAGTGTTTT TAGAATCC TGAAGC GCTCC ATAAGGG TCAATG ATCTTTGTG AGG AGGCTGG TGCGG TGG TTCACGCC TGTAATCCCAGCACTTTGGG AGGC TGAAGG GGGC AGATCACCTGAGG TCAAG AGTTTGAGACCAGCC TGGCC AACGTAG TGAAACCCTGTCTC TGTTGAAAA TACAAAA ATAAACC GGGCGTGG TAGTGC ATTCC TGTAATCTCAGCTAC TCGGGAGGCTGAGGC AGGTGAA TCCCTTG AAGCC GGGAGGCAGAGG TTGC AGTAAGC TGAGATTGC ACCAC TTGTAC TCCAGCC TGGGTGACAGAGTGAGAC TCCACCTC AAAAAAAAAAAA AGATC TTTGTG AAG AGATGGC AAATTGCC AGGTGGGC TGGC AGCTTCC ATTTCC TGCCAGCCC AGGTGTTCC AGAGAA AGGCTCAGC ATGC AGACC TGGGC AGCTGCC TTTTGCC TAGACTTG AGTTTCCC AAGCC TTTG ACTATT AAGGCC ACTGG AGATAAAA TGCAC TTCTG AGTGAGG TTAGAGGC ATCGC AGAAGGG TGATGAAGG AGACC AAAGCC AGGGAGAAG AAAGTTCC AGAGG ATTG AGTGGGGCC TAACTGCC AGGAGAG AGGG AGATCC TGG AACCTCC TAAGGC TCCCTGCCC TGTC AGTTCC TTGTCC ATAA AGTGGGGG AGGTTGG GGGC TGGAAGG AGTAC TCTC TTAGG ACCTGC TTATC TTAAC ATTAAAAG ATTTT AGCCGGGC ATGGTAGC TCATGCCTGTAATCCCAGCACTTTGGG AGGCTGAGGCGGGC AGATCACCTGAGG TTGGG AGTTTGAGACC AGGC TGACCAACATGGAGAAACCCC ATCTC TACTAAAAATAC AAAAAAG TTAGCC AGGTGTGGTGGC ACATGCC TGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAA TCGCTTGAACCTGGG AGGCGGAGGTTGC GG TGAGCC AAGATTGC GCC ATTGCACTCCAGCC TGGGCGACAAG AGCG AAACTCCATCTC AAAAGAAAAGAAAA AAAGAA AGATT TTAAGG TTCATTC TACTGAC AGAAG AATCC TGACAGTG AGAAGGC TGACCC TTCTCTC TGCTGATC TAGC TCTAC TCACCCC AGCCC TTTGGG AAACGC AGAGGC TAGACAGG TCCTCC TGGTCTCC TTTC TTCTCTAG AAGGAAAA ACAACAAC AATAG AGTGAGC TCATTTTGC TGTCC AGACAAATG ATGAGCC TGGG TTTGGGC TTTCCC AAC TGTGGC AGGTCC TGATC ATCTCTG TCATCCCC TGTC ATAT ACTCCC TAGGC TGGTGG AAAA ACCCCC ATCCCTGC TTCCCCC TTTG TTATATGG ATATCAAC AATATTTCC ATATTG TAAACC AATTGG AAGCCC TCAAAAGGC AAAAGC ACTGAA ATGGC TGAAATGCC TATT TCTACC TTCTCTGGC AGGCC TCCTGC AGAGAGTCC TATGGGC TAGG ACTGGGG TTTGGGGG AAAGC AGCTCC ATGG AATGTATT ATATC TTTCTCC TTTGC TATGATCC TTGTAG AGGTTGAAG AGGTCTTTG AGATTC TCTAG TTCCGTG TTTTCAAAAC TGAGG TATG AAGGCC GGGC TTGGTTAC TCACGC TTGTAATCCCAGCACTTTGGG AGGCCGAGGCAGGC AGATTAC TTGAGGC TAGG AGATAGAG ACCAGCC TGGCCAACATGGCAAAACCCC GTCTCTACTAAAA ATAAAAAAATT AGCCAGGCGTGGTGGC GCATGCC TGTAATCCC AGCTACCC GTG AGGCTGC GGC AGGAGAA TCTC TTGAACCTGGGAGGCAGAGG TTGCAGTGAGCTGAG ATATC GGC ACTGCACTCCAGCC AGGAGG ACAGAGCGAGAC TCTGTCTC AAAAAAGAAAAAAAA AGTTTT TTTCTTTT TTTGGAGGG AGAAATT AAGTAA TTTAAC TAG TAAGTAA TCTAA ACATT TGCTAC TGAA ATTAAC ACAGATAAAA TATATAA TAAAA TGCAAAA TTG TGTTATT TGTAA TAAAAATTC TGGGC TTCAAAG ACATGG TATGCTTCC TGGGGGC TGCTTC TGGGCC ACAGCCC AGACTCCG ATCCATCC TTAG TGGCC AAACAGCC TGCAAC TAAGG TCTGC TGACTCC TATCC TCTCACTCC ACAGGGCC TGAGC TAGCC GAGG TTTAAG AGAC TCACTAG AGAG AGGGGG TTGCC TAGCCC TCCCTGC ACTTC ATTGC TTTCTCTCC TCATAAGG ATTC AGAACC TAGG ATTGG AGAGGG ATC TTAGTAA TGGCTGGC AGAAACC TGGCC TCTAAG TGGATGGG ATTCC TTACTGAC AGTC AGTGGG ACAGG TGAGGAG AAAAGAGAC AGTGCC GGAGTC AGAAGG ACG AGGTTCC AGGCC TGGCTGGG TCCCTAGG ACAAC TCATTTG ACCACGC GGGC TGGAGAC GGG TGGGCTGC ATGAAG TCTGG TAGGC TGTC TGTGCC TTTGC TACTGC TGGGATAC AGAGG TCTGCC AGAA TCCTC AGGCTAC TCTCTCAGC TCTC AAAACCC TTATCCC TTGGC ATGGGTGG TTTATC AACC TAGCCC TTTGTGGGG TTCCC ACTGCCC TGCCC TCTCCCC AGAGG AAATG ACTTC TTGGG AAACC TAGG ACCCCAGGC AGAACC AGGC AGAACTGG TTGTC TGTGAGC TCACC TTTG TCACG TGTG AGCCC TGTCTAC ACAGC TGCAAGC TCTCACCC ACCCC TAACCC AACC AGGCC TATC TTTCTTTCC TAG AGGTC AATAAGC ACCCC AACTAA AGATAAGC ATCAGAA TCGCC TGGAGAA TTTTGC TCCTAAGG ACCCCACCC AGACC TACCC AATCAGAA TGGGGG TTG AGGAG ATGAGAA TCTCGG TTTT ACAAGC TCCTCAGC TGATTC TAA TTTTTTTTTTTT TGAGATGG AGTCACAC TCTG TTGCCCAGGCTGGAGTGCAATGGC GTG ATCTCAGCTCACTGC AATATC TGCTTCC TGGG TTCAAGCGATTCTCCTGCCTCAGCC TCCTGAA TAGC TGGGGC TACAGGGG TGTCCC ACCACACCCAGC TAATTTTTGTATTTTTAGTAG AGATC AGG TTTCACCATGTTGGCCAGGCTGGTCTTGAACTCC TGACCTCGTGATCC G ACCGCC TTGGCCTCCCAAAGTGC TGGGATTATAGGCATGAGCC ACCACACCCAGCC TGATTC TAATTATT AATC AGACTTG AAATG AAAGCC ACTGG TTCACGG AGGG ATTAC GGG ACTCTC ACTTTG AGCC TCAATG TCCACATC TGTAG AATGGC ACTAT ATTTGTTCC [SEP]
,,,,


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
1.0,0 (0.78),AAAGGTTTGGAGAGGGAGGTCCTAGTGAGGCTGAACAGAGGTAAAATAAACAGAAAGTTCCAGGCTCTCCTTGCTTCTACTTAAGAAAAATCAGAGCAGTAAATCCCAAACCAGTTCTGCCCACAACTCAAATGCAGATGAGCATCCCTTGCTCCATCTATGCAGGAAAGCCATAGTGTGGGGCTGTAGGACTATGGAGTCAGCCTCTGCAAGCAACAAGGCTCAGAGGCTGAGGGGCTTCAGGCCCCAGCAAAACCCAGTGATCCTGTTGTCAAATCTGAATGTCATCATCTGCCTCCAGGGCGACCAGCTCTGGATGGGGGTGTCAGGGTCAGGATCCTGTTCCATGTGGCAAGAGCTTGGGGAAGCTGCTGCAGGCCTACTGATGACCTTCTTTCCTGGCCCAGACACTCTTAAAAACTTCCTGGCGAGGGAGGCAACACACCTTATTGTGCAGCCCTCATCGAACGCATCAGCTGCACTAAGTGCTGAAGAAAAGTTCCCATAATAACCATGTGTGATAATAAAAAGATAAAGAGGCAAATAGGTATGTAGGTCAGCTCAAAAATAGCCACCCACCCGCCTGGCCTGGGTAGCCCTTTGTGCCAAGTGGGTAGAAAGGTTTTCCTTGCTTCCCTTCCCAAGCTGATGCCCCCTGCACTTTTCAAGGTTGCCTTAAATACAACTCCTTCCTGCACTAGCTGGGGTAGCCAGGGCAGTAGGGACTGCAGCCCTACAGGGGCAGCCCTGCGCTCCCTCCACCAAATCAATCCTGGGGTCAGAGGGCACAAAGGCTTGGCCTCTCTGACGTGAGTTCTCGGGGCTAAGTCAGGGTTTAGGGTAGTGAGTCACAGACATTCTTTCCCCCATCCCTTAGGGTTTGCGCACACCCAGGAAGCCTTCCCCTCCCCAACAGAGACCGCTTTGTTAGCACGACCCACCCGGTTGGAGAAGAGTTACAGCCTCAGGGGTGTGAGGGCCTCCTCGGCCTCTCCCTCCCTCCCCCTCTCTCCTCTCTAGGGCTCTCACCAGAAAGGCGCCAACCCTGCGCCCTGCCCCCACCCAGCCGCCGGGGCCCCAAATGCTGAGCTCAGCATCTCTGTGGCCTGGCTGCCCTCCTCCCGGGCAGTGGGAGGAGCCTCCTTCCTCCCGAGGGTGGGCGGGGCCAGGGCCAGCCCCGCCCTCCTCCCCGTTCCCCCTCTCCCTCCATCCCCCTCCCGTTCCTCAGTCGCACGTTCTCCAAGTCACGTCCCCCGCTTCCCCTAGTAGGGGGTCGACGGAGATTGGACCCTTCCCCCAGTCAGCTGCTCTGCATCTGTCACCTCGGCGGCAGCGCTCCCTTGAGGTCGCACCTCCGCTGTGGAGGGAGGCGAGAGCGAGCTGAGTGGGGGGTCTTCCCTTCCCCCATCCCGCTGGCCCCAGACAAGCCACCGCAGACCGCGGCGAAATCAGTTAAGCTCTTGCGTGCACCAGTTCCCGGAGCAGAGTCTGAAAGTTTTTGTGTTTCTGTGCGGCTACTTTTAAGTATAAAAAATTCAGCAGTGGCTCCTGGGTGCCTATGTCAGCGTCTGGCCCTTTGTGGATTACGTACGGGACAACTGGGGTGGGGAAGGGCCCCTCTTCACAGGCAGCAATTCCCAGAGTGGCCTTCCTATGGGACCCCAGAGCTCCCAGGGGGAGGATCCCAGAGGGGGATATGGTAACAGAATCACTGTCACTTCTGGGATTGAGGGTGGCAGCTAAAGGGAAACCCCTCGAGTGTCAGTCGGACTTGCCATTTGAGTCAGCACTGCTAGGTGCTGCTGAATTCTGCAGGGGGAGGAAGAACCTGATCAGATAAAACAAGGGCTGACCTAGAGAAAGTCTCTTGGGTCAACATATTCTTAGCGATAACAGAAGATCACTCCAACTGTTCTACACCCCACCCTACAACATTGACCCCCCGCTTTCCAGCATTTACAGTCCCTTTTAGTTTACAACTAAGAGTATGGGTTGCCTGGGATCAGGAAATGAGCCTAGATGTAGAGTCCTGGCTCCAGCCTTGCTGACACTATGTGACTCACTGCACCTATCTGAATCTCAGTTTTCTCACCTGTGCAGTGACATTGATGAGGTCTGTCCTGCCTACAAACTCTACACACATATATTAGTTGTTGTTTTTTAATTTTTAGTAGAGATGGGGTTCTCACAACTTGCCCCAGGCTGGTTTGAACTCCTGGATTCAAGCAATCCTCCCATCTCCACCTCCCAAATGCTGGGATTACAGGTGTGAGCCAGTGTACCAGGCCAGTATTATGCTGGGATTACAGGTGTGAGCCACCATACCAGGCCTTTATTTTTGTTTTGTTGGTTTGTTTCGTTTTTGTTTGAGATAGCGTCTCACTCTATCACCCAGGCTGGAGTGCAGTGGAACGATCTTGGCTCACCGCAACCTCCGCTTCCCGGGTTCAAGTGATTCTCCTGCCTCAGCCTCCCAGGTAGCTGGGATTACAGGTGCATGCCACCAAACCTGGGTAAATTTTGTATTTTTAGTAGAGACAGGGTTTCACTATGTTGGCCATGCTGGTCTCAAACTCCTGGCCTCAAGTGATCCACTCGCCTCAGCTTCCCAAATCATGTGCTGGAATTACAGGTGTGAGCCACTGCCCAGCCTAAGTCTTTTTTTTTTTTTTTTTTTTTTTTGAGACAGAGTCTTGCTTTTTGACCCAGGCTGGAGTGCAGTGGCACAATCTCAGCTCACTGTAACCTCAGCCCCCTGGGCTCAAGTGATTTTCCCACCTCAGCCTCCCAAGAAGCTGGGAATACAGATACACTCTACCATGTCCAGCTAACTTTTTGTCTCTTTAGTAGAGATGGGATTTCACCATGTTGGCCAGGCTGGTCTTGACCTCCTTGACTCAAGTGATCTGCCCACCTTGGCCTCCCAAAGTGCTGAGATTACAGGCATGAGCCACCATGCCCAGCCTCCAGTTGTTATTTTTATTAACAAAGTTATGAAAATCCTTTAGAACATGTGGAAAAAGACAAAAAGTTATAAGGCTGGGTGCAGTGCCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGAGGTGAGCAGATCGCCTGAGGTCAGGAGTTCAAGACCAGCCTGGCCAACATGGTGAAACCCTGTCTTTACTAAAAATACAAATATTAGCCAGGCATGGTGGCGGGCACCTGTAATCCCAGCTACTTAGGAGGCGGAGGCAGGAGAATCGCTTAAATCCAGGAGACAGGTTGCAGTGAGCCACGATCGTGTCCAGCCTGGGCAACACAAGACTCCATCTCAAAATTAAAAAAAAAAAAAGTTATGAAAGCCCTAAAAAATATGGAAGTGTGTTTTTTTGTTTGTTTTGGTTTTTTTGAGACGGAATTTCACACTGTTGCCCAGGCTGGAGTCTAGTGGCGCGATCTAGGCTCACTGCAACCTCTACCTCCCGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCCGAGTAGCTGGGATTACCGGCGCCCGCCAGCACGCACGGCTAACTTTTTCTATTTTTAGTAGAGATGGGGTTTTACTATTTTGGCCAGGCTGGTCTCAAACTCCTGACCTCATGATCCGCCTGCCTTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCCACCGTGCCAGGCCTGTGCAAGTGTTTTTAGAATCCTGAAGCGCTCCATAAGGGTCAATGATCTTTGTGAGGAGGCTGGTGCGGTGGTTCACGCCTGTAATCCCAGCACTTTGGGAGGCTGAAGGGGGCAGATCACCTGAGGTCAAGAGTTTGAGACCAGCCTGGCCAACGTAGTGAAACCCTGTCTCTGTTGAAAATACAAAAATAAACCGGGCGTGGTAGTGCATTCCTGTAATCTCAGCTACTCGGGAGGCTGAGGCAGGTGAATCCCTTGAAGCCGGGAGGCAGAGGTTGCAGTAAGCTGAGATTGCACCACTTGTACTCCAGCCTGGGTGACAGAGTGAGACTCCACCTCAAAAAAAAAAAAAGATCTTTGTGAAGAGATGGCAAATTGCCAGGTGGGCTGGCAGCTTCCATTTCCTGCCAGCCCAGGTGTTCCAGAGAAAGGCTCAGCATGCAGACCTGGGCAGCTGCCTTTTGCCTAGACTTGAGTTTCCCAAGCCTTTGACTATTAAGGCCACTGGAGATAAAATGCACTTCTGAGTGAGGTTAGAGGCATCGCAGAAGGGTGATGAAGGAGACCAAAGCCAGGGAGAAGAAAGTTCCAGAGGATTGAGTGGGGCCTAACTGCCAGGAGAGAGGGAGATCCTGGAACCTCCTAAGGCTCCCTGCCCTGTCAGTTCCTTGTCCATAAAGTGGGGGAGGTTGGGGGCTGGAAGGAGTACTCTCTTAGGACCTGCTTATCTTAACATTAAAAGATTTTAGCCGGGCATGGTAGCTCATGCCTGTAATCCCAGCACTTTGGGAGGCTGAGGCGGGCAGATCACCTGAGGTTGGGAGTTTGAGACCAGGCTGACCAACATGGAGAAACCCCATCTCTACTAAAAATACAAAAAAGTTAGCCAGGTGTGGTGGCACATGCCTGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAATCGCTTGAACCTGGGAGGCGGAGGTTGCGGTGAGCCAAGATTGCGCCATTGCACTCCAGCCTGGGCGACAAGAGCGAAACTCCATCTCAAAAGAAAAGAAAAAAAGAAAGATTTTAAGGTTCATTCTACTGACAGAAGAATCCTGACAGTGAGAAGGCTGACCCTTCTCTCTGCTGATCTAGCTCTACTCACCCCAGCCCTTTGGGAAACGCAGAGGCTAGACAGGTCCTCCTGGTCTCCTTTCTTCTCTAGAAGGAAAAACAACAACAATAGAGTGAGCTCATTTTGCTGTCCAGACAAATGATGAGCCTGGGTTTGGGCTTTCCCAACTGTGGCAGGTCCTGATCATCTCTGTCATCCCCTGTCATATACTCCCTAGGCTGGTGGAAAAACCCCCATCCCTGCTTCCCCCTTTGTTATATGGATATCAACAATATTTCCATATTGTAAACCAATTGGAAGCCCTCAAAAGGCAAAAGCACTGAAATGGCTGAAATGCCTATTTCTACCTTCTCTGGCAGGCCTCCTGCAGAGAGTCCTATGGGCTAGGACTGGGGTTTGGGGGAAAGCAGCTCCATGGAATGTATTATATCTTTCTCCTTTGCTATGATCCTTGTAGAGGTTGAAGAGGTCTTTGAGATTCTCTAGTTCCGTGTTTTCAAAACTGAGGTATGAAGGCCGGGCTTGGTTACTCACGCTTGTAATCCCAGCACTTTGGGAGGCCGAGGCAGGCAGATTACTTGAGGCTAGGAGATAGAGACCAGCCTGGCCAACATGGCAAAACCCCGTCTCTACTAAAAATAAAAAAATTAGCCAGGCGTGGTGGCGCATGCCTGTAATCCCAGCTACCCGTGAGGCTGCGGCAGGAGAATCTCTTGAACCTGGGAGGCAGAGGTTGCAGTGAGCTGAGATATCGGCACTGCACTCCAGCCAGGAGGACAGAGCGAGACTCTGTCTCAAAAAAGAAAAAAAAAGTTTTTTTCTTTTTTTGGAGGGAGAAATTAAGTAATTTAACTAGTAAGTAATCTAAACATTTGCTACTGAAATTAACACAGATAAAATATATAATAAAATGCAAAATTGTGTTATTTGTAATAAAAATTCTGGGCTTCAAAGACATGGTATGCTTCCTGGGGGCTGCTTCTGGGCCACAGCCCAGACTCCGATCCATCCTTAGTGGCCAAACAGCCTGCAACTAAGGTCTGCTGACTCCTATCCTCTCACTCCACAGGGCCTGAGCTAGCCGAGGTTTAAGAGACTCACTAGAGAGAGGGGGTTGCCTAGCCCTCCCTGCACTTCATTGCTTTCTCTCCTCATAAGGATTCAGAACCTAGGATTGGAGAGGGATCTTAGTAATGGCTGGCAGAAACCTGGCCTCTAAGTGGATGGGATTCCTTACTGACAGTCAGTGGGACAGGTGAGGAGAAAAGAGACAGTGCCGGAGTCAGAAGGACGAGGTTCCAGGCCTGGCTGGGTCCCTAGGACAACTCATTTGACCACGCGGGCTGGAGACGGGTGGGCTGCATGAAGTCTGGTAGGCTGTCTGTGCCTTTGCTACTGCTGGGATACAGAGGTCTGCCAGAATCCTCAGGCTACTCTCTCAGCTCTCAAAACCCTTATCCCTTGGCATGGGTGGTTTATCAACCTAGCCCTTTGTGGGGTTCCCACTGCCCTGCCCTCTCCCCAGAGGAAATGACTTCTTGGGAAACCTAGGACCCCAGGCAGAACCAGGCAGAACTGGTTGTCTGTGAGCTCACCTTTGTCACGTGTGAGCCCTGTCTACACAGCTGCAAGCTCTCACCCACCCCTAACCCAACCAGGCCTATCTTTCTTTCCTAGAGGTCAATAAGCACCCCAACTAAAGATAAGCATCAGAATCGCCTGGAGAATTTTGCTCCTAAGGACCCCACCCAGACCTACCCAATCAGAATGGGGGTTGAGGAGATGAGAATCTCGGTTTTACAAGCTCCTCAGCTGATTCTAATTTTTTTTTTTTTGAGATGGAGTCACACTCTGTTGCCCAGGCTGGAGTGCAATGGCGTGATCTCAGCTCACTGCAATATCTGCTTCCTGGGTTCAAGCGATTCTCCTGCCTCAGCCTCCTGAATAGCTGGGGCTACAGGGGTGTCCCACCACACCCAGCTAATTTTTGTATTTTTAGTAGAGATCAGGTTTCACCATGTTGGCCAGGCTGGTCTTGAACTCCTGACCTCGTGATCCGACCGCCTTGGCCTCCCAAAGTGCTGGGATTATAGGCATGAGCCACCACACCCAGCCTGATTCTAATTATTAATCAGACTTGAAATGAAAGCCACTGGTTCACGGAGGGATTACGGGACTCTCACTTTGAGCCTCAATGTCCACATCTGTAGAATGGCACTATATTTGTTCC,3.23,[CLS] AAAGG TTTGG AGAGGG AGGTCC TAG TGAGGC TGAAC AGAGG TAAAA TAAACAGAA AGTTCC AGGCTCTCC TTGC TTCTAC TTAAG AAAAATC AGAGC AGTAA ATCCC AAACC AGTTCTG CCC ACAAC TCAAATGC AGATG AGCATCCC TTGC TCCATC TATGC AGGAAAGCC ATAGTG TGGGGC TGTAGG ACTATGG AGTCAGCC TCTGC AAGCAAC AAGGC TCAGAGGC TGAGGGGC TTCAGG CCCC AGCAAAA CCC AGTGATCC TGTTG TCAA ATCTGAA TGTC ATCATC TGCCTCC AGGGCG ACCAGC TCTGG ATGGGGG TGTCAGGG TCAGG ATCC TGTTCC ATGTGGC AAGAGC TTGGGG AAGC TGCTGC AGGCC TACTGATG ACCTTC TTTCC TGGCCC AGACAC TCTTAAAA ACTTCC TGGCG AGGG AGGCAAC ACACC TTATTG TGCAGCCC TCATCG AACGC ATCAGC TGCAC TAAGTGC TGAAG AAAAG TTCCC ATAATAACC ATGTGTG ATAATAA AAAGATAA AGAGGC AAATAGG TATGTAGG TCAGC TCAAAA ATAGCC ACCC ACCCGCC TGGCCTGGG TAGCCC TTTGTGCC AAG TGGGTAG AAAGG TTTTCC TTGC TTCCCTTCCC AAGC TGATGCC CCC TGCAC TTTTCAAGG TTGCC TTAAATAC AACTCC TTCC TGCAC TAGC TGGGG TAGCC AGGGC AGTAGGG ACTGC AGCCCTAC AGGGGC AGCCC TGCGC TCCC TCCACC AAATC AATCC TGGGG TCAGAGGGC ACAAAGGC TTGGCCTCTC TGACG TGAGTTCTC GGGGC TAAG TCAGGG TTTAGGG TAG TGAGTCAC AGACATTC TTTCCCCC ATCCC TTAGGG TTTGCGC ACACCC AGGAAGCC TTCCCCTCCCC AACAGAG ACCGC TTTG TTAGC ACGACCC ACCCGG TTGGAGAAG AGTTAC AGCC TCAGGGG TGTG AGGGCC TCCTCGGCC TCTCCC TCCCTCCCCC TCTCTCC TCTC TAGGGC TCTC ACCAGAA AGGCGCC AACCC TGCGCCC TGCCCCC ACCCAGCC GCC GGGGCCCC AAATGC TGAGC TCAGC ATCTCTG TGGCC TGGCTGCCC TCCTCCC GGGC AGTGGG AGGAGCC TCCTTCC TCCCG AGGGTGGGC GGGGCC AGGGCC AGCCCC GCCC TCC TCCCCG TTCCCCC TCTCCC TCCATCC CCC TCCCG TTCC TCAGTC GCACG TTCTCCAAG TCACG TCCCCCGC TTCCCC TAGTAG GGGG TCG ACGG AGATTGG ACCC TTCCCCC AGTC AGCTGC TCTGC ATCTGTC ACCTC GGCGGC AGCGC TCCC TTGAGG TCGC ACCTCCGC TGTGGAGGG AGGCG AGAGCG AGCTGAG TGGGGGG TCTTCCC TTCCCCC ATCCCGC TGGCCCC AGACAAGCC ACCGC AGACCGC GGCG AAATC AGTTAAGC TCTTGC GTGCACC AGTTCCC GG AGCAGAG TCTG AAAGTTTT TGTGTTTC TGTGC GGC TACTTTT AAG TATAAAA AATTC AGCAGTGGC TCCTGGG TGCCTATG TCAGCG TCTGGCCC TTTG TGGATT ACGTAC GGG ACAAC TGGGG TGGGGAAGG GCCCC TCTTC ACAGGC AGC AATTCCC AGAG TGGCCTTCC TATGGG ACCCC AGAGCTCCC AGGGGG AGGATCCC AGAGGGGG ATATGG TAAC AGAATCAC TGTCAC TTCTGGG ATTG AGGGTGGC AGCTAA AGGG AAACCCC TCGAGTG TCAGTCGG ACTTGCC ATTTGAGTC AGCAC TGCTAGG TGCTGC TGAA TTCTGC AGGGGG AGGAAG AACC TGATC AGATAAAAC AAGGGC TGACC TAGAGAA AGTCTC TTGGG TCAAC ATATTC TTAGCG ATAAC AGAAG ATCAC TCCAAC TGTTCTAC ACCCCACCC TACAAC ATTG ACCCCCC GC TTTCC AGCATTTAC AGTCCC TTTT AGTTTAC AACTAAG AGTATGGG TTGCCTGGG ATCAGG AAATG AGCCTAG ATGTAG AGTCCTGGC TCCAGCC TTGC TGACAC TATGTGAC TCACTGC ACCTATC TGAATCTC AGTTTTC TCACC TGTGC AGTG ACATTG ATGAGG TCTG TCCTGCC TACAAAC TCTAC ACAC ATATATT AGTTG TTGTTTT TTAATTTT TAGTAG AGATGGGG TTCTCAC AACTTG CCCC AGGCTGG TTTG AACTCC TGGATTC AAGCAATCC TCCC ATCTCC ACCTCCC AAATGC TGGGATTACAGGTGTGAGCC AGTGTACC AGGCC AGTATT ATGC TGGGATTAC AGGTGTGAGCCACC ATACC AGGCC TTTATT TTTGTTTTG TTGGTTTG TTTCG TTTTTGTTTG AGATAGC GTCTC ACTCTATC ACCC AGGCTGGAGTGCAGTGG AACG ATCTTGGC TCACCGCAACC TCCGC TTCCCGGG TTCAAGTGATTCTCCTGCCTCAGCC TCCCAGG TAGCTGGGATTAC AGGTGCATGCC ACCAAACC TGGGTAA ATTTTGTATT TTTAGTAGAGACAGGGTTTC ACTATGTTGGCC ATGC TGGTCTCAAACTCC TGGCCTCAAGTGATCC ACTCGCC TCAGCTTCCC AAATC ATGTGC TGGAATTAC AGGTGTGAGCC ACTGCCC AGCCTAAG TC TTTTTTTTTTTTTTTTTTTTTTTTG AGACAGAGTCTTGC TTTT TGACCC AGGCTGGAGTGCAGTGGC ACAATCTC AGCTCAC TGTAACC TCAGCCCCC TGGGCTCAAG TGATT TTCCC ACCTCAGCCTCCC AAGAAGC TGGGAATAC AGATACAC TCTACC ATGTCC AGCTAAC TTTT TGTCTC TTTAGTAG AGATGGGATTTC ACCATGTTGGCCAGGCTGG TCTTG ACCTCC TTG ACTCAAG TGATCTGCCC ACC TTGGCCTCCCAAAGTGC TGAGATTACAGGCATGAGCC ACCATGCCC AGCCTCC AGTTG TTATTTTTATT AACAAAG TTATG AAAATCC TTTAGAAC ATGTGG AAAA AGACAAAA AGTT ATAAGGC TGGGTGC AGTGCC TCACACC TGTAATCCCAGCACTTTGGGAGGCCG AGGTGAGC AGATC GCC TGAGGTCAGGAGTTCAAGACCAGCC TGGCCAACATGGTGAAACCC TGTCTTTAC TAAAAATAC AAATATT AGCCAGGCATGGTGGC GGGCACC TGTAATCCCAGCTAC TTAGG AGGCGG AGGCAGGAGAA TCGC TTAAATCC AGGAGAC AGG TTGCAGTGAGCC ACG ATCGTG TCCAGCCTGGGCAAC ACAAG ACTCCATCTC AAAA TTAAAAAAAAAAAA AGTTATG AAAGCCC TAAAAAA TATGGAAG TGTGTTTT TTTGTTTG TTTTGG TTTTTTTG AGACGG AATTTC ACAC TGTTGCCC AGGCTGG AGTCTAG TGGC GCG ATCTAGGC TCACTGCAACCTCTACC TCCCGGGTTCAAGCG ATTCTCCTGCCTCAGCCTCCCGAGTAGC TGGG ATTACC GGC GCCCGCC AGCACGC ACGGC TAAC TTTTTCTATT TTTAGTAGAGATGGGG TTTT ACTATT TTGGCCAGGCTGG TCTCAAACTCCTGACCTC ATGATCC GCCTGCC TTGGCCTCCCAAAGTGCTGGGATTACAGGCGTGAGCC ACCGTGCC AGGCC TGTGC AAGTGTTTT TAGAATCC TGAAGC GCTCC ATAAGGG TCAATG ATCTTTGTG AGG AGGCTGG TGCGG TGG TTCACGCC TGTAATCCCAGCACTTTGGG AGGC TGAAGG GGGC AGATCACCTGAGG TCAAG AGTTTGAGACCAGCC TGGCC AACGTAG TGAAACCCTGTCTC TGTTGAAAA TACAAAA ATAAACC GGGCGTGG TAGTGC ATTCC TGTAATCTCAGCTAC TCGGGAGGCTGAGGC AGGTGAA TCCCTTG AAGCC GGGAGGCAGAGG TTGC AGTAAGC TGAGATTGC ACCAC TTGTAC TCCAGCC TGGGTGACAGAGTGAGAC TCCACCTC AAAAAAAAAAAA AGATC TTTGTG AAG AGATGGC AAATTGCC AGGTGGGC TGGC AGCTTCC ATTTCC TGCCAGCCC AGGTGTTCC AGAGAA AGGCTCAGC ATGC AGACC TGGGC AGCTGCC TTTTGCC TAGACTTG AGTTTCCC AAGCC TTTG ACTATT AAGGCC ACTGG AGATAAAA TGCAC TTCTG AGTGAGG TTAGAGGC ATCGC AGAAGGG TGATGAAGG AGACC AAAGCC AGGGAGAAG AAAGTTCC AGAGG ATTG AGTGGGGCC TAACTGCC AGGAGAG AGGG AGATCC TGG AACCTCC TAAGGC TCCCTGCCC TGTC AGTTCC TTGTCC ATAA AGTGGGGG AGGTTGG GGGC TGGAAGG AGTAC TCTC TTAGG ACCTGC TTATC TTAAC ATTAAAAG ATTTT AGCCGGGC ATGGTAGC TCATGCCTGTAATCCCAGCACTTTGGG AGGCTGAGGCGGGC AGATCACCTGAGG TTGGG AGTTTGAGACC AGGC TGACCAACATGGAGAAACCCC ATCTC TACTAAAAATAC AAAAAAG TTAGCC AGGTGTGGTGGC ACATGCC TGTAATCCCAGCTACTCAGGAGGCTGAGGCAGGAGAA TCGCTTGAACCTGGG AGGCGGAGGTTGC GG TGAGCC AAGATTGC GCC ATTGCACTCCAGCC TGGGCGACAAG AGCG AAACTCCATCTC AAAAGAAAAGAAAA AAAGAA AGATT TTAAGG TTCATTC TACTGAC AGAAG AATCC TGACAGTG AGAAGGC TGACCC TTCTCTC TGCTGATC TAGC TCTAC TCACCCC AGCCC TTTGGG AAACGC AGAGGC TAGACAGG TCCTCC TGGTCTCC TTTC TTCTCTAG AAGGAAAA ACAACAAC AATAG AGTGAGC TCATTTTGC TGTCC AGACAAATG ATGAGCC TGGG TTTGGGC TTTCCC AAC TGTGGC AGGTCC TGATC ATCTCTG TCATCCCC TGTC ATAT ACTCCC TAGGC TGGTGG AAAA ACCCCC ATCCCTGC TTCCCCC TTTG TTATATGG ATATCAAC AATATTTCC ATATTG TAAACC AATTGG AAGCCC TCAAAAGGC AAAAGC ACTGAA ATGGC TGAAATGCC TATT TCTACC TTCTCTGGC AGGCC TCCTGC AGAGAGTCC TATGGGC TAGG ACTGGGG TTTGGGGG AAAGC AGCTCC ATGG AATGTATT ATATC TTTCTCC TTTGC TATGATCC TTGTAG AGGTTGAAG AGGTCTTTG AGATTC TCTAG TTCCGTG TTTTCAAAAC TGAGG TATG AAGGCC GGGC TTGGTTAC TCACGC TTGTAATCCCAGCACTTTGGG AGGCCGAGGCAGGC AGATTAC TTGAGGC TAGG AGATAGAG ACCAGCC TGGCCAACATGGCAAAACCCC GTCTCTACTAAAA ATAAAAAAATT AGCCAGGCGTGGTGGC GCATGCC TGTAATCCC AGCTACCC GTG AGGCTGC GGC AGGAGAA TCTC TTGAACCTGGGAGGCAGAGG TTGCAGTGAGCTGAG ATATC GGC ACTGCACTCCAGCC AGGAGG ACAGAGCGAGAC TCTGTCTC AAAAAAGAAAAAAAA AGTTTT TTTCTTTT TTTGGAGGG AGAAATT AAGTAA TTTAAC TAG TAAGTAA TCTAA ACATT TGCTAC TGAA ATTAAC ACAGATAAAA TATATAA TAAAA TGCAAAA TTG TGTTATT TGTAA TAAAAATTC TGGGC TTCAAAG ACATGG TATGCTTCC TGGGGGC TGCTTC TGGGCC ACAGCCC AGACTCCG ATCCATCC TTAG TGGCC AAACAGCC TGCAAC TAAGG TCTGC TGACTCC TATCC TCTCACTCC ACAGGGCC TGAGC TAGCC GAGG TTTAAG AGAC TCACTAG AGAG AGGGGG TTGCC TAGCCC TCCCTGC ACTTC ATTGC TTTCTCTCC TCATAAGG ATTC AGAACC TAGG ATTGG AGAGGG ATC TTAGTAA TGGCTGGC AGAAACC TGGCC TCTAAG TGGATGGG ATTCC TTACTGAC AGTC AGTGGG ACAGG TGAGGAG AAAAGAGAC AGTGCC GGAGTC AGAAGG ACG AGGTTCC AGGCC TGGCTGGG TCCCTAGG ACAAC TCATTTG ACCACGC GGGC TGGAGAC GGG TGGGCTGC ATGAAG TCTGG TAGGC TGTC TGTGCC TTTGC TACTGC TGGGATAC AGAGG TCTGCC AGAA TCCTC AGGCTAC TCTCTCAGC TCTC AAAACCC TTATCCC TTGGC ATGGGTGG TTTATC AACC TAGCCC TTTGTGGGG TTCCC ACTGCCC TGCCC TCTCCCC AGAGG AAATG ACTTC TTGGG AAACC TAGG ACCCCAGGC AGAACC AGGC AGAACTGG TTGTC TGTGAGC TCACC TTTG TCACG TGTG AGCCC TGTCTAC ACAGC TGCAAGC TCTCACCC ACCCC TAACCC AACC AGGCC TATC TTTCTTTCC TAG AGGTC AATAAGC ACCCC AACTAA AGATAAGC ATCAGAA TCGCC TGGAGAA TTTTGC TCCTAAGG ACCCCACCC AGACC TACCC AATCAGAA TGGGGG TTG AGGAG ATGAGAA TCTCGG TTTT ACAAGC TCCTCAGC TGATTC TAA TTTTTTTTTTTT TGAGATGG AGTCACAC TCTG TTGCCCAGGCTGGAGTGCAATGGC GTG ATCTCAGCTCACTGC AATATC TGCTTCC TGGG TTCAAGCGATTCTCCTGCCTCAGCC TCCTGAA TAGC TGGGGC TACAGGGG TGTCCC ACCACACCCAGC TAATTTTTGTATTTTTAGTAG AGATC AGG TTTCACCATGTTGGCCAGGCTGGTCTTGAACTCC TGACCTCGTGATCC G ACCGCC TTGGCCTCCCAAAGTGC TGGGATTATAGGCATGAGCC ACCACACCCAGCC TGATTC TAATTATT AATC AGACTTG AAATG AAAGCC ACTGG TTCACGG AGGG ATTAC GGG ACTCTC ACTTTG AGCC TCAATG TCCACATC TGTAG AATGGC ACTAT ATTTGTTCC [SEP]
,,,,


In [None]:
df = dataframe_creation(attributions_sum, all_tokens, 74019545, 10)

In [None]:
bed_file_creation(df, './67479')

Enter filename/content/drive/MyDrive/SE_annotation_project/bulk/67479


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_neg['score']= df_neg['score']*mult*(-1)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_pos['score']= df_pos['score']*mult


# SE_67637

In [None]:
text = 'ACAGGACAGGAGTGAGGACAGGAGGTGGCCTGAGGGGGAGAAAGAGAAAGATTTTTGGCTTTATTGAGAATGGTTTGTGGAAGAATAAGAGGAAGCCAAGAAGAAGGAAAGCGAAACGCCCCCTCCCCCCATTGCAAGACAGGTTTCGGCTGTTTGAGACGGAGCATCACAGGCAGGAAGGAGGAGGCAGGGAGGGGGCCTGGGCTCCTTGCCCCCTGCTCGGCCCCCACCAAGAGGATTCCTGTTCTTAGCACTTTGGCCTTAGGGAGACTTGAGTTTCTTAGTCCGTGGGGAGGTTCCGTTCTCTGCCTTCACCACTCCATTTTCATGGTAACCTGGGAAGTGGAGAGAGACAAGCATACATGGTGTTTCTGCTGGAGCTAAGGCAGAAGAGGGGAGGGTGGGGCCAGGCCAAGGAAGGGGCCCGGGCAGCCCAGCTGCTATACATGGATGCACCAAAGGGGCGCCAGGCTGCAGCCTTGCACAGCAAATGCAAGCCAGCAGACGGCTCCCAGGAGGGTCCTGTCTTCCCCAGGGCCCTGGACTAGTGGCCCTGTTTGAGAGGCTTGGTCTCTGACTGCACTTTAGCAGGAGGGGCCTGGGATGACACACAGTAACTCAGCAACAACAGAGGCCAGCCTGCCCAAGCCTGAGGCTGGGGCTAGATACTCGCCGAAATCACTTAGATGCTGTCACTGCTCACTGTCCTCAGTTCTTCTCAGGCCCCTGCAAGGCATCAGCCCACTTCCAGTTCAGCAAGAACTCCCAGGAGCAGTGGCCACAGAAGGGAGGGGGACAAGAGGCTGTAGGAACAAGGCCTCAAGCAGGATGCCTGACACTCCTCTGGCAGAAAAATTGTGCTCTATTGTTCAAAATACCTCCGTGCGCTTGCTCAAATTCAGAGGTACTGGCTGCAGTCTTATGCCCCATACCTCCCCCGCCAGCCAGGCCTGACTCTGTGACACACCCAGCTGCGCGCGTGTCTGGTTCAAACACACATAAGCCTTTGCCAAGCAGGTGGCCACCTAGAGAAAAGCAGGTGAGTCAGAAAGCAGCGCCCAGTGCAGACAGGCCCCCAGGCTGGGCAGAACGTGCAGGGCTGGCAGGGCCTGAGGACCTGCTGAAGGTGGGTGATGACTGGAGTGCGTGCACGGGCCAAAGGATAAGTGTCCCACCCCTACCCCCCACCTAGCACTATGTCACTGTGAGTCATTCTTGGAGACAGAGGAGGAGCCAGCAAGCTGGGAGGCAGGGGCAGGCTAAGATGTGGAGCAAAAGGGCAGGTGAGGACAGAGGCCGCCGTCCGGCACTGAGAATGGGCGGCGGCGGCAGTAGCAGCACTTGGCTGGGGTCCAGAAGCCACCCTGAGGACACGCTTCCTGCCAGAGTTCCCCACCCAGCCACTGCCCTGCCCCGTGGTGGCCAGGGCTCCCAGCCTAGTTAGGGCCAGCCCCACCCACAGCCTGTCCCTGGCCCACACCCAGCCACGTGCCAATCAGGGAGCTAGGAGCCCCAGCCCTGAGGTAAGAGTCAGGAAGGAGAAGCTGGCAGGATTGGTCTGGGCAGCGCCCAAGAAGCCAGGTGCCTTGGCTCCTCCCACCCATCCCAGACAGACTTCCCTGGCTCCACTCTCTGCCAAGGGCCCTGGCACTCACCAGATTCCCTCTTGATGAGCCTGGCTGGTAGTCTGGGTGTGGCTGGGACTCTCCGCTTTGCACTCTGCTCATTCCAGTATTCCCGCCAGTGCCGCAGCTGGGAGTGGATGAAGCGCCACATGAGCCAGGCCTGGGCGGCACACACCAGCAGCAGCACGCAGAGCCTGCAGAGCAGGGGGTTAGGGGCTTAGGCTGGGGCTTGGGCTCACAGCCTTGGGCTGGGTTGTGCAGGGGAGAACAAGGGCCAGGGGCCCTGCAGTTCCCATGGCTTATCACGTCCGCCTTCACCACTGGCCCTCTTCGATACCACCACTATCACCAGGAAGAATGTGTGCTTCAGTCAGTCTCTGCTCCAGCATACATCACATGTGCCAGGGAGACGGGAAGGAAGTGGCGACAGACGTACGGCCAGCTCTACAATCACGCTACTCCTATGACGAGGGAGGGGTCCATGGCTGTGTCTGTTTTGCGCCCATTGCACAGAACAAGACTAATGTAAGCTCCACAAATATTGGTAGCATTCAAATGAACTGAATTTCTGGAAGAGTGGCTTCTCATTTAACATGTCACTTAAAAGTGGAGCAACCCTGGACAAATCACTCTCCTGGGCCTAGGGGCTCCGGAAAATAGTGGCTTCCTCACTGCCACAGGAGGCCACTGGCCAAGCCATTAAGCACATGGTTTTAAAGCACCCACACACAAGAAGAGGAGAATGATATCAACTGAGAGACTGGGTGTGATGCCTCTGTGCACCACAAAGTGCCAGACAAATGTAAGGGATTCCTATTTGGACTACAGTCTGAGCAAACCAGGACTAGGGGATGAAGATGGTTTGGATGGAACCAGAGGCTGCTATCTCTTCTCCCCTCAGGCCTGATATCCAGAGATTTCCAAAAAATAACAATATGTGGGAGACTAAAGGGTCTGCTGCCTCCAGACCTTCTGCAAGGGCTGTGCCAAGTTCAGGAGGCTCCCTGGCTTATCACCTTGGACTTCTGCTCGACTCACCTGCAAAACAAAGTGTTGAAGTTCCCTTTCTCGGGATCAAATGCCTGGTTTTCCATGCGAGCCAGTCCAAAGCCAATGGCCAGCACGGCAAGGGTGAGGATGAAGAGGCGGGTAACCCCAAAAACAGCAGCCCAGGCACTGAACCTGCTCACAGAGGCAGAAGAGGGATGTCAGTCTTTAGCGCCCTTGAAGGAATCTTCACCCACTTCTCCAGAAGAGACCCCGAGTGGGAAGAGGATTCAAGGGTGGCTGGGGAAAGTGCTTGAGGGACGAGATATCTAAAATCAGATGTTCCAGAAAAAAATAACGGGAGGGCACCACCTGCAGGTAAGCGGGCAGTGTGCAACCAGGGAGGGACCCTCCAACCATCCGGGCCTCGGGGGAACCCCTGCCCAGGCCTCTAAGCGGGCCAGCCTGCAGCAGACCCACTTACAGTTTCTCGTTGTTTTCATCTGCAAAGTAGAAGAGTCTAGCCGTGTGGAAGAGGAACTCAGTTGAGTACTGCAGCAGCAGCAAGATCAGGCCCAGGCGGCTCAGGCTGGGGGTGGGGAAGACTAGACTTACATTCCCTCCAAGATGCTGCGTGGAGCAGAAGCCATTGCATCTTGGCTCAGGCTGTCCCCTGTGCCTGGCTGGGCTCTGCTTTCCACTCCCACTTTCCCTGGCTGGCTCTGCTCCATCCTTTGGATTCAGTTTAGCTCTCACACCTTTAAGACATTTTTCCTAATACCGACCCGCTGGCCGTTCAGCTGTCCTGTCTCAGTCAGATGCCCTTGCCTGCTCCCACAGCAAACCTCGCATAGGCCCTTCACAGTACTTAGCACCTTGCACTCATCACCTAGGCTGGAACCAAGTACATAAAAGGTACTCAGAACACATTTGCTGAGCTCTGAGTATAGGAATATGAAATGTTCCTGTTGTCTGACTTTCCATTATCCAAGTCTTCACAGCTCCGAGGTACATGCAGAAGCAGCAAGTGCTCCTTCTGTGTGGCCCTGCTTATACGTTCTTCCCCGGTCCTCGCCACTGCTACGGTGACAGTGCAGACTGGCTTCTTAGACCCGTTATGCATGTGACACATGACCATCCAACACAAGGGCAGAGCTGGCATCACCCCACAGCCTTCAGCCCTCAAAGACCCATCCGGGAACTGACGCTGCTACAGGCCACCAGAGACAGGAGACAGAGTTTGAGAGCTCCTTCCCTGCCTCAGTCTTACTAATCCAAGTCAGTCATTCACACAGGATGCCTGCTGCAAGGACCTAGTCCAACGCACCTCGGGATTTCCAGGCACCTCGGCAGAAAGTTACACACAGTGAGCTCTGTAAGTGCCAGCCTAGAGAAAGTGTGGGGTGCTTTTACTGCATGGATAACACTCAGCAAAAGCCCAAATTATCAATGACACAGCTTATTAACATCAAAAGGATTCTTTTCATAAAAGAGGCTCTTCGAGAACTAATATTATAGCAATTCTTTCTGCCTCTAGAACAACCAAGAGAGACCTACTCTCCATGTCATTATAAACCAAAGGGAAGGGAATTCCAGGGCTACGAGCTCTAGCAGTGTTTGCATTGGACACTGTGAGGTAAGAGCCCAGCTTTGGGAGGCCTTCAAGCTGCAAAGCCATGGTTCAAAGGCCGACATCCACTGGAAGTCTTCCTGGCTGTCTCTGTTGAGGGTCTTCTTCTGGGTTGCAGAGCAGATGATACATACTGTGTTATGGTGTTCATCACTCTCAACTGTCCTTACTTATGTCTATAACTGTCTCTTCAGAATGAGAATGAACCACTGAAGATAAAGAATCTTCCATTACCATCTTTGTATTGCCAAGTCTTAGCATAGTGCTAGGCACACAGAGGATGTCAACAAATGCCTGATAATTATATGAGTGTGTGGACAGATGCATGGACATAAAAGGGCAAGGAAATCTGGCTGGCTCCATGGTCTCACTCACTTTAAGAGGTATGCTCCAGCTATATGCACCAGGTACAGGCAAATATACTGGAGCTGGCGGGGAATTTCCTCCTGGAAACAAGAGAAGCAGATGGTAAATTTGCTAATTCCCTAACTGAAGATTCAGGGAAGGGGGAAAAGTGCAGGGGGATGAGAGAGGGCCAGGCTCCTCTGGGCTGCTTTAACACACAGTCCCATGTCCCACGAGTCCCACAGTCCCACTGCACCAGGCTGCTGAAATTCAAGGGCATTCAGGTCCATTCCCAAATTCCAGCAGCCTTGGGTCTAGTGTCAGAGGGTGAGGTTTGGATTGAGAAATAAGAGACAGGGACTGGAGAAGAGGGCTCTTGGAAATAATTCAGAAGGAAACTATAAAAAGTAAAAATAAAAAAAGACTATGGAAATGGCAAAGACCTCTCCTTTGACATCTATAAGATGAGAGTTAGGTTTCCTCCAAAGCCACAGGTCTGGTGGAAGAGGCAGGCAAGAGACTGACACTGGTGGTCAACTACATGACACTTCTCCAAGAGATGACTCAGCATGTTGCTCAATCCCCAACATATTCCTATCACCACCCAACACTCCATGCTTCTGGAGAAAAGGAAGGGAGGTACCCCTGGGAATAGCAGGAGGGGAGTGGTCAATGAATGGCCTCCAAGAAGGGAGAGAAGTGAGCACTCACCTTCCGTACCTTCTGGAAGTATAGCTCAGGAAGTGCGTGCAGCCAGTAGGCCAGCTGGCATAGGTAGAAAAACTTCACCTGGAAGCTGGAGACAAGGGGGCAAGTCACACGGGCAGGATAGAGAAAAGTGTCCCTGCAGGTGCTGGCCAAGCACAGGAGGGAAAAGCATGGGCTGAGACTCTGCCTGTGAGGAGCTGGTCCAGGAGCAAGGGAGTTAGGCCAGTGACCGCCGCACCCTGAGCCTGGGACCCTGGCTTCTCCATTGGCCTGTGCCCTTGTTCCACATACAAAACCACTTAAAGGACACGGAAAGTCCACAGAAAGAAACAAACATGATTAAAATAGTGCAGAGGAGGAGGAATCCTTCAGCCTTGAGGAGGGAGCTGATTACAGAGCACTGTTGGAGATAGGGACCAACAGATACACTGAGACAACAAACAGCTCTAAGTAGCAAGGGAAGGTTCTAACTCAGCCCTACATCCTTTGCTATTATTGCTCTTAAAGATCTCGGGAAAGGCAGCCAGGCGTGGTGGCTCACGCCTGTAACCCCAGCACTTTGGGAGGCTGAGGCAGGTGGATCACCTGAAGTCAGGAGTTTGAGACCAGCCTGGCCAACATGGTGAAATCCCATCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGCACATGTCTGTAATCCAAGCTACTTGGGAGGCTGAGGCAGGAGAATCGCTTAAACCCAGGAGGTGGAGGTTGCAGTGAGCTGAAATCATGCCATTGCACTCCACCCTGGGCAACAAGAGCAAATCTCCATCTCAGAAAAAAGACAAAAAACAAAGATCTCGGGAAAGGCAAAGGGTGGCCTCCTGAGGGAGATGGCCCCAGGTATTGCCCTTGGGGTACACTGCCCTCTTGGCAGCACTATATGAGGCAGAGGACACTGGCTCTGACAGACCACCAGCCATGGCAGGCCAGAAGGGAAGACACTCTGTGGATGTCAGGGGGTCGCCAAGAAGGTAGAAACCCAGAGGGCATTATGGAGAGAGATGTTCTGCTTCTGAATCTGTCTCATGCAGTTGAGGGACCTCTGTGATGGGAGCCAGCACAGATGGAATTTCATCTGGGGATTCTCTGGTCAAGCATGCTGAGAAGAAGTGGCTTCCAGACAAGTCTACCATCCACAATAGGCTCAGGGCATGATCTGCTCGTCAGGCCAGCTGGGCCTGTGGTGTTCTGGCCACACTCCGCTGGGACAGGAAGGCAGTGGGCCCGGTCGCTCCTCCCTGGGGCTGAGTCAACAGAATACTCACGGGAGGTGCACATGCGGGTAGTCTTCCCAGAGGCTTCTTGGGTTTGTTAAGTATCCTTCCTGCAGTGGGCAAGAAGAGAGACCATTTAGAGATGTGGACGTGAGACCTGCTGGGGCCCTGGGACCGGTCCAGGGGTCAGGGATGCATCCAGTCCCCACCTGACAGAAAGAGGAAGGAACAGGAAATGTGAAAACAGAGAACTTCTCTGTGTGGGACCCCTGGCGCTTGGCTGGTTTCTTTACTGTGGAAGAGTCATGCTGGAGTAGGAAGGGCCACGCTCTGAGGTCCAACGACCCATATCTGAAGATGAGTCTGACAAGCGAATTAGTCTTGCTCCTCTGAGCAAGCTAATTAGTTTCCCTAAGCCACAGCTGGCTCATCTGCAAAACAAAATAAAAATACCCACCCTCACAGAGTTATTGTTGGAAATGAATGGGATAGTTTATGTGCCAGTGTCTAGTCCTGTGCCTGGCATGCAGGCGCTCAGGAAATGCCTCCATAATGAATAAGCAAATGAACTCTAGAATCACCACTCGCTGGAAAAATGAAAAGCCTACTTTGGCTTTTCACAGCCTGCTGAATAAAAAACATGGCAGGACCCCATAGGCCTCACCATGCAGCTGGACTCTGACACCTACCACACTGTGTCATTACTGTCAGTTGTTTCCATTACTCTTGCAAGTCCCTTCACACTAGGGCCTTTTCTTGCCTATCTTTAGAATTCTAACATGTAGTCCAGCACCTTATATGGGGTGGGGATGGCAACATGAAAATCCTTCCATCACAAAACATCTAGAAATGCTGGGTGAAATCTAATGAATATTCTTTTAAATGCAAAGAGCTGAGCTCACAGTAAGAAAGGGAAACCCCCTGGGACCCAAAGGGAGAGGGAGGCTAAAAGGCAGAGCAGTAAAGTGACACTGTAGCAGCCCAAAAGGCACTAGTTATGGGCCAGGGTTTTTGTGCCCATGTGAGAACAGAAGATGGTGCCTTGGGAGGTGGAACCCAAGACCTTGTATAAGACCAGGACCTCTGAAAGGCCACAATCTCAGAGAAAGGAAAAGACTAGAAAGTGTTTGCTGACCAACACAGGGAAATGAAGATGTCTGCTCAGCCCATACCCAAGGTGAAAACAAAATCATTTATTCTAAAAATCTGCAACCTCAGGTTCACTCTGAGTTTGGAGGTGAAATATACTACCTGTGTGATCCAAAAGCCGCCAAGGTAAGAAATTAGAATTAATAGTGTGGTGGGCCAGTGATACCCTGGGGACATACCCTCATCCAAGGATGCTCCACAGATAAAACCTTGCTAAAGATGAATTTATAATCCAAGAGTACAAAGCATGGGAAGAAATAATCTACCACAAGCAAGAGTCAGCTGAAACTACAGGAGTGCAATACACACCAGTTGGTTGAATGAATGAATGATGAATGCTTTGGGCAATTTCTCTCTTCTGAAGAAAGGGCTCTTATTTGTCACTCAGAGAAGGCAGAGCAGATTAGATTAGGATGACTTCATTTTAGAAATGGGAAAATGAAAAAACAGATAGGAAGGATCTCCTGAAATAAGATAGTTTTGTTTTGTTTTTTTGATATGGAGTTTTGCTCTTGTTGCCCAGGCTGGAGTGCAATGGCACGATCTCAGCTCACTGCAACCTCTGCCTTGCAGGTTCAAGCGATTCTCCCGCCTCAGTCCTCCTGAGTAGCTGGGATTACAAGCACGCAACACCACACCCGGCTATTTTTTGTACTTTTAGCAGAGACGGGGTTTCACTATGTTGACCAGGCTGGTCTCAAACTCCTGACCTCACTTGCCTCGACCTCCCAAAGTGCTGTGATTACAGGCGTGCACCATTGCGCCCAGCCAAGATAGTTTTTCAGTAGCACAGCTGAAATCCGAGTTGGGCCACAAGCCTTCTGGTCCAATAACTTCAGGCTAGGTTGCTTCAGTAAATCAGAAAATCAGCTGAGCTGGTGGCTTTGATGAGAAGGCTGAGAACCTCAGATGTTCACACTGGGATTAAAGGCAGAGGTTTTACAGTGCTCAGAATGAGGCCAACAGGGTTTAGTAAGAAGCATTCTAGGTTATTGTCTATTAGGATCTTTAGTTGTATTTCCAAGTGAGGGCTGATCCACCCACCTTTGAGTCACTAAACGCCCTGTGACCTATCAGCATGCCTTTCGGGTATAGTCCACGGCCCTAATCCCACAAACTTGGGCCTCCATGAGCACAATAACCTGACTGATAAGTCCTTTTATCGGATACATCTATACCACTGTAGTCACAGTCACCTGGATTAGAAGGAAATGATCTCACTTCGAACTTACATGGCCTCATTTCTAATCTCTTCTCACTACCACTCTCTCCTCCCTGGGTCACGTGCCGATTGAGGAATAAAAGTGGATGAGGCTCTCGGGTGGTGGCGTGTGTGGTGGCGGTGACAGTTGTGAGCTCTCTCAAATACACTGCTTCTATCACCTCTACCCACCCACTCTGTCGGGCATACGCCTGCCTTCATCAGCTCTCCTGCCCCAGGCTACCTCATTCCAGGGACATCAGAAAGGTGAGAATGTCTCTTCCTAGAGGAAGCAGGAATGTACTTAGCAGGAAAAATGGTACTTCTGAAACTGAGGTGGGAGAGAAAGTTTTGCCCAAACAAGACTCGCCAAGAAAAGCAGCACTGAGAGCAATGTAAAGCCCAGAAAATCTCGTGATTTTAAACAGGAACGCTCCTTGGCTTGGCCTCTTACTTAGAGACAAAGAGGTCAGAACTTTGAAGCCAAAAAGCAAAGAAACTCCCCAGAAAAATGTTGCCTGCTTGTGAATGTCCAGTCCACGGGGACTGGAGGAGGAAAAGGGTGGAGGGAGGAGAGCAGGGGGAGCCAGAGGAAAAATGACTCACTGCTCTGAGAACAGCCTTTTCCAGACCTCTGTCCAGGCAGCTGTCTGAAGGAGGACTGAGGCTGGGGCACCCTCTGAGCTCAGGCACGCAAAGCACCTGAGTCCACAGGGGGCTGAGTGTGACCCAGCAAGCACCTGAAACCCACCCCAAATCCCATCCACTGACAGGCCCCAGCAGATGGTTTGGAGAGGCTTTTGAAATCCTTTGTTCTCTCGATTCTACAAATCCACCCATGAGCTAAGCAAGGCCTCAACAAGGTGGAGAGATCCCTCCTGTTTCCCCAGCAGCCTTCCTTTTGGTGTGTGAACAAACACAACCACGAAGAACAGCATAATTCAGATATAGCACAGGCAAGTGCTACATAAATTCAGACATACCTTATATTATTTGACCATCAGAACAACCATGCACTAAAAATCTGCCCTAAAGCAACTAGTCTGTTAGTAGAAACCGGTCCTGGTACAAGCACCAGCATTAAGGACATTCCCTCTACTTGGTTCTAAAATCTACGGTGGATTTTAGGTTCTAAAAGATGAAGCCAAATATAGCAAGGAAGTCAGACAGGGAAGACCAAACGCCCACCCATCCTGCTTTCTCCAGTGGAGTGTTTTTTTTCTTTTTCCCTCAACAATGAGTAGTCGATCAAAGGTAGATTAAAAGTTGGAGGCTGACATTCCTATAAAATTATTGGCGGTCCAGCCACACTCCCACTGCTCTGCCTCTATATATGCAGAGAGAAATGTTTCAATCAAACACCAGAATAATACTGGTATTTCTGGTGGGAGGAATTTGCTTTTTTGAACTTCTCTATATTGTTCACTTTTTAAAAAATGATCATTTATGATATTTATTAAAACAACCAATTCATTACTTTAAAAATGTTGAAGGCTGGAGAGAGAAGATGCATTTGCAGTTTATTCACTCATTCTCATAGCCAACATTTAGTGGGCACTTAGTATGTGCCAGGCACCATACCAGGGATACAGCAGTGAGCACCGTGCCTGCTAGCAGGCAGCTCAGAATCTAGTGGGAGAAACAGAGAATACAGAATACACAATCAAGAGAAGCACCAGCAACAGGCACAGTGCAGAAAATGCAAATTGGTGGGGGGTTCTCTGAGGAGATGGTATTTAGGCAGAGACTTGGATGGCAAGAAGGAGTTGGCCATGGGATGGCAGGGGATGGAGCCCTTGAGCAGAGAAATCACCAGTACAAAGCCCAGGATGCAGAACAGCCAGGCCAAAAGTGGGGGTGTGGCCAGTGAGATGAGACCAGCAAGATTAGCAGGGCCCAGATCACATGAATGGGGAGGAAAAAACGATTTCACTGCAAGTGTGATGGGACTTTTAAGCACGGGAATGTATGGTTTTATTTCTGTTTTAAAAGATCCATCTGGCTGAGCAGAAAATGGATTGGGGTGGGAGGGTACAAGAGTGGAAACAGTCTCCTTCTAGAAAAAAGATATTTAGTGTCTAGGCAAGAGATGATGGTGGCTTGGACTATACAGATCGAGGTTTCTCAATCTTGGCACTATGGCCAGATAGTTCTTTGTTGTGGAGGCTGTCCTGTGCATTAAACGCCATATCGTAGCATCCCTGGCCTCCACCCACTAGATACCAGTAGCATATTGCCAAATGTCCCCTACAGGCCCAAATCTCCCCTGGTCAAAGGTCACTAGACTAGGGTTGGTGGTGCAGGCAGAAAGCAGCAGACAGTCTCAATGTGTTTGGGAGGCAGAGCTGGCAGGACCTGCCGATGAAATGACTGTGGAGAGTGAGAGAAAGAAGAGTCATGAAAAAATTTGCATCATAACAGAAAAATATTATTTTTTTAAAAAAACAAGCTGTTTTTATGCCTTTTACAGAACTACATCTCTTCTTCTTCAATCACTTTCCTTCCAGGAAGCACAGTTCCAACGGAGGAGGGCAAGGAGTCAAATGTTGTTAGGAAGAGTGGCGGGGGTCGGGGGTCACTGGAGCTTTCCGTGGTCCCCTGGTCTCTGTGCCTATTGAATATGTTGAGTGGGGAACTGGCTCTTCCCAGAATAAAAAACTGTTATGTGCCTCCCCAAGAAAAGCCTATGTGCTCTCAAACTAATTAGCATCATGTTCAAATCCTTGAAGAACTGAGAGAGGCAAAGACAGAGCTGTTGAGCATTTCACACCCTGGAAGGCGTGTTAAGCAACTTGGCTCTAGCCTCCAAATCTGGTCGCCACGTGTCACAGCTGGGGTGGAATGTTTGGGGGTGAAGTTGAAAGGGTAAAAGTGATTCAGAGATGAGGCAATCCTCCTGAACGGCGTCTTTGGTATCTTGAGGCTGTTCTGCTTCAAAGCAGCTTAGGCCTCCGGGGGTGGGCATGAACTGAACGTCAAGGGACTGGGTGTGGTCTGAAACCTGGAAGTCTAGGGACTTGTGTGCATGGCACAACAGCAGGGATGCACTGTTCACACAGTGTCAATCTGCCCCTGGGACTGTGACAGCCTTGCCTGAGAGGACAGAAGTCTTGGGCCCCCCATTTAAAATTCCTAGTATTCTGCTTAGGAAAGCTGCTCTATGATGAAATGATAATAGGAATAAAAACAATGTACAAAAGGACACGTTGACTCTGGCTTTGAGAATAGGAATTCAACATTCAACTCTGGAGACAGAGTTCCTTGTGATGGGAGCGCCCATCACTGTCACTGAAAGAAGAGGAAGAAAGTGAGGGATCTGTGGAAGGCCGGGAAGGAAATCTTAAAGAGGTCACAGGGTTGCTGAATTTTCCAAGACCCAGGCATGGATTTCTCAGGGGGCCAGGTTACAGGAAGGTAGAGCTCCAGGTGGTGGTGGGTACTAACTCAATACTTCCTAGCAGGACAGGCAAGGTCTTGTTACAGGAAACTCCAAAGGACCATCCACATTCCTTTCTATGAGGGAATTTTGCTGTATCAAAGGCTGCTTGAAATAAGAGTCTGTTTACATAGAAAGGAGGGGAAAATTGTCTGGTCCTGCAGGCATTTGTTGAAACGGCATTGACTCTCACAGGATTTGATGAGCTGACAGAGTGAGGCTGGCCTCGTTTATAGAAGGCCAAGGTAGTAAAACAGAGAGTAAGCTGGGCTTGGAACTCTATCTCCAAGTCCAAACTATCCTTTGCTGTTTCAAAACCACAGAACCACAGGCATACTGCAAAATTTGAGCTTGGAACTCTTCAATCTGTAACATGGGTATCAGAATGAACATCAAATGTATCTTATGGGACAGTGTTTGTAGAAGAGCCTTGTAAAACAATACAGTATTATGTAGATACATGGTATCATTACTGCAGTATTGCATAATGATTATAACAAGTGGTGACTGTTGGCCAAGATGACTCTCTCCAGCTATAAAATGGCATCTCTCTGTAATACCATGAGGATGCAAACATAGCTTCAGTTCTAAGAAGCTAAGAAGGTTCTAAGAAACTTGTTCCCCTTAACAGAAAAAGAAAAAGAGCAAGGGGTCCTTTGCAGTCATTTGATTAGCAATCCCAGAGCTGGAATTGCCCCTTGGTTTGAGCTCTCCCGCTTCAGCAGTCCTGAGAATGGCTCACCGTCACCACCACGTAGAAGCACCAAATCACCGAGGTGAAATGAAAGACGACCAGCTGTCCAGATTCATTGAACTTGCTGTGTTTGACTTTGGAGAGATGAAGCCGTTTGCTGATTTTCTAAAGAATAAAGAAAACCCCTCATATTAATATACAAATGTATCCATATTGGGCAGGTTTCAAACTCTTGTATTCTCCCCACAGAAGGGTTGAACATCGTTAGAAGTTTGCAGCTGGCCATAATCCAAGTCATTTGGTGTAAGCCTACTGCGTGCATACAGTGCTTGGTCTAAGGCAAGCATTTTGAGAAAGTGGCAAGATGAATGTCTCTAGCCTATGTGTAAAGAAAATAACCCCAATTACTCAATGTGCCCCAGACCCATAAGGACACCATCTCCAGACAGCTTTCTCTCTGTGTAATAAATACTGCTGTCCCATGTGCTGATTAAAGGAGGCTGTGAACAGAAACCAAAGTGTGGTGAAGGAAGCCCAGGCAATAGACCCAACCAGTGCAAGCAAGTTGGAGGATGAATGGGTGCAGAGCTGCAGTTTCCTCCAAGGCCAGGTCCTCCACCCCAAGGCACCTCCCCAGCTTCTGATCTCAGAATCCAGACATGTCACTTACATCTAAAATGTACTCCTGAACCACAGCATGCAAGATGATGGTGATGAAGATGTAGAACAAGATTGTGACCAGGTCCTTAGGGCCATAGTGGTAGTGCACGGTCTCACTGTCTGTGGAGGTAATAAAAGTCCCATCAGCATCCCTGGGGGAAGGAAATACTCTGGGACCCAAAACTGAAATGAGATGGGAGGCGAAATGCGCCATCAAATGCTACCCGTTTGCTATAGCCTCAGACTCAGAAGAAGGTTTCTGCCCCAGAATCCTGCCCACCCTCTGGTCTTAGCACTTGGAAGCACCAATGGAGATGGCTAAGGAGAACCAAGTGCATGGCTGTATTGTCATAACAGTATCTCCTGAGTCTGTGCAGCAGAGCACAGTGGTTATAACAGAGCCAGGGTTAGAGACCACCAATCCCCATCACTGGCTCTATCACTCCCTAACTGTGTGACTGTGGATAAAGGACTAACCTCTTTGAGCCTCAGTTTCCTCCCCTGTAAAATGGGACTATAGTTATGCTTTCTCAAGAAAGCACCGCGTAAGGGCTAAATGTGGACTCAGAAGCTGGACTCTTCAGTTTGTATTGCAGCTCTGTCCTATGTGACCCAGGGGTATCTCCATGTGTGACTTTTCTGTACCTCAGTTTTCTCATCTGAAAAATGAGGACAACATTTCCTGCATAGTAAGTTTATTATGAGAATTAAATGAATAAATGCGAAGTGCTTAGAACAGTGTCTGGCACATAGTTAAGTGCTATATATGCACTTGCTATTATTTTTGTTGTTGGGCTAGTGCAAGGATCAAATGAGATAATTTGCTTACAACAGTACCAACAATTTACAGTAAGTCTGCAATAAATGGTGGCTTATTAAAATACAATTAAATAGTAATAAATTAGACAACATCCCAGGTATAGAAATCTTGTGAAACTCCGCCATTGCAGCCTGTGGACAGAGGAGAATCTGCATCCTTGCTCCAGTCAGTGGGCAGCAGGCTGCGGGGCTGTGAGCCTGGTGGCCGTGTGCCTGGGTCTGGGCTGCTCTCTGCAACCCCCACCTCCACCAGGCAAATGGCTGCTCTCCAGCTGTGCTGCATTCGCTCTGAGTCACACACACATGAGTCATCTCACTGCTGGGATGCATTTACCAGAAGGTAGCCAGGCTCAGTTTGTTTCAGGGTGGCCAGGGAACAAAGTCAAGCTGATTGGGTCACTCTGGGAGTCCACCCTAATCTCAGCCACCCTAGACTGGGAGAATGTAACGGTGGGCAGTGGTGAGGGGGTGGGAGGAGGTGGCGAGGACAGAGAGAACATGATCTTGGAAATCAGACAAACTTTCCTTTTTCCTCTCCCTCTTCCTTTCCACAAAGACCTATTCTGTGAGAGGCACTGGGCTAACTGTTGAAACATGGAGATAAAAGACACCACCCCCGGTTGGAAAACATACAGTGCAGCAGGGAGACTAACAGACAGATGTACGATTACACTACAGACGGGCAGCGCTCCTGAGAAGCACATACAGTGAGCCACAGCAGGCGAGGGCCCCACTCTGGCTAGGGTGGAGGTTGTGGGTAAACTGTTCACTGGTCAGGGTGAACAGAACGGCATTGGAACTCGGGGACCAGCAGGAGAGGCCGGTATTGGGGACATCCTAGCCAGAGAAAGCAGCATCCACAAAGAATGAAGGGACTGAGGCTGGACTGCTGGGGGCGGAGGGGAGGTCACCGTGGTGAGCGGCGGGCTGCTGTGCGTGGCCTTGTGTGCCATGTAAAAGGGTGTGGACTTTATCCTGAAGGCAACGTGGAAATATTGAAGAATTCAAATTAAACAGGAAAATGATGACATTTGCGTTTTGGAACATTTACTCTGGCAGCAGTGAACATGCCCAGAGGTAAGGACACCGGTTAGAAAGCTGTTCCTGTGATCCAGGTAAGAAGCCACAGGGCCTGAATCAAGGCAGGAGAAGAGAGAGGAAGGGAGAAGGAGGGCTGTCAGTGAGAGAGAGCTGATGAGCCTTGGCCACTGAGGACCGAAGGGCTGGGATCCAGGATGGGGAGTCAGGCACTGAACACCCGAGGAGAAGACACGAAGATGAGGGAGAGGAGACTCATGGCCCAGCCTCTCCACTCTACCACATGTGACGCCAGGATTACATTTTCCTTGCCTTCTTCATAAAGAGACCAATTAGGTGGCCGCATATTTTGAAATTATAAAATAACTAAACATAGTTTCATCATCAAGATCATCCTTACTAGGCATAATGGGATTTATACTCAACCAAACAAGCACAGTCCAAAAATCAGTGAAACAGTACCTGACAAGACCTTAGATTATCCATTTTAAAGCCCTTTACGAGGGTCACCTGCCATTCTTGATACCAAATACTAGGGTTCCAAAGAAATATGACTATAATCTGAAATCCTTCTTGAAACTAGAATGAATGTAGAAATAAACACAGACTCGTGTTCCTCTGCTGTTGAGACCTGCGCACATGCATCCTCATTGGCTGACGAACCACGCACAGGGCTCCATGCTGGGCACTGGGAGACGGCAGTGAGCAAGGTGGGCACAGCCCCTGCCCTCTTGGAGCTTAGCGGGTACACACCACATCCTTGTACACTTAAACACCAGCAGCCAAAGAACTGTAACTCAACAACAAAAACCAAACAACCTGATTCTAAAAGGGACAAAGTTCTTGAAGAGACATTTCTCCAAAGAAGAAATACAAATGGCCAATAAAGACATGAAAGATACTCAACACCACTCATCATTAGGGCACTACAAATCAAAACCACAACAAGGTTATCTCCTCACACCCATAAGGACGGTTACAATGAGGAAAAAACAAACAAGCAAAAAACAGAAAAACAACAAGTATTGGTGAGGATGTGGAGAAACTGGGAACTTTGTACATTGTTGGTGGGAATGTAAAATGGTACAGCCACTGCAGAAAACAGTATAGTGATTCTTCAGAAAGTTAACAATACAATTACCACATATTTCAGTAATTCCACTTCTGAGTGTTGGGGTAATTGAAGGCCAGATTTCAATAAAATATTTGTACATCCATGTCCATAGCAGCACTATTCACAACAGCCAAAAAGATGGAAGCGACGCAGGTGTCCATGGATTGATGAATGAATAAACAACATGTGCTGTATACATACAGTGGAAGATGATTCAGCCTTAAAAAAAAAAAAAGGAAATTCTGACACATGCTACAACATGGGTGGACCTCGAGGACATTAGACTAAGTTGAATAAGTCAGTCACAAAAGGACAAATACTGTATGATTCGATTTATATATGAGTTACCTAGACTAGTCAAATTCAGAGACAGAAAGCAAAATGGTGGTTACCAAGGGCTGGGAGTGAGAGGAATGGGAAGGTGCTATTTAATGGGTACGGGGTTTGTTTTGCAAGATGAAAAGTGTTCTGAAAATTGGTTGTATAATAACGTGAATGTACTTAACAATACTGAACTGTACATTTAGAAATGGTTAAGATGGTAAGTTTTATGTTATGTGTATTTTACAATTTAAAAAACAACAACAGCCAGCTGTGTCAATGCTCTGAAGTGGACTGAAGGCTGGGGGTGTGGAGCAGAAGGTTGGGGACCTGCAGAGGTGGGAGATCAGGAAGCACCCCTTAGAGGTCAGGGCAAGACATGCGGACTGTACCCTAAAGGAATGAGAGCTACTGGAGGATTTTCGTCACATGTTCATAGAGACCTCTCTTCCTGCCACAGGGAGAATGGGTTAGAGTGGCAAGGCTGGAAGCCAGGAGAGCAGTCAGAAGGTGCCCGTGGGAATTCCAGGCAGAGCAATCGGAGAAGAGATGGGCGTCGGATAGAGTCAGTGACGGAATCAAAAGAACCAGCTAACAGCTGGCTACGCGGATGGATTCTCAAGTTCCTTCTGGAACAGTACCTATATTCTATAGCCTCTTTCATGGTTTTAAAATTCTGCAACATGCATTATCTCGTCTGATCATCCTAACTATCTCATGAGATAAGCAAGGAAAGTGAATGAGGAAAGAGTTCACAGAGTTAAGGGACACAGTCCGTTTCTTGGGTTTCCTCACTCCTAGAACCCAGCCACCAAATGCCACCTCAAGGTCAACACAGCCCCCCATCCCACCCCATCACAGCTCCATTTCTGGTAATATACCATTCCTCTGACCTCTTACTCCTACAATCATAAGGAACAGCTTCATACACAAATAATCAAAAGCTATATTCTGATTCGCACAAATTATCTCCATGGTTTCCCTCCTTACCTGCTATCCTCCTACTTTTTGTTTTGTTTTGTTTTTTGAGACAGAGTCACCCAGGCTGGAGTGTAATGGCGCAGTCTTGGCTCACCACAACCTCCCGGGTTCAAGCAATTCTCTTGCCTCAGCCTCCCAAGTAGCTGGGATTACAGGCGCGGGCCACCAGTTCCGGCAAATTTTTTTTTTTTGTATTTTTAGTAGAGATGTGTTTTTGCCATGTTGGCCAGGCTGGTCTTGAACTCTTGACCTAAGATGATCCACCTGCCTTGGCTTCCCAAAGTGCTGGGATTACAGGTGTGAGCCACTGCACCCAGCCCTATCTTCCTACTTTTGATCAGAGGAGGAAAGTAGTAGGTTGGTGCAAACGTAGTAATAAATTGGTTTGGCCCTGTTTTCATAGAACTATAGAGGTTGGACCTTTGTCCCCTTCCAGATGCCTACAAACAAACTGATGTTTTTGATTTTTTTTTCTTTTTAAATTTTGGTTGCCACTAATTCTTATAAAAATCCTCACACAAGGCTGGGCGCGGTGGCTCACACCTGTAATCCCAGCACTTTGGGAGGCCGAGGCAGGCGGATCAAGAGATCAGGAGCTCGAGACCATCCTGGCTAACATGGTGAAACCCCCGTCTCCACTAAAAATACAAAAAAAAATTAGCCGGGCGTGGTGGCGGGCACCTGTAGTCCCAGCTACTCGGGAGGCTGAGGCAGGAGAATGGCGTGAACCCGGGAGGGGAAGCTTGCAGTGAGCCGAGATTGCGCCACTGCACTCTAGCCTGGGAGACAGAGCGAGAGACTCCATCTCAAAAAAATAAAATAAAATAAAATAAAATAAAACAAAACAAAATAAAATAAAATAAAATAAAAATAAATAAATAAAAATCCTCACACGACCCAGGTTAGAGCTCCCACTTCTCATAGACTGCCCCTGTCGTGCATGAGCTCTCAAAAAGAACAGCAATCGTTTGGCAATAATCTATTCTATTTTTTTAGAAGAATAAGTCCAGCACATCTCTGGCCTATGAGGCCAGAGAGGTGACTCTGATTTTGGATCAAAACAAAACGCCTACAGGGACCGGGGGGAGCACAAATGAGCCAGGTGGTCCAGGTGTCTTAAGATAGCTGCTTTCAATACAGAGGCCCACTGCATTAAGCAGGTCATATTCTTCACTTCCACAGAGAAATATGCTTTCCACTGCTTTTCTTTAAACATATCACCCTCTGGTCTATCTTTCACATCTCCACTTTGAGAGAAACAAGTTTAAGAGATATCCACTGACCTTTTAACCTTACTAAAATAAATACACGTTAAAACTGAGATAAACAGTAGTAACTGGCAGCCTCGATGTCAGGAACACACTAGAGAGGAGGGGCACACCCCACACTGTGTCCCACAGGGGTGAGGGAGGCAGTGGCGTAGCTGCATCTCAGCCACTGTGGCTGCAGGAGAGGCGCAACCCAGTGGCTGGAGTCCCAATGTTTCAAAAGCAAAGAAAAATCTTTACGTGAAATCATCTGATTTTAAAATGCTGGTGACTAATTCGAAATTTTTAAAAACACTGCATGGGCCAACACCAGACTGGCCAAAGAAAACACATCTGTAGGCCAACTCTGACTACAGGCCACAGATTTGTAACCTCCAACCTTCATGACCCCTGATACCTTTCCAACACCAATACTCTATGAGCCTTCTTCCTATATAACCCTATGGAGTACGCCAATATGCTCTAGTGTAGGAATTAATCTAGCTTTGGGAAAAAGCACCTTCAATAATGACCTTCCTACTGTAGTGGGTTATCCCACCTCCCATCAAAAATGACACTTACTTTGCTTATCTTTGATTACAGTTTAAAGAGAGACCTGAAATAATCAGAATCTTGGCTGTTTTGACAACCTCTGTGAGCAGCTGTCCCTTTTGGGGAGTCACATTCTGCTTGACCTCCTGCTCCGTTTCCTATGACTAATAGATATTTTCCTGTTTCCTTCTGAGGTCACCTGCAAGCGGCTTCTCCTGCCTGCCTTTACATTTCCCAGTCCTGTCTGGATCCCACTGTGCGGTCTCTGACCTCCTCTGCACAACCTGAGCTGGTGTCCACTTCTTACTGACATCCCATCTGCTTCTGAGAACTCATGTGAGCCAGGGCAGGCATCTGCCCTAGAAGCTTCTTCTTTTGTCTGAAAGCTAGTTGTTTAAAGAGCATCACTGTACTCCTAGTTTCTTTCCGAATCCCTGCAAATCTGGATTTGTAAAATTTTCTTCTATTGGTTGCTGTGCCAAGAGCCAACTCTGTTTTCGTATTATTTTGAATTTTTTACACTATATATAAATCCAGAATTAGATATGGAAACACCACCACAAACAAAATCTGGAGGCAAATGATCACCTGGGGAAAATATTTACAATTCAGATCAGAGACAAAGGGCTAATCTT'

In [None]:
text = text[0:10000]

In [None]:
ref_token_id = tokenizer.pad_token_id # A token used for generating token reference
sep_token_id = tokenizer.sep_token_id # A token used as a separator between question and text and it is also added to the end of the text.
cls_token_id = tokenizer.cls_token_id # A token used for prepending to the concatenated question-text word sequence

lig = LayerIntegratedGradients(custom_forward, model.bert.embeddings)

input_ids, ref_input_ids, sep_id = construct_input_ref_pair(text, ref_token_id, sep_token_id, cls_token_id)
token_type_ids, ref_token_type_ids = construct_input_ref_token_type_pair(input_ids, sep_id)
position_ids, ref_position_ids = construct_input_ref_pos_id_pair(input_ids)
attention_mask = construct_attention_mask(input_ids)

indices = input_ids[0].detach().tolist()
all_tokens = tokenizer.convert_ids_to_tokens(indices)

In [None]:
predict(input_ids)

tensor([[-0.4575,  0.3728]], grad_fn=<AddmmBackward0>)

In [None]:
torch.cuda.empty_cache()

In [None]:
# Check output of custom_forward
custom_forward(input_ids)

tensor([0.6964], grad_fn=<UnsqueezeBackward0>)

In [None]:
attributions, delta = lig.attribute(inputs=input_ids,
                                    baselines=ref_input_ids,
                                    n_steps=700,
                                    internal_batch_size=1,
                                    return_convergence_delta=True)

In [None]:
score = predict(input_ids)

print('Sentence: ', text)
print('Sentiment: ' + str(torch.argmax(score[0]).cpu().numpy()) + \
      ', Probability positive: ' + str(torch.softmax(score, dim = 1)[0][1].cpu().detach().numpy()))

Sentence:  ACAGGACAGGAGTGAGGACAGGAGGTGGCCTGAGGGGGAGAAAGAGAAAGATTTTTGGCTTTATTGAGAATGGTTTGTGGAAGAATAAGAGGAAGCCAAGAAGAAGGAAAGCGAAACGCCCCCTCCCCCCATTGCAAGACAGGTTTCGGCTGTTTGAGACGGAGCATCACAGGCAGGAAGGAGGAGGCAGGGAGGGGGCCTGGGCTCCTTGCCCCCTGCTCGGCCCCCACCAAGAGGATTCCTGTTCTTAGCACTTTGGCCTTAGGGAGACTTGAGTTTCTTAGTCCGTGGGGAGGTTCCGTTCTCTGCCTTCACCACTCCATTTTCATGGTAACCTGGGAAGTGGAGAGAGACAAGCATACATGGTGTTTCTGCTGGAGCTAAGGCAGAAGAGGGGAGGGTGGGGCCAGGCCAAGGAAGGGGCCCGGGCAGCCCAGCTGCTATACATGGATGCACCAAAGGGGCGCCAGGCTGCAGCCTTGCACAGCAAATGCAAGCCAGCAGACGGCTCCCAGGAGGGTCCTGTCTTCCCCAGGGCCCTGGACTAGTGGCCCTGTTTGAGAGGCTTGGTCTCTGACTGCACTTTAGCAGGAGGGGCCTGGGATGACACACAGTAACTCAGCAACAACAGAGGCCAGCCTGCCCAAGCCTGAGGCTGGGGCTAGATACTCGCCGAAATCACTTAGATGCTGTCACTGCTCACTGTCCTCAGTTCTTCTCAGGCCCCTGCAAGGCATCAGCCCACTTCCAGTTCAGCAAGAACTCCCAGGAGCAGTGGCCACAGAAGGGAGGGGGACAAGAGGCTGTAGGAACAAGGCCTCAAGCAGGATGCCTGACACTCCTCTGGCAGAAAAATTGTGCTCTATTGTTCAAAATACCTCCGTGCGCTTGCTCAAATTCAGAGGTACTGGCTGCAGTCTTATGCCCCATACCTCCCCCGCCAGCCAGGCCTGACTCTGTGACACACCCAGCTGCGCGCGTGTCTGGTT

In [None]:
attributions_sum = summarize_attributions(attributions)

In [None]:
# storing couple samples in an array for visualization purposes
score_vis = viz.VisualizationDataRecord(attributions_sum,
                                        torch.softmax(score, dim = 1)[0][1],
                                        torch.argmax(torch.softmax(score, dim = 0)[0]),
                                        1,
                                        text,
                                        attributions_sum.sum(),
                                        all_tokens,
                                        delta)

In [None]:
print('\033[1m', 'Visualization For Score', '\033[0m')
viz.visualize_text([score_vis])

[1m Visualization For Score [0m


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
1.0,0 (0.70),ACAGGACAGGAGTGAGGACAGGAGGTGGCCTGAGGGGGAGAAAGAGAAAGATTTTTGGCTTTATTGAGAATGGTTTGTGGAAGAATAAGAGGAAGCCAAGAAGAAGGAAAGCGAAACGCCCCCTCCCCCCATTGCAAGACAGGTTTCGGCTGTTTGAGACGGAGCATCACAGGCAGGAAGGAGGAGGCAGGGAGGGGGCCTGGGCTCCTTGCCCCCTGCTCGGCCCCCACCAAGAGGATTCCTGTTCTTAGCACTTTGGCCTTAGGGAGACTTGAGTTTCTTAGTCCGTGGGGAGGTTCCGTTCTCTGCCTTCACCACTCCATTTTCATGGTAACCTGGGAAGTGGAGAGAGACAAGCATACATGGTGTTTCTGCTGGAGCTAAGGCAGAAGAGGGGAGGGTGGGGCCAGGCCAAGGAAGGGGCCCGGGCAGCCCAGCTGCTATACATGGATGCACCAAAGGGGCGCCAGGCTGCAGCCTTGCACAGCAAATGCAAGCCAGCAGACGGCTCCCAGGAGGGTCCTGTCTTCCCCAGGGCCCTGGACTAGTGGCCCTGTTTGAGAGGCTTGGTCTCTGACTGCACTTTAGCAGGAGGGGCCTGGGATGACACACAGTAACTCAGCAACAACAGAGGCCAGCCTGCCCAAGCCTGAGGCTGGGGCTAGATACTCGCCGAAATCACTTAGATGCTGTCACTGCTCACTGTCCTCAGTTCTTCTCAGGCCCCTGCAAGGCATCAGCCCACTTCCAGTTCAGCAAGAACTCCCAGGAGCAGTGGCCACAGAAGGGAGGGGGACAAGAGGCTGTAGGAACAAGGCCTCAAGCAGGATGCCTGACACTCCTCTGGCAGAAAAATTGTGCTCTATTGTTCAAAATACCTCCGTGCGCTTGCTCAAATTCAGAGGTACTGGCTGCAGTCTTATGCCCCATACCTCCCCCGCCAGCCAGGCCTGACTCTGTGACACACCCAGCTGCGCGCGTGTCTGGTTCAAACACACATAAGCCTTTGCCAAGCAGGTGGCCACCTAGAGAAAAGCAGGTGAGTCAGAAAGCAGCGCCCAGTGCAGACAGGCCCCCAGGCTGGGCAGAACGTGCAGGGCTGGCAGGGCCTGAGGACCTGCTGAAGGTGGGTGATGACTGGAGTGCGTGCACGGGCCAAAGGATAAGTGTCCCACCCCTACCCCCCACCTAGCACTATGTCACTGTGAGTCATTCTTGGAGACAGAGGAGGAGCCAGCAAGCTGGGAGGCAGGGGCAGGCTAAGATGTGGAGCAAAAGGGCAGGTGAGGACAGAGGCCGCCGTCCGGCACTGAGAATGGGCGGCGGCGGCAGTAGCAGCACTTGGCTGGGGTCCAGAAGCCACCCTGAGGACACGCTTCCTGCCAGAGTTCCCCACCCAGCCACTGCCCTGCCCCGTGGTGGCCAGGGCTCCCAGCCTAGTTAGGGCCAGCCCCACCCACAGCCTGTCCCTGGCCCACACCCAGCCACGTGCCAATCAGGGAGCTAGGAGCCCCAGCCCTGAGGTAAGAGTCAGGAAGGAGAAGCTGGCAGGATTGGTCTGGGCAGCGCCCAAGAAGCCAGGTGCCTTGGCTCCTCCCACCCATCCCAGACAGACTTCCCTGGCTCCACTCTCTGCCAAGGGCCCTGGCACTCACCAGATTCCCTCTTGATGAGCCTGGCTGGTAGTCTGGGTGTGGCTGGGACTCTCCGCTTTGCACTCTGCTCATTCCAGTATTCCCGCCAGTGCCGCAGCTGGGAGTGGATGAAGCGCCACATGAGCCAGGCCTGGGCGGCACACACCAGCAGCAGCACGCAGAGCCTGCAGAGCAGGGGGTTAGGGGCTTAGGCTGGGGCTTGGGCTCACAGCCTTGGGCTGGGTTGTGCAGGGGAGAACAAGGGCCAGGGGCCCTGCAGTTCCCATGGCTTATCACGTCCGCCTTCACCACTGGCCCTCTTCGATACCACCACTATCACCAGGAAGAATGTGTGCTTCAGTCAGTCTCTGCTCCAGCATACATCACATGTGCCAGGGAGACGGGAAGGAAGTGGCGACAGACGTACGGCCAGCTCTACAATCACGCTACTCCTATGACGAGGGAGGGGTCCATGGCTGTGTCTGTTTTGCGCCCATTGCACAGAACAAGACTAATGTAAGCTCCACAAATATTGGTAGCATTCAAATGAACTGAATTTCTGGAAGAGTGGCTTCTCATTTAACATGTCACTTAAAAGTGGAGCAACCCTGGACAAATCACTCTCCTGGGCCTAGGGGCTCCGGAAAATAGTGGCTTCCTCACTGCCACAGGAGGCCACTGGCCAAGCCATTAAGCACATGGTTTTAAAGCACCCACACACAAGAAGAGGAGAATGATATCAACTGAGAGACTGGGTGTGATGCCTCTGTGCACCACAAAGTGCCAGACAAATGTAAGGGATTCCTATTTGGACTACAGTCTGAGCAAACCAGGACTAGGGGATGAAGATGGTTTGGATGGAACCAGAGGCTGCTATCTCTTCTCCCCTCAGGCCTGATATCCAGAGATTTCCAAAAAATAACAATATGTGGGAGACTAAAGGGTCTGCTGCCTCCAGACCTTCTGCAAGGGCTGTGCCAAGTTCAGGAGGCTCCCTGGCTTATCACCTTGGACTTCTGCTCGACTCACCTGCAAAACAAAGTGTTGAAGTTCCCTTTCTCGGGATCAAATGCCTGGTTTTCCATGCGAGCCAGTCCAAAGCCAATGGCCAGCACGGCAAGGGTGAGGATGAAGAGGCGGGTAACCCCAAAAACAGCAGCCCAGGCACTGAACCTGCTCACAGAGGCAGAAGAGGGATGTCAGTCTTTAGCGCCCTTGAAGGAATCTTCACCCACTTCTCCAGAAGAGACCCCGAGTGGGAAGAGGATTCAAGGGTGGCTGGGGAAAGTGCTTGAGGGACGAGATATCTAAAATCAGATGTTCCAGAAAAAAATAACGGGAGGGCACCACCTGCAGGTAAGCGGGCAGTGTGCAACCAGGGAGGGACCCTCCAACCATCCGGGCCTCGGGGGAACCCCTGCCCAGGCCTCTAAGCGGGCCAGCCTGCAGCAGACCCACTTACAGTTTCTCGTTGTTTTCATCTGCAAAGTAGAAGAGTCTAGCCGTGTGGAAGAGGAACTCAGTTGAGTACTGCAGCAGCAGCAAGATCAGGCCCAGGCGGCTCAGGCTGGGGGTGGGGAAGACTAGACTTACATTCCCTCCAAGATGCTGCGTGGAGCAGAAGCCATTGCATCTTGGCTCAGGCTGTCCCCTGTGCCTGGCTGGGCTCTGCTTTCCACTCCCACTTTCCCTGGCTGGCTCTGCTCCATCCTTTGGATTCAGTTTAGCTCTCACACCTTTAAGACATTTTTCCTAATACCGACCCGCTGGCCGTTCAGCTGTCCTGTCTCAGTCAGATGCCCTTGCCTGCTCCCACAGCAAACCTCGCATAGGCCCTTCACAGTACTTAGCACCTTGCACTCATCACCTAGGCTGGAACCAAGTACATAAAAGGTACTCAGAACACATTTGCTGAGCTCTGAGTATAGGAATATGAAATGTTCCTGTTGTCTGACTTTCCATTATCCAAGTCTTCACAGCTCCGAGGTACATGCAGAAGCAGCAAGTGCTCCTTCTGTGTGGCCCTGCTTATACGTTCTTCCCCGGTCCTCGCCACTGCTACGGTGACAGTGCAGACTGGCTTCTTAGACCCGTTATGCATGTGACACATGACCATCCAACACAAGGGCAGAGCTGGCATCACCCCACAGCCTTCAGCCCTCAAAGACCCATCCGGGAACTGACGCTGCTACAGGCCACCAGAGACAGGAGACAGAGTTTGAGAGCTCCTTCCCTGCCTCAGTCTTACTAATCCAAGTCAGTCATTCACACAGGATGCCTGCTGCAAGGACCTAGTCCAACGCACCTCGGGATTTCCAGGCACCTCGGCAGAAAGTTACACACAGTGAGCTCTGTAAGTGCCAGCCTAGAGAAAGTGTGGGGTGCTTTTACTGCATGGATAACACTCAGCAAAAGCCCAAATTATCAATGACACAGCTTATTAACATCAAAAGGATTCTTTTCATAAAAGAGGCTCTTCGAGAACTAATATTATAGCAATTCTTTCTGCCTCTAGAACAACCAAGAGAGACCTACTCTCCATGTCATTATAAACCAAAGGGAAGGGAATTCCAGGGCTACGAGCTCTAGCAGTGTTTGCATTGGACACTGTGAGGTAAGAGCCCAGCTTTGGGAGGCCTTCAAGCTGCAAAGCCATGGTTCAAAGGCCGACATCCACTGGAAGTCTTCCTGGCTGTCTCTGTTGAGGGTCTTCTTCTGGGTTGCAGAGCAGATGATACATACTGTGTTATGGTGTTCATCACTCTCAACTGTCCTTACTTATGTCTATAACTGTCTCTTCAGAATGAGAATGAACCACTGAAGATAAAGAATCTTCCATTACCATCTTTGTATTGCCAAGTCTTAGCATAGTGCTAGGCACACAGAGGATGTCAACAAATGCCTGATAATTATATGAGTGTGTGGACAGATGCATGGACATAAAAGGGCAAGGAAATCTGGCTGGCTCCATGGTCTCACTCACTTTAAGAGGTATGCTCCAGCTATATGCACCAGGTACAGGCAAATATACTGGAGCTGGCGGGGAATTTCCTCCTGGAAACAAGAGAAGCAGATGGTAAATTTGCTAATTCCCTAACTGAAGATTCAGGGAAGGGGGAAAAGTGCAGGGGGATGAGAGAGGGCCAGGCTCCTCTGGGCTGCTTTAACACACAGTCCCATGTCCCACGAGTCCCACAGTCCCACTGCACCAGGCTGCTGAAATTCAAGGGCATTCAGGTCCATTCCCAAATTCCAGCAGCCTTGGGTCTAGTGTCAGAGGGTGAGGTTTGGATTGAGAAATAAGAGACAGGGACTGGAGAAGAGGGCTCTTGGAAATAATTCAGAAGGAAACTATAAAAAGTAAAAATAAAAAAAGACTATGGAAATGGCAAAGACCTCTCCTTTGACATCTATAAGATGAGAGTTAGGTTTCCTCCAAAGCCACAGGTCTGGTGGAAGAGGCAGGCAAGAGACTGACACTGGTGGTCAACTACATGACACTTCTCCAAGAGATGACTCAGCATGTTGCTCAATCCCCAACATATTCCTATCACCACCCAACACTCCATGCTTCTGGAGAAAAGGAAGGGAGGTACCCCTGGGAATAGCAGGAGGGGAGTGGTCAATGAATGGCCTCCAAGAAGGGAGAGAAGTGAGCACTCACCTTCCGTACCTTCTGGAAGTATAGCTCAGGAAGTGCGTGCAGCCAGTAGGCCAGCTGGCATAGGTAGAAAAACTTCACCTGGAAGCTGGAGACAAGGGGGCAAGTCACACGGGCAGGATAGAGAAAAGTGTCCCTGCAGGTGCTGGCCAAGCACAGGAGGGAAAAGCATGGGCTGAGACTCTGCCTGTGAGGAGCTGGTCCAGGAGCAAGGGAGTTAGGCCAGTGACCGCCGCACCCTGAGCCTGGGACCCTGGCTTCTCCATTGGCCTGTGCCCTTGTTCCACATACAAAACCACTTAAAGGACACGGAAAGTCCACAGAAAGAAACAAACATGATTAAAATAGTGCAGAGGAGGAGGAATCCTTCAGCCTTGAGGAGGGAGCTGATTACAGAGCACTGTTGGAGATAGGGACCAACAGATACACTGAGACAACAAACAGCTCTAAGTAGCAAGGGAAGGTTCTAACTCAGCCCTACATCCTTTGCTATTATTGCTCTTAAAGATCTCGGGAAAGGCAGCCAGGCGTGGTGGCTCACGCCTGTAACCCCAGCACTTTGGGAGGCTGAGGCAGGTGGATCACCTGAAGTCAGGAGTTTGAGACCAGCCTGGCCAACATGGTGAAATCCCATCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGCACATGTCTGTAATCCAAGCTACTTGGGAGGCTGAGGCAGGAGAATCGCTTAAACCCAGGAGGTGGAGGTTGCAGTGAGCTGAAATCATGCCATTGCACTCCACCCTGGGCAACAAGAGCAAATCTCCATCTCAGAAAAAAGACAAAAAACAAAGATCTCGGGAAAGGCAAAGGGTGGCCTCCTGAGGGAGATGGCCCCAGGTATTGCCCTTGGGGTACACTGCCCTCTTGGCAGCACTATATGAGGCAGAGGACACTGGCTCTGACAGACCACCAGCCATGGCAGGCCAGAAGGGAAGACACTCTGTGGATGTCAGGGGGTCGCCAAGAAGGTAGAAACCCAGAGGGCATTATGGAGAGAGATGTTCTGCTTCTGAATCTGTCTCATGCAGTTGAGGGACCTCTGTGATGGGAGCCAGCACAGATGGAATTTCATCTGGGGATTCTCTGGTCAAGCATGCTGAGAAGAAGTGGCTTCCAGACAAGTCTACCATCCACAATAGGCTCAGGGCATGATCTGCTCGTCAGGCCAGCTGGGCCTGTGGTGTTCTGGCCACACTCCGCTGGGACAGGAAGGCAGTGGGCCCGGTCGCTCCTCCCTGGGGCTGAGTCAACAGAATACTCACGGGAGGTGCACATGCGGGTAGTCTTCCCAGAGGCTTCTTGGGTTTGTTAAGTATCCTTCCTGCAGTGGGCAAGAAGAGAGACCATTTAGAGATGTGGACGTGAGACCTGCTGGGGCCCTGGGACCGGTCCAGGGGTCAGGGATGCATCCAGTCCCCACCTGACAGAAAGAGGAAGGAACAGGAAATGTGAAAACAGAGAACTTCTCTGTGTGGGACCCCTGGCGCTTGGCTGGTTTCTTTACTGTGGAAGAGTCATGCTGGAGTAGGAAGGGCCACGCTCTGAGGTCCAACGACCCATATCTGAAGATGAGTCTGACAAGCGAATTAGTCTTGCTCCTCTGAGCAAGCTAATTAGTTTCCCTAAGCCACAGCTGGCTCATCTGCAAAACAAAATAAAAATACCCACCCTCACAGAGTTATTGTTGGAAATGAATGGGATAGTTTATGTGCCAGTGTCTAGTCCTGTGCCTGGCATGCAGGCGCTCAGGAAATGCCTCCATAATGAATAAGCAAATGAACTCTAGAATCACCACTCGCTGGAAAAATGAAAAGCCTACTTTGGCTTTTCACAGCCTGCTGAATAAAAAACATGGCAGGACCCCATAGGCCTCACCATGCAGCTGGACTCTGACACCTACCACACTGTGTCATTACTGTCAGTTGTTTCCATTACTCTTGCAAGTCCCTTCACACTAGGGCCTTTTCTTGCCTATCTTTAGAATTCTAACATGTAGTCCAGCACCTTATATGGGGTGGGGATGGCAACATGAAAATCCTTCCATCACAAAACATCTAGAAATGCTGGGTGAAATCTAATGAATATTCTTTTAAATGCAAAGAGCTGAGCTCACAGTAAGAAAGGGAAACCCCCTGGGACCCAAAGGGAGAGGGAGGCTAAAAGGCAGAGCAGTAAAGTGACACTGTAGCAGCCCAAAAGGCACTAGTTATGGGCCAGGGTTTTTGTGCCCATGTGAGAACAGAAGATGGTGCCTTGGGAGGTGGAACCCAAGACCTTGTATAAGACCAGGACCTCTGAAAGGCCACAATCTCAGAGAAAGGAAAAGACTAGAAAGTGTTTGCTGACCAACACAGGGAAATGAAGATGTCTGCTCAGCCCATACCCAAGGTGAAAACAAAATCATTTATTCTAAAAATCTGCAACCTCAGGTTCACTCTGAGTTTGGAGGTGAAATATACTACCTGTGTGATCCAAAAGCCGCCAAGGTAAGAAATTAGAATTAATAGTGTGGTGGGCCAGTGATACCCTGGGGACATACCCTCATCCAAGGATGCTCCACAGATAAAACCTTGCTAAAGATGAATTTATAATCCAAGAGTACAAAGCATGGGAAGAAATAATCTACCACAAGCAAGAGTCAGCTGAAACTACAGGAGTGCAATACACACCAGTTGGTTGAATGAATGAATGATGAATGCTTTGGGCAATTTCTCTCTTCTGAAGAAAGGGCTCTTATTTGTCACTCAGAGAAGGCAGAGCAGATTAGATTAGGATGACTTCATTTTAGAAATGGGAAAATGAAAAAACAGATAGGAAGGATCTCCTGAAATAAGATAGTTTTGTTTTGTTTTTTTGATATGGAGTTTTGCTCTTGTTGCCCAGGCTGGAGTGCAATGGCACGATCTCAGCTCACTGCAACCTCTGCCTTGCAGGTTCAAGCGATTCTCCCGCCTCAGTCCTCCTGAGTAGCTGGGATTACAAGCACGCAACACCACACCCGGCTATTTTTTGTACTTTTAGCAGAGACGGGGTTTCACTATGTTGACCAGGCTGGTCTCAAACTCCTGACCTCACTTGCCTCGACCTCCCAAAGTGCTGTGATTACAGGCGTGCACCATTGCGCCCAGCCAAGATAGTTTTTCAGTAGCACAGCTGAAATCCGAGTTGGGCCACAAGCCTTCTGGTCCAATAACTTCAGGCTAGGTTGCTTCAGTAAATCAGAAAATCAGCTGAGCTGGTGGCTTTGATGAGAAGGCTGAGAACCTCAGATGTTCACACTGGGATTAAAGGCAGAGGTTTTACAGTGCTCAGAATGAGGCCAACAGGGTTTAGTAAGAAGCATTCTAGGTTATTGTCTATTAGGATCTTTAGTTGTATTTCCAAGTGAGGGCTGATCCACCCACCTTTGAGTCACTAAACGCCCTGTGACCTATCAGCATGCCTTTCGGGTATAGTCCACGGCCCTAATCCCACAAACTTGGGCCTCCATGAGCACAATAACCTGACTGATAAGTCCTTTTATCGGATACATCTATACCACTGTAGTCACAGTCACCTGGATTAGAAGGAAATGATCTCACTTCGAACTTACATGGCCTCATTTCTAATCTCTTCTCACTACCACTCTCTCCTCCCTGGGTCACGTGCCGATTGAGGAATAAAAGTGGATGAGGCTCTCGGGTGGTGGCGTGTGTGGTGGCGGTGACAGTTGTGAGCTCTCTCAAATACACTGCTTCTATCACCTCTACCCACCCACTCTGTCGGGCATACGCCTGCCTTCATCAGCTCTCCTGCCCCAGGCTACCTCATTCCAGGGACATCAGAAAGGTGAGAATGTCTCTTCCTAGAGGAAGCAGGAATGTACTTAGCAGGAAAAATGGTACTTCTGAAACTGAGGTGGGAGAGAAAGTTTTGCCCAAACAAGACTCGCCAAGAAAAGCAGCACTGAGAGCAATGTAAAGCCCAGAAAATCTCGTGATTTTAAACAGGAACGCTCCTTGGCTTGGCCTCTTACTTAGAGACAAAGAGGTCAGAACTTTGAAGCCAAAAAGCAAAGAAACTCCCCAGAAAAATGTTGCCTGCTTGTGAATGTCCAGTCCACGGGGACTGGAGGAGGAAAAGGGTGGAGGGAGGAGAGCAGGGGGAGCCAGAGGAAAAATGACTCACTGCTCTGAGAACAGCCTTTTCCAGACCTCTGTCCAGGCAGCTGTCTGAAGGAGGACTGAGGCTGGGGCACCCTCTGAGCTCAGGCACGCAAAGCACCTGAGTCCACAGGGGGCTGAGTGTGACCCAGCAAGCACCTGAAACCCACCCCAAATCCCATCCACTGACAGGCCCCAGCAGATGGTTTGGAGAGGCTTTTGAAATCCTTTGTTCTCTCGATTCTACAAATCCACCCATGAGCTAAGCAAGGCCTCAACAAGGTGGAGAGATCCCTCCTGTTTCCCCAGCAGCCTTCCTTTTGGTGTGTGAACAAACACAACCACGAAGAACAGCATAATTCAGATATAGCACAGGCAAGTGCTACATAAATTCAGACATACCTTATATTATTTGACCATCAGAACAACCATGCACTAAAAATCTGCCCTAAAGCAACTAGTCTGTTAGTAGAAACCGGTCCTGGTACAAGCACCAGCATTAAGGACATTCCCTCTACTTGGTTCTAA,2.48,[CLS] ACAGG ACAGG AGTGAGG ACAGG AGGTGGCC TGAGGGGG AGAAAGAGAA AGATT TTTGGC TTTATTG AGAATGG TTTGTGG AAGAATAAG AGGAAGCC AAGAAGAAGG AAAGCG AAAC GCCCCC TCCCCCC ATTGC AAGACAGG TTTCGGC TGTTTG AGACGG AGCATCAC AGGC AGGAAGG AGGAGGC AGGGAGGG GGCC TGGGCTCC TTGCCCCC TGCTC GGCCCCC ACCAAG AGGATTCC TGTTC TTAGCAC TTTGGCC TTAGGG AGACTTG AGTTTC TTAG TCCG TGGGG AGG TTCCG TTCTC TGCCTTC ACCACTCC ATTTTC ATGG TAACC TGGG AAGTGG AGAGAGAC AAGC ATACATGG TGTTTC TGCTGG AGCTAAGGC AGAAG AGGGGAGGG TGGGGCC AGGCCAAGG AAGGGGCCC GGGC AGCCC AGCTGC TATACATGG ATGCACC AAAGGGGC GCC AGGCTGC AGCCTTGC ACAGC AAATGC AAGCC AGCAGAC GGCTCCC AGGAGGG TCCTGTC TTCCCC AGGGCCC TGGACTAG TGGCCC TGTTTG AGAGGC TTGGTCTC TGACTGC ACTTTAGC AGGAGGG GCCTGGG ATGACAC ACAGTAAC TCAGC AACAAC AGAGGCC AGCCTGCCC AAGCC TGAGGC TGGGGC TAGATAC TCGCCG AAATC ACTTAG ATGC TGTCACTGC TCACTGTCC TCAGTTC TTCTC AGGCCCC TGCAAGGC ATCAGCCC ACTTCC AGTTC AGCAAGAAC TCCC AGGAGC AGTGGCC ACAGAAGGG AGGGGG ACAAG AGGC TGTAGG AAC AAGGCC TCAAGC AGGATGCC TGACAC TCCTCTGGC AGAAAA ATTG TGCTC TATTG TTCAAAA TACC TCCG TGCGC TTGC TCAAATTC AGAGGTAC TGGCTGC AGTC TTATG CCCC ATACC TCCCCC GCCAGCC AGGCC TGAC TCTGTG ACACACCC AGCTGC GCGCG TGTC TGGTTC AAACAC ACATAAGCC TTTGCC AAGCAGG TGGCC ACCTAG AGAAAAGC AGG TGAGTC AGAAAGC AGCGCCC AGTGC AGACAGGCC CCCAGGC TGGGC AGAACGTGC AGGGCTGGC AGGGCC TGAGG ACCTGC TGAAGG TGGGTGATG ACTGG AGTGCG TGCAC GGGCC AAAGG ATAAG TGTCCC ACCCC TACCCCCC ACCTAGC ACTATG TCACTGTG AGTCATTC TTGGAGAC AGAGG AGGAGCC AGCAAGC TGGGAGGC AGGGGC AGGCTAAG ATGTGG AGCAAAA GGGC AGGTGAGG ACAGAGGCC GCCG TCCGGC ACTGAGAA TGGGC GGCGGC GGC AGTAGC AGCAC TTGGC TGGGGTCC AGAAGCC ACCCTGAGG ACACGC TTCCTGCC AGAG TTCCCC ACCCAGCC ACTGCCC TGCCCC GTGG TGGCCAGGGC TCCCAGCC TAG TTAGGGCC AGCCCC ACCC ACAGCC TGTCCC TGGCCC ACACCC AGCC ACGTGCC AATC AGGGAGC TAGG AGCCCC AGCCC TGAGG TAAGAGTC AGGAAGG AGAAGC TGGCAGG ATTGG TCTGGGC AGCG CCCAAG AAGCC AGGTGCC TTGGC TCCTCCC ACCCATCCC AGACAGAC TTCCCTGGC TCCAC TCTCTGCC AAGGGCCC TGGC ACTCACC AGATTCCC TCTTG ATGAGCC TGGC TGGTAG TCTGGG TGTGGC TGGGACTC TCCGC TTTGC ACTC TGCTC ATTCC AGTATT CCCGCC AGTGCC GC AGCTGGG AGTGG ATGAAGC GCC ACATG AGCCAGGCC TGGGCGGC ACACACC AGCAGC AGCACGC AGAGCC TGCAGAGC AGGGGG TTAGGGGC TTAGGC TGGGGC TTGGGC TCACAGCC TTGGGC TGGG TTGTGC AGGGG AGAAC AAGGGCC AGGGG CCCTGC AGTTCCC ATGGC TTATC ACG TCCGCC TTCACCAC TGGCCC TCTTCG ATACC ACCAC TATCACC AGGAAG AATGTG TGCTTC AGTC AGTCTC TGCTCC AGCATAC ATCAC ATGTGCC AGGGAGAC GGG AAGGAAG TGGCG ACAGAC GTAC GGCC AGCTCTAC AATCAC GC TACTCC TATGACG AGGGAGGGG TCCATGGC TGTG TCTGTTTT GCGCCC ATTGC ACAG AACAAG ACTAA TGTAA GCTCC ACAA ATATTGG TAGCATTC AAATGAAC TGAATTTC TGGAAG AGTGGC TTCTC ATTTAAC ATGTCAC TTAAAAG TGGAGC AACCCTGG ACAAATC ACTCTCC TGGGCC TAGGGGC TCCGG AAAATAG TGGCTTCC TCACTGCC ACAGG AGGCC ACTGGCC AAGCC ATTAAGC ACATGG TTTTAAAGC ACCCACAC ACAAGAAG AGGAGAA TGATATC AAC TGAGAG ACTGGG TGTGATGCC TCTGTGC ACCAC AAAGTGCC AGACAAATG TAAGGG ATTCC TATTTGG ACTAC AGTCTG AGCAAACC AGGACTAG GGG ATGAAG ATGGTTTGG ATGGAACC AGAGGC TGCTATC TCTTC TCCCC TCAGGCC TGATATCC AGAG ATTTCC AAAA AATAAC AATATG TGGGAGAC TAAAGGG TCTGC TGCCTCC AGACC TTCTGC AAGGGC TGTGCC AAGTTC AGGAGGC TCCCTGGC TTATC ACCTTGG ACTTC TGCTCG ACTC ACCTGC AAAACAAAG TGTTG AAGTTCCC TTTC TCGGG ATC AAATGCC TGGTTTTCC ATGCG AGCC AGTCC AAAGCC AATGGCC AGCACGGC AAGGGTG AGGATGAAG AGGCGGG TAACCCC AAAAACAGC AGCCCAGGC ACTGAACC TGCTCAC AGAGGC AGAAGAGGG ATGTC AGTC TTTAGC GCCC TTGAAGG AATC TTCACCC ACTTC TCCAGAAG AGACCCCG AGTGGG AAGAGG ATTC AAGGG TGGCTGGGG AAAGTGC TTGAGGG ACG AGATATC TAAAATC AGATGTTCC AGAAAA AAATAAC GGG AGGGC ACCACC TGCAGG TAAGC GGGC AGTGTGC AACC AGGGAGGG ACCCTCC AACCATCC GGGCC TCGGGGG AACCCC TGCCC AGGCC TCTAAGC GGGCC AGCCTGC AGCAGACCC ACTTAC AGTTTC TCG TTGTTTTC ATCTGC AAAG TAGAAG AGTC TAGCC GTG TGGAAG AGGAAC TCAGTTG AGTACTGC AGCAGC AGCAAG ATC AGGCCC AGGCGGC TCAGGC TGGGGGTGGGG AAGAC TAGAC TTAC ATTCCC TCCAAG ATGC TGCG TGGAGC AGAAGCC ATTGC ATCTTGGC TCAGGC TGTCCCC TGTGCC TGGCTGGGC TCTGC TTTCC ACTCCC ACTTTCCC TGGCTGGC TCTGC TCCATCC TTTGGATTC AGTTTAGC TCTC ACACC TTTAAG ACATT TTTCCTAA TACCG ACCCGC TGGCCG TTCAGC TGTCC TGTCTC AGTC AGATGCCC TTGCC TGCTCCC ACAGC AAACCTC GC ATAGGCCC TTCACAG TACTTAGC ACCTTGC ACTC ATCACC TAGGC TGGAACC AAGTAC ATAAAAGG TAC TCAGAAC ACATTTGC TGAGC TCTG AGTAT AGGAA TATGAAATG TTCCTGTTG TCTG ACTTTCC ATTATCC AAGTCTTC ACAGC TCCG AGGTAC ATGC AGAAGC AGCAAG TGCTCC TTCTGTG TGGCCC TGC TTATAC GTTC TTCCCC GG TCCTC GCCACTGC TACGG TGACAGTGC AGAC TGGCTTC TTAG ACCCG TTATGC ATGTGACAC ATGACC ATCC AACAC AAGGGC AGAGC TGGCATC ACCCC ACAGCC TTCAGCCC TCAAAG ACCCATCC GGGAAC TGACGC TGCTAC AGGCC ACCAGAG ACAGG AGACAGAG TTTGAGAGC TCCTTCCC TGCC TCAGTC TTAC TAATCC AAGTC AGTCATTC ACACAGG ATGCC TGCTGC AAGG ACCTAG TCCAAC GC ACCTCGGG ATTTCC AGGC ACCTCGGC AGAA AGTTACAC ACAGTG AGCTCTG TAAG TGCCAGCC TAGAGAA AGTGTGGGG TGCTTTT ACTGCATGG ATAAC ACTCAGC AAAAGCCC AAATT ATCAATG ACACAGC TTATT AACATC AAAAGG ATTCTTTTC ATAAAAG AGGC TCTTCG AGAAC TAATATT ATAGC AATTC TTTCTGCC TCTAG AACAACC AAGAGAG ACCTAC TCTCC ATGTCATT ATAAACC AAAGGG AAGGG AATTCC AGGGC TACG AGCTC TAGCAGTG TTTGC ATTGG ACACTGTG AGGTAAG AGCCC AGCTTTGGG AGGCC TTCAAGC TGCAAAGCC ATGGTTC AAAGGCCG ACATCC ACTGG AAGTC TTCCTGGC TGTCTC TGTTG AGGG TCTTC TTCTGGG TTGCAGAGC AGATG ATACATAC TGTG TTATGG TGTTC ATCAC TCTCAAC TGTCC TTACTTATG TCTATAAC TGTCTC TTCAGAA TGAGAA TGAACC ACTG AAGATAA AGAA TCTTCC ATT ACCATC TTTGTATT GCC AAGTC TTAGC ATAGTGC TAGGC ACACAGAGG ATGTCAAC AAATGCC TGATAA TTATATG AGTGTG TGG ACAGATGC ATGG ACATAAAA GGGC AAGGAAATC TGGC TGGCTCC ATGGTCTC ACTCAC TTTAAG AGGTATGC TCCAGC TATATGC ACC AGGTAC AGGC AAATAT ACTGG AGCTGGC GGGG AATTTCC TCCTGG AAACAAG AGAAGC AGATGG TAAATTTGC TAATTCCC TAACTGAAG ATTCAGGG AAGGGGG AAAAGTGC AGGGGG ATGAGAG AGGGCC AGGC TCCTC TGGGCTGC TTTAAC ACAC AGTCCC ATGTCCC ACG AGTCCC ACAGTCCC ACTGCACC AGGCTGC TGAAATTC AAGGGC ATTC AGGTCC ATTCCC AAATTCC AGCAGCC TTGGG TCTAG TGTC AGAGGG TGAGG TTTGG ATTGAGAA ATAAG AGACAGGG ACTGG AGAAG AGGGC TCTTGG AAATAA TTCAGAAGG AAAC TATAAAA AGTAAAA ATAAAA AAAG ACTATGG AAATGGC AAAG ACCTC TCCTTTG ACATC TATAAGATG AGAG TTAGG TTTCCTCC AAAGCC ACAGG TCTGG TGGAAG AGGCAGGC AAGAGAC TGACAC TGGTGG TCAAC TACATG ACAC TTCTCC AAGAGATG ACTC AGCATG TTGC TCAA TCCCCAAC ATATTCC TATC ACCACCC AACACTCC ATGC TTCTGG AGAAAAGG AAGGG AGG TACCCC TGGG AATAGC AGGAGGGG AGTGG TCAATGAA TGGCC TCCAAG AAGGG AGAGAAG TGAGC ACTCACC TTCCG TACCTTC TGGAAG TATAGC TCAGGAAG TGCG TGCAGCC AGTAGGCC AGCTGGC ATAGG TAGAAAA ACTTC ACCTGG AAGC TGGAGAC AAGGGGGC AAGTCACAC GGGC AGGATAGAG AAAAG TGTCCC TGC AGGTGC TGGCC AAGCACAGG AGGG AAAAGC ATGGGC TGAGAC TCTGCC TGTG AGGAGC TGGTCC AGGAGC AAGGG AGTT AGGCC AGTGACC GCCGC ACCC TGAGCC TGGGACCC TGGC TTCTCC ATTGGCC TGTGCCC TTGTTCC ACATAC AAAACC ACTTAA AGGACAC GGAAAG TCCAC AGAAAGAA ACAAAC ATG ATTAAAA TAGTGC AGAGG AGGAGG AATCC TTCAGCC TTGAGG AGGGAGC TGATT ACAGAGC ACTGTTGG AGATAGGG ACCAAC AGATACAC TGAGAC AACAAAC AGCTC TAAGTAGC AAGGGAAGG TTCTAAC TCAGCCC TACATCC TTTGCTATT ATTGC TCTTAAAG ATCTC GGG AAAGGC AGCCAGGCGTGG TGGCTCACGCC TGTAACCCC AGCACTTTGGG AGGCTGAGGCAGGTGG ATCACCTGAAG TCAGGAGTTTGAGACCAGCC TGGCCAACATGG TGAAATCCC ATCTC TACTAAAAATACAAAAATTAGCTGGGCGTGGTGGC ACATG TCTG TAATCC AAGCTAC TTGGGAGGCTGAGGCAGGAGAA TCGC TTAAACCC AGGAGGTGGAGG TTGCAGTG AGC TGAAATC ATGCC ATTGCACTCC ACCC TGGGCAACAAG AGCAAATC TCCATC TCAG AAAAAAG ACAAAA AACAAAG ATCTC GGG AAAGGC AAAGGG TGGCCTCC TGAGGG AGATGG CCCC AGG TATTGCCC TTGGGG TAC ACTGCCC TCTTGGC AGCAC TATATG AGGCAGAGG ACAC TGGCTCTG ACAG ACCACC AGCCATGGC AGGCC AGAAGGG AAGACAC TCTGTGG ATGTC AGGGGG TCGCC AAGAAGG TAG AAACCC AGAGGGC ATTATGG AGAGAGATG TTCTGC TTCTGAA TCTGTCTC ATGCAGTTG AGGG ACCTCTGTG ATGGG AGCC AGCACAG ATGG AATTTC ATCTGGGG ATTCTCTGG TCAAGC ATGCTGAG AAGAAG TGGCTTCC AGAC AAGTC TACCATCC ACAATAGGC TCAGGGC ATG ATCTGC TCG TCAGGCC AGCTGGGCC TGTGG TGTTC TGGCCACAC TCCGC TGGGACAGG AAGGC AGTGGG CCCGG TCGC TCCTCCC TGGGGC TGAGTC AACAGAA TACTCAC GGGAGG TGCACATGC GGGTAG TCTTCCC AGAGGC TTCTTGGG TTTGTTAAG TATCC TTCCTGC AGTGGGC AAGAAG AGAGACC ATTTAG AGATG TGGACG TGAG ACCTGC TGGGGCCC TGGG ACCGG TCCAGGGG TCAGGG ATGCATCC AGTCCCC ACCTGAC AGAA AGAGGAAGG AACAGG AAATG TGAAAAC AGAGAAC TTCTC TGTGTGGG ACCCC TGGCGC TTGGC TGGTTTC TTTAC TGTGG AAGAGTC ATGCTGG AGTAGG AAGGGCC ACGC TCTG AGGTCC AACG ACCC ATATC TGAAGATG AGTCTG ACAAGCG AATT AGTCTTGC TCCTCTG AGCAAGC TAATTAG TTTCCC TAAGCC ACAGCTGGC TCATCTGC AAAACAAAA TAAAA ATACCC ACCC TCACAGAG TTATTG TTGGAAATG AATGGG ATAG TTTATG TGCCAGTG TCTAGTCC TGTGCC TGGCATGC AGGCGC TCAGG AAATGCC TCCATAA TGAATAAGC AAATGAAC TCTAG AATCACC ACTCGC TGGAAAA ATGAAAA GCCTAC TTTGGC TTTTC ACAGCC TGC TGAATAA AAAAC ATGGC AGGACCCC ATAGGCC TCACC ATGCAGC TGGAC TCTGACACC TACC ACACTGTG TCATTAC TGTCAGTTG TTTCC ATTACTC TTGC AAGTCCC TTCACAC TAGGGCC TTTTC TTGCC TATCTTTAG AATTCTAAC ATGTAG TCC AGCACC TTATATG GGGTGGGG ATGGCAAC ATGAAAA TCCTTCC ATCAC AAAAC ATCTAG AAATGC TGGGTGAA ATCTAA TGAA TATTCTTTT AAATGC AAAGAGC TGAGC TCAC AGTAAG AAAGGG AAACCCCC TGGGACCC AAAGGG AGAGGG AGGCTAA AAGGC AGAGC AGTAA AGTGACAC TGTAGC AGCCC AAAAGGC ACTAG TTATGGGCC AGGGTTTT TGTGCCC ATG TGAGAAC AGAAG ATGGTGCC TTGGG AGGTGG AACCCAAG ACCTTG TATAAG ACCAGG ACCTC TGAAAGGCC ACAATCTC AGAGAA AGGAAAAG ACTAG AAAG TGTTTGC TGACC AACAC AGGGAAATG AAGATG TCTGC TCAGCCC ATACCC AAGG TGAAAAC AAAATCATT TATTC TAAAA ATCTGC AACCTCAGG TTCACTCTG AGTTTGG AGGTGAA ATAT ACTACC TGTG TGATCC AAAAGCC GCC AAGGTAAG AAATTAGAA TTAATAG TGTGG TGGGCC AGTG ATACCC TGGGG ACATACCC TCATCC AAGG ATGCTCC ACAG ATAAAACC TTGCTAA AGATG AATTTAT AATCC AAGAGTAC AAAGC ATGGGAAG AAATAA TCTACC ACAAGC AAG AGTCAGC TGAAAC TAC AGGAGTGC AATAC ACACC AGTTGG TTG AATGAATGAA TGATG AATGC TTTGGGC AATTTC TCTC TTCTG AAGAA AGGGC TCTTATT TGTCAC TCAG AGAAGGC AGAGC AGATT AGATT AGGATG ACTTC ATTTTAGAA ATGGG AAAATGAAAA AAC AGATAGG AAGG ATCTCC TGAAATAAG ATAGTTTTG TTTTGTTTTTTTG ATATGG AGTTTTGCTCTTG TTGCCCAGGCTGGAGTGCAATGGC ACG ATCTCAGCTCACTGCAACCTCTGCC TTGC AGGTTCAAGCG ATTC TCCCGCC TCAG TCCTCC TGAGTAGC TGGGATTAC AAGC ACGC AAC ACCACACCCGGC TATTTTTTG TACTTTT AGCAGAG ACGGGG TTTC ACTATG TTGACC AGGCTGGTCTCAAACTCC TGACC TCACTTGCC TCGACC TCCCAAAGTGC TGTG ATTACAGGC GTGC ACCATTGC GCCC AGCCAAG ATAGTTTT TCAGTAGC ACAGC TGAA ATCCG AGTTGGGCC ACAAGCC TTCTGG TCC AATAAC TTCAGGC TAGG TTGCTTC AGTAA ATCAGAAAA TCAGC TGAGC TGGTGGC TTTGATG AGAAGGC TGAGAACC TCAG ATGTTC ACAC TGGGATTAAAGGC AGAGG TTTTACAG TGCTCAGAA TGAGGCC AACAGGG TTTAGTAAG AAGCATTC TAGG TTATTG TCTATT AGGATC TTTAG TTGTATT TCCAAG TGAGGGC TGATCC ACCCACC TTTG AGTCAC TAA ACGCCC TGTGACC TATCAGC ATGCC TTTCGGG TATAGTCC ACGGCCC TAATCCC ACAAAC TTGGGCC TCCATG AGCACAA TAACC TGAC TGATAAG TCCTTTT ATCGG ATACATC TATACC ACTGTAG TCACAGTC ACCTGG ATTAGAAGG AAATG ATCTCAC TTCG AACTTAC ATGGCC TCATTTC TAATCTC TTCTCAC TACC ACTCTC TCCTCCC TGGG TCACG TGCCG ATTG AGGAATAA AAGTGG ATGAGGC TCTC GGGTGG TGGCG TGTG TGGTGGC GGTGAC AGTTG TGAGCTCTC TCAA ATACAC TGCTTC TATC ACCTC TACCCACCC ACTCTG TCGGGC ATAC GCCTGCC TTCATC AGCTCTCC TGCCCC AGGCTACC TCATTCC AGGG ACATC AGAAAGG TGAGAA TGTCTC TTCCTAG AGGAAGC AGGAATG TACTTAGC AGGAAAA ATGGTAC TTCTGAAAC TGAGGTGGG AGAGAA AGTTTTG CCC AAACAAG ACTC GCCAAG AAAAGC AGCAC TGAGAGC AATGTAA AGCCC AGAAAA TCTC GTG ATTTTAAAC AGGAAC GCTCC TTGGC TTGGCC TCTTAC TTAGAG ACAAAG AGG TCAGAAC TTTGAAGCC AAAAAGC AAAGAA ACTCCCC AGAAAA ATGTTGCC TGCTTG TGAATGTCC AGTCC ACGGGG ACTGG AGGAGG AAAAGGG TGGAGGG AGGAGAGC AGGGGG AGCC AGAGGAAAA ATGAC TCACTGC TCTGAGAAC AGCC TTTTCC AGACC TCTG TCCAGGC AGCTGTCTG AAGGAGG ACTGAGGC TGGGGC ACCCTCTG AGCTCAGGC ACGC AAAGC ACCTGAG TCCAC AGGGGGC TGAGTGTG ACCCAGC AAGCACC TGAAACCC ACCCC AAATCCC ATCC ACTGAC AGGCCCC AGCAGATGG TTTGG AGAGGC TTTTG AAATCC TTTGTTC TCTCG ATTCTAC AAATCC ACCC ATGAGC TAAGC AAGGCC TCAAC AAGG TGGAGAG ATCCCTCC TGTTTCCCC AGCAGCC TTCC TTTTGG TGTGTGAAC AAACAC AACCACG AAGAAC AGCATAA TTC AGATAT AGCACAGGC AAGTGC TACATAA ATTCAGAC ATACC TTATATT ATTTG ACCATC AGAAC AACCATGC ACTAAAA ATCTGCCC TAA AGCAAC TAGTCTG TTAGTAG AAACCGG TCCTGG TACAAGC ACC AGCATT AAGG ACATTCCC TCTAC TTGG TTCTAA [SEP]
,,,,


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
1.0,0 (0.70),ACAGGACAGGAGTGAGGACAGGAGGTGGCCTGAGGGGGAGAAAGAGAAAGATTTTTGGCTTTATTGAGAATGGTTTGTGGAAGAATAAGAGGAAGCCAAGAAGAAGGAAAGCGAAACGCCCCCTCCCCCCATTGCAAGACAGGTTTCGGCTGTTTGAGACGGAGCATCACAGGCAGGAAGGAGGAGGCAGGGAGGGGGCCTGGGCTCCTTGCCCCCTGCTCGGCCCCCACCAAGAGGATTCCTGTTCTTAGCACTTTGGCCTTAGGGAGACTTGAGTTTCTTAGTCCGTGGGGAGGTTCCGTTCTCTGCCTTCACCACTCCATTTTCATGGTAACCTGGGAAGTGGAGAGAGACAAGCATACATGGTGTTTCTGCTGGAGCTAAGGCAGAAGAGGGGAGGGTGGGGCCAGGCCAAGGAAGGGGCCCGGGCAGCCCAGCTGCTATACATGGATGCACCAAAGGGGCGCCAGGCTGCAGCCTTGCACAGCAAATGCAAGCCAGCAGACGGCTCCCAGGAGGGTCCTGTCTTCCCCAGGGCCCTGGACTAGTGGCCCTGTTTGAGAGGCTTGGTCTCTGACTGCACTTTAGCAGGAGGGGCCTGGGATGACACACAGTAACTCAGCAACAACAGAGGCCAGCCTGCCCAAGCCTGAGGCTGGGGCTAGATACTCGCCGAAATCACTTAGATGCTGTCACTGCTCACTGTCCTCAGTTCTTCTCAGGCCCCTGCAAGGCATCAGCCCACTTCCAGTTCAGCAAGAACTCCCAGGAGCAGTGGCCACAGAAGGGAGGGGGACAAGAGGCTGTAGGAACAAGGCCTCAAGCAGGATGCCTGACACTCCTCTGGCAGAAAAATTGTGCTCTATTGTTCAAAATACCTCCGTGCGCTTGCTCAAATTCAGAGGTACTGGCTGCAGTCTTATGCCCCATACCTCCCCCGCCAGCCAGGCCTGACTCTGTGACACACCCAGCTGCGCGCGTGTCTGGTTCAAACACACATAAGCCTTTGCCAAGCAGGTGGCCACCTAGAGAAAAGCAGGTGAGTCAGAAAGCAGCGCCCAGTGCAGACAGGCCCCCAGGCTGGGCAGAACGTGCAGGGCTGGCAGGGCCTGAGGACCTGCTGAAGGTGGGTGATGACTGGAGTGCGTGCACGGGCCAAAGGATAAGTGTCCCACCCCTACCCCCCACCTAGCACTATGTCACTGTGAGTCATTCTTGGAGACAGAGGAGGAGCCAGCAAGCTGGGAGGCAGGGGCAGGCTAAGATGTGGAGCAAAAGGGCAGGTGAGGACAGAGGCCGCCGTCCGGCACTGAGAATGGGCGGCGGCGGCAGTAGCAGCACTTGGCTGGGGTCCAGAAGCCACCCTGAGGACACGCTTCCTGCCAGAGTTCCCCACCCAGCCACTGCCCTGCCCCGTGGTGGCCAGGGCTCCCAGCCTAGTTAGGGCCAGCCCCACCCACAGCCTGTCCCTGGCCCACACCCAGCCACGTGCCAATCAGGGAGCTAGGAGCCCCAGCCCTGAGGTAAGAGTCAGGAAGGAGAAGCTGGCAGGATTGGTCTGGGCAGCGCCCAAGAAGCCAGGTGCCTTGGCTCCTCCCACCCATCCCAGACAGACTTCCCTGGCTCCACTCTCTGCCAAGGGCCCTGGCACTCACCAGATTCCCTCTTGATGAGCCTGGCTGGTAGTCTGGGTGTGGCTGGGACTCTCCGCTTTGCACTCTGCTCATTCCAGTATTCCCGCCAGTGCCGCAGCTGGGAGTGGATGAAGCGCCACATGAGCCAGGCCTGGGCGGCACACACCAGCAGCAGCACGCAGAGCCTGCAGAGCAGGGGGTTAGGGGCTTAGGCTGGGGCTTGGGCTCACAGCCTTGGGCTGGGTTGTGCAGGGGAGAACAAGGGCCAGGGGCCCTGCAGTTCCCATGGCTTATCACGTCCGCCTTCACCACTGGCCCTCTTCGATACCACCACTATCACCAGGAAGAATGTGTGCTTCAGTCAGTCTCTGCTCCAGCATACATCACATGTGCCAGGGAGACGGGAAGGAAGTGGCGACAGACGTACGGCCAGCTCTACAATCACGCTACTCCTATGACGAGGGAGGGGTCCATGGCTGTGTCTGTTTTGCGCCCATTGCACAGAACAAGACTAATGTAAGCTCCACAAATATTGGTAGCATTCAAATGAACTGAATTTCTGGAAGAGTGGCTTCTCATTTAACATGTCACTTAAAAGTGGAGCAACCCTGGACAAATCACTCTCCTGGGCCTAGGGGCTCCGGAAAATAGTGGCTTCCTCACTGCCACAGGAGGCCACTGGCCAAGCCATTAAGCACATGGTTTTAAAGCACCCACACACAAGAAGAGGAGAATGATATCAACTGAGAGACTGGGTGTGATGCCTCTGTGCACCACAAAGTGCCAGACAAATGTAAGGGATTCCTATTTGGACTACAGTCTGAGCAAACCAGGACTAGGGGATGAAGATGGTTTGGATGGAACCAGAGGCTGCTATCTCTTCTCCCCTCAGGCCTGATATCCAGAGATTTCCAAAAAATAACAATATGTGGGAGACTAAAGGGTCTGCTGCCTCCAGACCTTCTGCAAGGGCTGTGCCAAGTTCAGGAGGCTCCCTGGCTTATCACCTTGGACTTCTGCTCGACTCACCTGCAAAACAAAGTGTTGAAGTTCCCTTTCTCGGGATCAAATGCCTGGTTTTCCATGCGAGCCAGTCCAAAGCCAATGGCCAGCACGGCAAGGGTGAGGATGAAGAGGCGGGTAACCCCAAAAACAGCAGCCCAGGCACTGAACCTGCTCACAGAGGCAGAAGAGGGATGTCAGTCTTTAGCGCCCTTGAAGGAATCTTCACCCACTTCTCCAGAAGAGACCCCGAGTGGGAAGAGGATTCAAGGGTGGCTGGGGAAAGTGCTTGAGGGACGAGATATCTAAAATCAGATGTTCCAGAAAAAAATAACGGGAGGGCACCACCTGCAGGTAAGCGGGCAGTGTGCAACCAGGGAGGGACCCTCCAACCATCCGGGCCTCGGGGGAACCCCTGCCCAGGCCTCTAAGCGGGCCAGCCTGCAGCAGACCCACTTACAGTTTCTCGTTGTTTTCATCTGCAAAGTAGAAGAGTCTAGCCGTGTGGAAGAGGAACTCAGTTGAGTACTGCAGCAGCAGCAAGATCAGGCCCAGGCGGCTCAGGCTGGGGGTGGGGAAGACTAGACTTACATTCCCTCCAAGATGCTGCGTGGAGCAGAAGCCATTGCATCTTGGCTCAGGCTGTCCCCTGTGCCTGGCTGGGCTCTGCTTTCCACTCCCACTTTCCCTGGCTGGCTCTGCTCCATCCTTTGGATTCAGTTTAGCTCTCACACCTTTAAGACATTTTTCCTAATACCGACCCGCTGGCCGTTCAGCTGTCCTGTCTCAGTCAGATGCCCTTGCCTGCTCCCACAGCAAACCTCGCATAGGCCCTTCACAGTACTTAGCACCTTGCACTCATCACCTAGGCTGGAACCAAGTACATAAAAGGTACTCAGAACACATTTGCTGAGCTCTGAGTATAGGAATATGAAATGTTCCTGTTGTCTGACTTTCCATTATCCAAGTCTTCACAGCTCCGAGGTACATGCAGAAGCAGCAAGTGCTCCTTCTGTGTGGCCCTGCTTATACGTTCTTCCCCGGTCCTCGCCACTGCTACGGTGACAGTGCAGACTGGCTTCTTAGACCCGTTATGCATGTGACACATGACCATCCAACACAAGGGCAGAGCTGGCATCACCCCACAGCCTTCAGCCCTCAAAGACCCATCCGGGAACTGACGCTGCTACAGGCCACCAGAGACAGGAGACAGAGTTTGAGAGCTCCTTCCCTGCCTCAGTCTTACTAATCCAAGTCAGTCATTCACACAGGATGCCTGCTGCAAGGACCTAGTCCAACGCACCTCGGGATTTCCAGGCACCTCGGCAGAAAGTTACACACAGTGAGCTCTGTAAGTGCCAGCCTAGAGAAAGTGTGGGGTGCTTTTACTGCATGGATAACACTCAGCAAAAGCCCAAATTATCAATGACACAGCTTATTAACATCAAAAGGATTCTTTTCATAAAAGAGGCTCTTCGAGAACTAATATTATAGCAATTCTTTCTGCCTCTAGAACAACCAAGAGAGACCTACTCTCCATGTCATTATAAACCAAAGGGAAGGGAATTCCAGGGCTACGAGCTCTAGCAGTGTTTGCATTGGACACTGTGAGGTAAGAGCCCAGCTTTGGGAGGCCTTCAAGCTGCAAAGCCATGGTTCAAAGGCCGACATCCACTGGAAGTCTTCCTGGCTGTCTCTGTTGAGGGTCTTCTTCTGGGTTGCAGAGCAGATGATACATACTGTGTTATGGTGTTCATCACTCTCAACTGTCCTTACTTATGTCTATAACTGTCTCTTCAGAATGAGAATGAACCACTGAAGATAAAGAATCTTCCATTACCATCTTTGTATTGCCAAGTCTTAGCATAGTGCTAGGCACACAGAGGATGTCAACAAATGCCTGATAATTATATGAGTGTGTGGACAGATGCATGGACATAAAAGGGCAAGGAAATCTGGCTGGCTCCATGGTCTCACTCACTTTAAGAGGTATGCTCCAGCTATATGCACCAGGTACAGGCAAATATACTGGAGCTGGCGGGGAATTTCCTCCTGGAAACAAGAGAAGCAGATGGTAAATTTGCTAATTCCCTAACTGAAGATTCAGGGAAGGGGGAAAAGTGCAGGGGGATGAGAGAGGGCCAGGCTCCTCTGGGCTGCTTTAACACACAGTCCCATGTCCCACGAGTCCCACAGTCCCACTGCACCAGGCTGCTGAAATTCAAGGGCATTCAGGTCCATTCCCAAATTCCAGCAGCCTTGGGTCTAGTGTCAGAGGGTGAGGTTTGGATTGAGAAATAAGAGACAGGGACTGGAGAAGAGGGCTCTTGGAAATAATTCAGAAGGAAACTATAAAAAGTAAAAATAAAAAAAGACTATGGAAATGGCAAAGACCTCTCCTTTGACATCTATAAGATGAGAGTTAGGTTTCCTCCAAAGCCACAGGTCTGGTGGAAGAGGCAGGCAAGAGACTGACACTGGTGGTCAACTACATGACACTTCTCCAAGAGATGACTCAGCATGTTGCTCAATCCCCAACATATTCCTATCACCACCCAACACTCCATGCTTCTGGAGAAAAGGAAGGGAGGTACCCCTGGGAATAGCAGGAGGGGAGTGGTCAATGAATGGCCTCCAAGAAGGGAGAGAAGTGAGCACTCACCTTCCGTACCTTCTGGAAGTATAGCTCAGGAAGTGCGTGCAGCCAGTAGGCCAGCTGGCATAGGTAGAAAAACTTCACCTGGAAGCTGGAGACAAGGGGGCAAGTCACACGGGCAGGATAGAGAAAAGTGTCCCTGCAGGTGCTGGCCAAGCACAGGAGGGAAAAGCATGGGCTGAGACTCTGCCTGTGAGGAGCTGGTCCAGGAGCAAGGGAGTTAGGCCAGTGACCGCCGCACCCTGAGCCTGGGACCCTGGCTTCTCCATTGGCCTGTGCCCTTGTTCCACATACAAAACCACTTAAAGGACACGGAAAGTCCACAGAAAGAAACAAACATGATTAAAATAGTGCAGAGGAGGAGGAATCCTTCAGCCTTGAGGAGGGAGCTGATTACAGAGCACTGTTGGAGATAGGGACCAACAGATACACTGAGACAACAAACAGCTCTAAGTAGCAAGGGAAGGTTCTAACTCAGCCCTACATCCTTTGCTATTATTGCTCTTAAAGATCTCGGGAAAGGCAGCCAGGCGTGGTGGCTCACGCCTGTAACCCCAGCACTTTGGGAGGCTGAGGCAGGTGGATCACCTGAAGTCAGGAGTTTGAGACCAGCCTGGCCAACATGGTGAAATCCCATCTCTACTAAAAATACAAAAATTAGCTGGGCGTGGTGGCACATGTCTGTAATCCAAGCTACTTGGGAGGCTGAGGCAGGAGAATCGCTTAAACCCAGGAGGTGGAGGTTGCAGTGAGCTGAAATCATGCCATTGCACTCCACCCTGGGCAACAAGAGCAAATCTCCATCTCAGAAAAAAGACAAAAAACAAAGATCTCGGGAAAGGCAAAGGGTGGCCTCCTGAGGGAGATGGCCCCAGGTATTGCCCTTGGGGTACACTGCCCTCTTGGCAGCACTATATGAGGCAGAGGACACTGGCTCTGACAGACCACCAGCCATGGCAGGCCAGAAGGGAAGACACTCTGTGGATGTCAGGGGGTCGCCAAGAAGGTAGAAACCCAGAGGGCATTATGGAGAGAGATGTTCTGCTTCTGAATCTGTCTCATGCAGTTGAGGGACCTCTGTGATGGGAGCCAGCACAGATGGAATTTCATCTGGGGATTCTCTGGTCAAGCATGCTGAGAAGAAGTGGCTTCCAGACAAGTCTACCATCCACAATAGGCTCAGGGCATGATCTGCTCGTCAGGCCAGCTGGGCCTGTGGTGTTCTGGCCACACTCCGCTGGGACAGGAAGGCAGTGGGCCCGGTCGCTCCTCCCTGGGGCTGAGTCAACAGAATACTCACGGGAGGTGCACATGCGGGTAGTCTTCCCAGAGGCTTCTTGGGTTTGTTAAGTATCCTTCCTGCAGTGGGCAAGAAGAGAGACCATTTAGAGATGTGGACGTGAGACCTGCTGGGGCCCTGGGACCGGTCCAGGGGTCAGGGATGCATCCAGTCCCCACCTGACAGAAAGAGGAAGGAACAGGAAATGTGAAAACAGAGAACTTCTCTGTGTGGGACCCCTGGCGCTTGGCTGGTTTCTTTACTGTGGAAGAGTCATGCTGGAGTAGGAAGGGCCACGCTCTGAGGTCCAACGACCCATATCTGAAGATGAGTCTGACAAGCGAATTAGTCTTGCTCCTCTGAGCAAGCTAATTAGTTTCCCTAAGCCACAGCTGGCTCATCTGCAAAACAAAATAAAAATACCCACCCTCACAGAGTTATTGTTGGAAATGAATGGGATAGTTTATGTGCCAGTGTCTAGTCCTGTGCCTGGCATGCAGGCGCTCAGGAAATGCCTCCATAATGAATAAGCAAATGAACTCTAGAATCACCACTCGCTGGAAAAATGAAAAGCCTACTTTGGCTTTTCACAGCCTGCTGAATAAAAAACATGGCAGGACCCCATAGGCCTCACCATGCAGCTGGACTCTGACACCTACCACACTGTGTCATTACTGTCAGTTGTTTCCATTACTCTTGCAAGTCCCTTCACACTAGGGCCTTTTCTTGCCTATCTTTAGAATTCTAACATGTAGTCCAGCACCTTATATGGGGTGGGGATGGCAACATGAAAATCCTTCCATCACAAAACATCTAGAAATGCTGGGTGAAATCTAATGAATATTCTTTTAAATGCAAAGAGCTGAGCTCACAGTAAGAAAGGGAAACCCCCTGGGACCCAAAGGGAGAGGGAGGCTAAAAGGCAGAGCAGTAAAGTGACACTGTAGCAGCCCAAAAGGCACTAGTTATGGGCCAGGGTTTTTGTGCCCATGTGAGAACAGAAGATGGTGCCTTGGGAGGTGGAACCCAAGACCTTGTATAAGACCAGGACCTCTGAAAGGCCACAATCTCAGAGAAAGGAAAAGACTAGAAAGTGTTTGCTGACCAACACAGGGAAATGAAGATGTCTGCTCAGCCCATACCCAAGGTGAAAACAAAATCATTTATTCTAAAAATCTGCAACCTCAGGTTCACTCTGAGTTTGGAGGTGAAATATACTACCTGTGTGATCCAAAAGCCGCCAAGGTAAGAAATTAGAATTAATAGTGTGGTGGGCCAGTGATACCCTGGGGACATACCCTCATCCAAGGATGCTCCACAGATAAAACCTTGCTAAAGATGAATTTATAATCCAAGAGTACAAAGCATGGGAAGAAATAATCTACCACAAGCAAGAGTCAGCTGAAACTACAGGAGTGCAATACACACCAGTTGGTTGAATGAATGAATGATGAATGCTTTGGGCAATTTCTCTCTTCTGAAGAAAGGGCTCTTATTTGTCACTCAGAGAAGGCAGAGCAGATTAGATTAGGATGACTTCATTTTAGAAATGGGAAAATGAAAAAACAGATAGGAAGGATCTCCTGAAATAAGATAGTTTTGTTTTGTTTTTTTGATATGGAGTTTTGCTCTTGTTGCCCAGGCTGGAGTGCAATGGCACGATCTCAGCTCACTGCAACCTCTGCCTTGCAGGTTCAAGCGATTCTCCCGCCTCAGTCCTCCTGAGTAGCTGGGATTACAAGCACGCAACACCACACCCGGCTATTTTTTGTACTTTTAGCAGAGACGGGGTTTCACTATGTTGACCAGGCTGGTCTCAAACTCCTGACCTCACTTGCCTCGACCTCCCAAAGTGCTGTGATTACAGGCGTGCACCATTGCGCCCAGCCAAGATAGTTTTTCAGTAGCACAGCTGAAATCCGAGTTGGGCCACAAGCCTTCTGGTCCAATAACTTCAGGCTAGGTTGCTTCAGTAAATCAGAAAATCAGCTGAGCTGGTGGCTTTGATGAGAAGGCTGAGAACCTCAGATGTTCACACTGGGATTAAAGGCAGAGGTTTTACAGTGCTCAGAATGAGGCCAACAGGGTTTAGTAAGAAGCATTCTAGGTTATTGTCTATTAGGATCTTTAGTTGTATTTCCAAGTGAGGGCTGATCCACCCACCTTTGAGTCACTAAACGCCCTGTGACCTATCAGCATGCCTTTCGGGTATAGTCCACGGCCCTAATCCCACAAACTTGGGCCTCCATGAGCACAATAACCTGACTGATAAGTCCTTTTATCGGATACATCTATACCACTGTAGTCACAGTCACCTGGATTAGAAGGAAATGATCTCACTTCGAACTTACATGGCCTCATTTCTAATCTCTTCTCACTACCACTCTCTCCTCCCTGGGTCACGTGCCGATTGAGGAATAAAAGTGGATGAGGCTCTCGGGTGGTGGCGTGTGTGGTGGCGGTGACAGTTGTGAGCTCTCTCAAATACACTGCTTCTATCACCTCTACCCACCCACTCTGTCGGGCATACGCCTGCCTTCATCAGCTCTCCTGCCCCAGGCTACCTCATTCCAGGGACATCAGAAAGGTGAGAATGTCTCTTCCTAGAGGAAGCAGGAATGTACTTAGCAGGAAAAATGGTACTTCTGAAACTGAGGTGGGAGAGAAAGTTTTGCCCAAACAAGACTCGCCAAGAAAAGCAGCACTGAGAGCAATGTAAAGCCCAGAAAATCTCGTGATTTTAAACAGGAACGCTCCTTGGCTTGGCCTCTTACTTAGAGACAAAGAGGTCAGAACTTTGAAGCCAAAAAGCAAAGAAACTCCCCAGAAAAATGTTGCCTGCTTGTGAATGTCCAGTCCACGGGGACTGGAGGAGGAAAAGGGTGGAGGGAGGAGAGCAGGGGGAGCCAGAGGAAAAATGACTCACTGCTCTGAGAACAGCCTTTTCCAGACCTCTGTCCAGGCAGCTGTCTGAAGGAGGACTGAGGCTGGGGCACCCTCTGAGCTCAGGCACGCAAAGCACCTGAGTCCACAGGGGGCTGAGTGTGACCCAGCAAGCACCTGAAACCCACCCCAAATCCCATCCACTGACAGGCCCCAGCAGATGGTTTGGAGAGGCTTTTGAAATCCTTTGTTCTCTCGATTCTACAAATCCACCCATGAGCTAAGCAAGGCCTCAACAAGGTGGAGAGATCCCTCCTGTTTCCCCAGCAGCCTTCCTTTTGGTGTGTGAACAAACACAACCACGAAGAACAGCATAATTCAGATATAGCACAGGCAAGTGCTACATAAATTCAGACATACCTTATATTATTTGACCATCAGAACAACCATGCACTAAAAATCTGCCCTAAAGCAACTAGTCTGTTAGTAGAAACCGGTCCTGGTACAAGCACCAGCATTAAGGACATTCCCTCTACTTGGTTCTAA,2.48,[CLS] ACAGG ACAGG AGTGAGG ACAGG AGGTGGCC TGAGGGGG AGAAAGAGAA AGATT TTTGGC TTTATTG AGAATGG TTTGTGG AAGAATAAG AGGAAGCC AAGAAGAAGG AAAGCG AAAC GCCCCC TCCCCCC ATTGC AAGACAGG TTTCGGC TGTTTG AGACGG AGCATCAC AGGC AGGAAGG AGGAGGC AGGGAGGG GGCC TGGGCTCC TTGCCCCC TGCTC GGCCCCC ACCAAG AGGATTCC TGTTC TTAGCAC TTTGGCC TTAGGG AGACTTG AGTTTC TTAG TCCG TGGGG AGG TTCCG TTCTC TGCCTTC ACCACTCC ATTTTC ATGG TAACC TGGG AAGTGG AGAGAGAC AAGC ATACATGG TGTTTC TGCTGG AGCTAAGGC AGAAG AGGGGAGGG TGGGGCC AGGCCAAGG AAGGGGCCC GGGC AGCCC AGCTGC TATACATGG ATGCACC AAAGGGGC GCC AGGCTGC AGCCTTGC ACAGC AAATGC AAGCC AGCAGAC GGCTCCC AGGAGGG TCCTGTC TTCCCC AGGGCCC TGGACTAG TGGCCC TGTTTG AGAGGC TTGGTCTC TGACTGC ACTTTAGC AGGAGGG GCCTGGG ATGACAC ACAGTAAC TCAGC AACAAC AGAGGCC AGCCTGCCC AAGCC TGAGGC TGGGGC TAGATAC TCGCCG AAATC ACTTAG ATGC TGTCACTGC TCACTGTCC TCAGTTC TTCTC AGGCCCC TGCAAGGC ATCAGCCC ACTTCC AGTTC AGCAAGAAC TCCC AGGAGC AGTGGCC ACAGAAGGG AGGGGG ACAAG AGGC TGTAGG AAC AAGGCC TCAAGC AGGATGCC TGACAC TCCTCTGGC AGAAAA ATTG TGCTC TATTG TTCAAAA TACC TCCG TGCGC TTGC TCAAATTC AGAGGTAC TGGCTGC AGTC TTATG CCCC ATACC TCCCCC GCCAGCC AGGCC TGAC TCTGTG ACACACCC AGCTGC GCGCG TGTC TGGTTC AAACAC ACATAAGCC TTTGCC AAGCAGG TGGCC ACCTAG AGAAAAGC AGG TGAGTC AGAAAGC AGCGCCC AGTGC AGACAGGCC CCCAGGC TGGGC AGAACGTGC AGGGCTGGC AGGGCC TGAGG ACCTGC TGAAGG TGGGTGATG ACTGG AGTGCG TGCAC GGGCC AAAGG ATAAG TGTCCC ACCCC TACCCCCC ACCTAGC ACTATG TCACTGTG AGTCATTC TTGGAGAC AGAGG AGGAGCC AGCAAGC TGGGAGGC AGGGGC AGGCTAAG ATGTGG AGCAAAA GGGC AGGTGAGG ACAGAGGCC GCCG TCCGGC ACTGAGAA TGGGC GGCGGC GGC AGTAGC AGCAC TTGGC TGGGGTCC AGAAGCC ACCCTGAGG ACACGC TTCCTGCC AGAG TTCCCC ACCCAGCC ACTGCCC TGCCCC GTGG TGGCCAGGGC TCCCAGCC TAG TTAGGGCC AGCCCC ACCC ACAGCC TGTCCC TGGCCC ACACCC AGCC ACGTGCC AATC AGGGAGC TAGG AGCCCC AGCCC TGAGG TAAGAGTC AGGAAGG AGAAGC TGGCAGG ATTGG TCTGGGC AGCG CCCAAG AAGCC AGGTGCC TTGGC TCCTCCC ACCCATCCC AGACAGAC TTCCCTGGC TCCAC TCTCTGCC AAGGGCCC TGGC ACTCACC AGATTCCC TCTTG ATGAGCC TGGC TGGTAG TCTGGG TGTGGC TGGGACTC TCCGC TTTGC ACTC TGCTC ATTCC AGTATT CCCGCC AGTGCC GC AGCTGGG AGTGG ATGAAGC GCC ACATG AGCCAGGCC TGGGCGGC ACACACC AGCAGC AGCACGC AGAGCC TGCAGAGC AGGGGG TTAGGGGC TTAGGC TGGGGC TTGGGC TCACAGCC TTGGGC TGGG TTGTGC AGGGG AGAAC AAGGGCC AGGGG CCCTGC AGTTCCC ATGGC TTATC ACG TCCGCC TTCACCAC TGGCCC TCTTCG ATACC ACCAC TATCACC AGGAAG AATGTG TGCTTC AGTC AGTCTC TGCTCC AGCATAC ATCAC ATGTGCC AGGGAGAC GGG AAGGAAG TGGCG ACAGAC GTAC GGCC AGCTCTAC AATCAC GC TACTCC TATGACG AGGGAGGGG TCCATGGC TGTG TCTGTTTT GCGCCC ATTGC ACAG AACAAG ACTAA TGTAA GCTCC ACAA ATATTGG TAGCATTC AAATGAAC TGAATTTC TGGAAG AGTGGC TTCTC ATTTAAC ATGTCAC TTAAAAG TGGAGC AACCCTGG ACAAATC ACTCTCC TGGGCC TAGGGGC TCCGG AAAATAG TGGCTTCC TCACTGCC ACAGG AGGCC ACTGGCC AAGCC ATTAAGC ACATGG TTTTAAAGC ACCCACAC ACAAGAAG AGGAGAA TGATATC AAC TGAGAG ACTGGG TGTGATGCC TCTGTGC ACCAC AAAGTGCC AGACAAATG TAAGGG ATTCC TATTTGG ACTAC AGTCTG AGCAAACC AGGACTAG GGG ATGAAG ATGGTTTGG ATGGAACC AGAGGC TGCTATC TCTTC TCCCC TCAGGCC TGATATCC AGAG ATTTCC AAAA AATAAC AATATG TGGGAGAC TAAAGGG TCTGC TGCCTCC AGACC TTCTGC AAGGGC TGTGCC AAGTTC AGGAGGC TCCCTGGC TTATC ACCTTGG ACTTC TGCTCG ACTC ACCTGC AAAACAAAG TGTTG AAGTTCCC TTTC TCGGG ATC AAATGCC TGGTTTTCC ATGCG AGCC AGTCC AAAGCC AATGGCC AGCACGGC AAGGGTG AGGATGAAG AGGCGGG TAACCCC AAAAACAGC AGCCCAGGC ACTGAACC TGCTCAC AGAGGC AGAAGAGGG ATGTC AGTC TTTAGC GCCC TTGAAGG AATC TTCACCC ACTTC TCCAGAAG AGACCCCG AGTGGG AAGAGG ATTC AAGGG TGGCTGGGG AAAGTGC TTGAGGG ACG AGATATC TAAAATC AGATGTTCC AGAAAA AAATAAC GGG AGGGC ACCACC TGCAGG TAAGC GGGC AGTGTGC AACC AGGGAGGG ACCCTCC AACCATCC GGGCC TCGGGGG AACCCC TGCCC AGGCC TCTAAGC GGGCC AGCCTGC AGCAGACCC ACTTAC AGTTTC TCG TTGTTTTC ATCTGC AAAG TAGAAG AGTC TAGCC GTG TGGAAG AGGAAC TCAGTTG AGTACTGC AGCAGC AGCAAG ATC AGGCCC AGGCGGC TCAGGC TGGGGGTGGGG AAGAC TAGAC TTAC ATTCCC TCCAAG ATGC TGCG TGGAGC AGAAGCC ATTGC ATCTTGGC TCAGGC TGTCCCC TGTGCC TGGCTGGGC TCTGC TTTCC ACTCCC ACTTTCCC TGGCTGGC TCTGC TCCATCC TTTGGATTC AGTTTAGC TCTC ACACC TTTAAG ACATT TTTCCTAA TACCG ACCCGC TGGCCG TTCAGC TGTCC TGTCTC AGTC AGATGCCC TTGCC TGCTCCC ACAGC AAACCTC GC ATAGGCCC TTCACAG TACTTAGC ACCTTGC ACTC ATCACC TAGGC TGGAACC AAGTAC ATAAAAGG TAC TCAGAAC ACATTTGC TGAGC TCTG AGTAT AGGAA TATGAAATG TTCCTGTTG TCTG ACTTTCC ATTATCC AAGTCTTC ACAGC TCCG AGGTAC ATGC AGAAGC AGCAAG TGCTCC TTCTGTG TGGCCC TGC TTATAC GTTC TTCCCC GG TCCTC GCCACTGC TACGG TGACAGTGC AGAC TGGCTTC TTAG ACCCG TTATGC ATGTGACAC ATGACC ATCC AACAC AAGGGC AGAGC TGGCATC ACCCC ACAGCC TTCAGCCC TCAAAG ACCCATCC GGGAAC TGACGC TGCTAC AGGCC ACCAGAG ACAGG AGACAGAG TTTGAGAGC TCCTTCCC TGCC TCAGTC TTAC TAATCC AAGTC AGTCATTC ACACAGG ATGCC TGCTGC AAGG ACCTAG TCCAAC GC ACCTCGGG ATTTCC AGGC ACCTCGGC AGAA AGTTACAC ACAGTG AGCTCTG TAAG TGCCAGCC TAGAGAA AGTGTGGGG TGCTTTT ACTGCATGG ATAAC ACTCAGC AAAAGCCC AAATT ATCAATG ACACAGC TTATT AACATC AAAAGG ATTCTTTTC ATAAAAG AGGC TCTTCG AGAAC TAATATT ATAGC AATTC TTTCTGCC TCTAG AACAACC AAGAGAG ACCTAC TCTCC ATGTCATT ATAAACC AAAGGG AAGGG AATTCC AGGGC TACG AGCTC TAGCAGTG TTTGC ATTGG ACACTGTG AGGTAAG AGCCC AGCTTTGGG AGGCC TTCAAGC TGCAAAGCC ATGGTTC AAAGGCCG ACATCC ACTGG AAGTC TTCCTGGC TGTCTC TGTTG AGGG TCTTC TTCTGGG TTGCAGAGC AGATG ATACATAC TGTG TTATGG TGTTC ATCAC TCTCAAC TGTCC TTACTTATG TCTATAAC TGTCTC TTCAGAA TGAGAA TGAACC ACTG AAGATAA AGAA TCTTCC ATT ACCATC TTTGTATT GCC AAGTC TTAGC ATAGTGC TAGGC ACACAGAGG ATGTCAAC AAATGCC TGATAA TTATATG AGTGTG TGG ACAGATGC ATGG ACATAAAA GGGC AAGGAAATC TGGC TGGCTCC ATGGTCTC ACTCAC TTTAAG AGGTATGC TCCAGC TATATGC ACC AGGTAC AGGC AAATAT ACTGG AGCTGGC GGGG AATTTCC TCCTGG AAACAAG AGAAGC AGATGG TAAATTTGC TAATTCCC TAACTGAAG ATTCAGGG AAGGGGG AAAAGTGC AGGGGG ATGAGAG AGGGCC AGGC TCCTC TGGGCTGC TTTAAC ACAC AGTCCC ATGTCCC ACG AGTCCC ACAGTCCC ACTGCACC AGGCTGC TGAAATTC AAGGGC ATTC AGGTCC ATTCCC AAATTCC AGCAGCC TTGGG TCTAG TGTC AGAGGG TGAGG TTTGG ATTGAGAA ATAAG AGACAGGG ACTGG AGAAG AGGGC TCTTGG AAATAA TTCAGAAGG AAAC TATAAAA AGTAAAA ATAAAA AAAG ACTATGG AAATGGC AAAG ACCTC TCCTTTG ACATC TATAAGATG AGAG TTAGG TTTCCTCC AAAGCC ACAGG TCTGG TGGAAG AGGCAGGC AAGAGAC TGACAC TGGTGG TCAAC TACATG ACAC TTCTCC AAGAGATG ACTC AGCATG TTGC TCAA TCCCCAAC ATATTCC TATC ACCACCC AACACTCC ATGC TTCTGG AGAAAAGG AAGGG AGG TACCCC TGGG AATAGC AGGAGGGG AGTGG TCAATGAA TGGCC TCCAAG AAGGG AGAGAAG TGAGC ACTCACC TTCCG TACCTTC TGGAAG TATAGC TCAGGAAG TGCG TGCAGCC AGTAGGCC AGCTGGC ATAGG TAGAAAA ACTTC ACCTGG AAGC TGGAGAC AAGGGGGC AAGTCACAC GGGC AGGATAGAG AAAAG TGTCCC TGC AGGTGC TGGCC AAGCACAGG AGGG AAAAGC ATGGGC TGAGAC TCTGCC TGTG AGGAGC TGGTCC AGGAGC AAGGG AGTT AGGCC AGTGACC GCCGC ACCC TGAGCC TGGGACCC TGGC TTCTCC ATTGGCC TGTGCCC TTGTTCC ACATAC AAAACC ACTTAA AGGACAC GGAAAG TCCAC AGAAAGAA ACAAAC ATG ATTAAAA TAGTGC AGAGG AGGAGG AATCC TTCAGCC TTGAGG AGGGAGC TGATT ACAGAGC ACTGTTGG AGATAGGG ACCAAC AGATACAC TGAGAC AACAAAC AGCTC TAAGTAGC AAGGGAAGG TTCTAAC TCAGCCC TACATCC TTTGCTATT ATTGC TCTTAAAG ATCTC GGG AAAGGC AGCCAGGCGTGG TGGCTCACGCC TGTAACCCC AGCACTTTGGG AGGCTGAGGCAGGTGG ATCACCTGAAG TCAGGAGTTTGAGACCAGCC TGGCCAACATGG TGAAATCCC ATCTC TACTAAAAATACAAAAATTAGCTGGGCGTGGTGGC ACATG TCTG TAATCC AAGCTAC TTGGGAGGCTGAGGCAGGAGAA TCGC TTAAACCC AGGAGGTGGAGG TTGCAGTG AGC TGAAATC ATGCC ATTGCACTCC ACCC TGGGCAACAAG AGCAAATC TCCATC TCAG AAAAAAG ACAAAA AACAAAG ATCTC GGG AAAGGC AAAGGG TGGCCTCC TGAGGG AGATGG CCCC AGG TATTGCCC TTGGGG TAC ACTGCCC TCTTGGC AGCAC TATATG AGGCAGAGG ACAC TGGCTCTG ACAG ACCACC AGCCATGGC AGGCC AGAAGGG AAGACAC TCTGTGG ATGTC AGGGGG TCGCC AAGAAGG TAG AAACCC AGAGGGC ATTATGG AGAGAGATG TTCTGC TTCTGAA TCTGTCTC ATGCAGTTG AGGG ACCTCTGTG ATGGG AGCC AGCACAG ATGG AATTTC ATCTGGGG ATTCTCTGG TCAAGC ATGCTGAG AAGAAG TGGCTTCC AGAC AAGTC TACCATCC ACAATAGGC TCAGGGC ATG ATCTGC TCG TCAGGCC AGCTGGGCC TGTGG TGTTC TGGCCACAC TCCGC TGGGACAGG AAGGC AGTGGG CCCGG TCGC TCCTCCC TGGGGC TGAGTC AACAGAA TACTCAC GGGAGG TGCACATGC GGGTAG TCTTCCC AGAGGC TTCTTGGG TTTGTTAAG TATCC TTCCTGC AGTGGGC AAGAAG AGAGACC ATTTAG AGATG TGGACG TGAG ACCTGC TGGGGCCC TGGG ACCGG TCCAGGGG TCAGGG ATGCATCC AGTCCCC ACCTGAC AGAA AGAGGAAGG AACAGG AAATG TGAAAAC AGAGAAC TTCTC TGTGTGGG ACCCC TGGCGC TTGGC TGGTTTC TTTAC TGTGG AAGAGTC ATGCTGG AGTAGG AAGGGCC ACGC TCTG AGGTCC AACG ACCC ATATC TGAAGATG AGTCTG ACAAGCG AATT AGTCTTGC TCCTCTG AGCAAGC TAATTAG TTTCCC TAAGCC ACAGCTGGC TCATCTGC AAAACAAAA TAAAA ATACCC ACCC TCACAGAG TTATTG TTGGAAATG AATGGG ATAG TTTATG TGCCAGTG TCTAGTCC TGTGCC TGGCATGC AGGCGC TCAGG AAATGCC TCCATAA TGAATAAGC AAATGAAC TCTAG AATCACC ACTCGC TGGAAAA ATGAAAA GCCTAC TTTGGC TTTTC ACAGCC TGC TGAATAA AAAAC ATGGC AGGACCCC ATAGGCC TCACC ATGCAGC TGGAC TCTGACACC TACC ACACTGTG TCATTAC TGTCAGTTG TTTCC ATTACTC TTGC AAGTCCC TTCACAC TAGGGCC TTTTC TTGCC TATCTTTAG AATTCTAAC ATGTAG TCC AGCACC TTATATG GGGTGGGG ATGGCAAC ATGAAAA TCCTTCC ATCAC AAAAC ATCTAG AAATGC TGGGTGAA ATCTAA TGAA TATTCTTTT AAATGC AAAGAGC TGAGC TCAC AGTAAG AAAGGG AAACCCCC TGGGACCC AAAGGG AGAGGG AGGCTAA AAGGC AGAGC AGTAA AGTGACAC TGTAGC AGCCC AAAAGGC ACTAG TTATGGGCC AGGGTTTT TGTGCCC ATG TGAGAAC AGAAG ATGGTGCC TTGGG AGGTGG AACCCAAG ACCTTG TATAAG ACCAGG ACCTC TGAAAGGCC ACAATCTC AGAGAA AGGAAAAG ACTAG AAAG TGTTTGC TGACC AACAC AGGGAAATG AAGATG TCTGC TCAGCCC ATACCC AAGG TGAAAAC AAAATCATT TATTC TAAAA ATCTGC AACCTCAGG TTCACTCTG AGTTTGG AGGTGAA ATAT ACTACC TGTG TGATCC AAAAGCC GCC AAGGTAAG AAATTAGAA TTAATAG TGTGG TGGGCC AGTG ATACCC TGGGG ACATACCC TCATCC AAGG ATGCTCC ACAG ATAAAACC TTGCTAA AGATG AATTTAT AATCC AAGAGTAC AAAGC ATGGGAAG AAATAA TCTACC ACAAGC AAG AGTCAGC TGAAAC TAC AGGAGTGC AATAC ACACC AGTTGG TTG AATGAATGAA TGATG AATGC TTTGGGC AATTTC TCTC TTCTG AAGAA AGGGC TCTTATT TGTCAC TCAG AGAAGGC AGAGC AGATT AGATT AGGATG ACTTC ATTTTAGAA ATGGG AAAATGAAAA AAC AGATAGG AAGG ATCTCC TGAAATAAG ATAGTTTTG TTTTGTTTTTTTG ATATGG AGTTTTGCTCTTG TTGCCCAGGCTGGAGTGCAATGGC ACG ATCTCAGCTCACTGCAACCTCTGCC TTGC AGGTTCAAGCG ATTC TCCCGCC TCAG TCCTCC TGAGTAGC TGGGATTAC AAGC ACGC AAC ACCACACCCGGC TATTTTTTG TACTTTT AGCAGAG ACGGGG TTTC ACTATG TTGACC AGGCTGGTCTCAAACTCC TGACC TCACTTGCC TCGACC TCCCAAAGTGC TGTG ATTACAGGC GTGC ACCATTGC GCCC AGCCAAG ATAGTTTT TCAGTAGC ACAGC TGAA ATCCG AGTTGGGCC ACAAGCC TTCTGG TCC AATAAC TTCAGGC TAGG TTGCTTC AGTAA ATCAGAAAA TCAGC TGAGC TGGTGGC TTTGATG AGAAGGC TGAGAACC TCAG ATGTTC ACAC TGGGATTAAAGGC AGAGG TTTTACAG TGCTCAGAA TGAGGCC AACAGGG TTTAGTAAG AAGCATTC TAGG TTATTG TCTATT AGGATC TTTAG TTGTATT TCCAAG TGAGGGC TGATCC ACCCACC TTTG AGTCAC TAA ACGCCC TGTGACC TATCAGC ATGCC TTTCGGG TATAGTCC ACGGCCC TAATCCC ACAAAC TTGGGCC TCCATG AGCACAA TAACC TGAC TGATAAG TCCTTTT ATCGG ATACATC TATACC ACTGTAG TCACAGTC ACCTGG ATTAGAAGG AAATG ATCTCAC TTCG AACTTAC ATGGCC TCATTTC TAATCTC TTCTCAC TACC ACTCTC TCCTCCC TGGG TCACG TGCCG ATTG AGGAATAA AAGTGG ATGAGGC TCTC GGGTGG TGGCG TGTG TGGTGGC GGTGAC AGTTG TGAGCTCTC TCAA ATACAC TGCTTC TATC ACCTC TACCCACCC ACTCTG TCGGGC ATAC GCCTGCC TTCATC AGCTCTCC TGCCCC AGGCTACC TCATTCC AGGG ACATC AGAAAGG TGAGAA TGTCTC TTCCTAG AGGAAGC AGGAATG TACTTAGC AGGAAAA ATGGTAC TTCTGAAAC TGAGGTGGG AGAGAA AGTTTTG CCC AAACAAG ACTC GCCAAG AAAAGC AGCAC TGAGAGC AATGTAA AGCCC AGAAAA TCTC GTG ATTTTAAAC AGGAAC GCTCC TTGGC TTGGCC TCTTAC TTAGAG ACAAAG AGG TCAGAAC TTTGAAGCC AAAAAGC AAAGAA ACTCCCC AGAAAA ATGTTGCC TGCTTG TGAATGTCC AGTCC ACGGGG ACTGG AGGAGG AAAAGGG TGGAGGG AGGAGAGC AGGGGG AGCC AGAGGAAAA ATGAC TCACTGC TCTGAGAAC AGCC TTTTCC AGACC TCTG TCCAGGC AGCTGTCTG AAGGAGG ACTGAGGC TGGGGC ACCCTCTG AGCTCAGGC ACGC AAAGC ACCTGAG TCCAC AGGGGGC TGAGTGTG ACCCAGC AAGCACC TGAAACCC ACCCC AAATCCC ATCC ACTGAC AGGCCCC AGCAGATGG TTTGG AGAGGC TTTTG AAATCC TTTGTTC TCTCG ATTCTAC AAATCC ACCC ATGAGC TAAGC AAGGCC TCAAC AAGG TGGAGAG ATCCCTCC TGTTTCCCC AGCAGCC TTCC TTTTGG TGTGTGAAC AAACAC AACCACG AAGAAC AGCATAA TTC AGATAT AGCACAGGC AAGTGC TACATAA ATTCAGAC ATACC TTATATT ATTTG ACCATC AGAAC AACCATGC ACTAAAA ATCTGCCC TAA AGCAAC TAGTCTG TTAGTAG AAACCGG TCCTGG TACAAGC ACC AGCATT AAGG ACATTCCC TCTAC TTGG TTCTAA [SEP]
,,,,


In [None]:
df = dataframe_creation(attributions_sum, all_tokens, 52367734, 6)

In [None]:
bed_file_creation(df, './67637')

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_neg['score']= df_neg['score']*mult*(-1)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_pos['score']= df_pos['score']*mult


# SE_67718

In [7]:
text = 'AGCTACTTGGGAGGTTGAGGCAGGAGAATCACTTGAACCAGAAGGCAGAGGTTGCAGTGGGCCGAGATCACGTCATTGCACCCCAGCCTGGGCAACAAGAGGGAAACTCTGTCTCAAAAGAAAAAAAAAATTAACACAGGTAAAAAGCTTAGATCAGTGCTGAGCACAATATAAACCCATTAGTGGCTAAACCATCAACAAGTGTTGGGAGCTGCTGCTATTTTTACTTTCCCTAGAATTCTATCTCTTACCTTTCACTCTTCTCACTGCCCTTATTTGCCCAGAAATCCCTTTATGTCCTGAAAAACTCAACTCTCATATTTTACTTTTAGGAAATTATCAGTTACTGCTCTAACACAGTTCTTGATGTATGCTCTTCACTCCCTGACCTTTTGCTTTGTTGATACTTTATTATTGTACTTACGACTCCATACTTAAAAAATATAATTGGTAAAAAAAAATGTAACTAGTAATAGGCAGAAAAACTGGAATTGATTCCCAGTGCCTGTTACATGACAGGGGCTCATTATATACTTGCTGAGTGAATGATGGAAGGTCAAGTGAACAAATTAGAGAAATCAGGCAGAAAATATTTCCAGGTATCTTGGGGAGTTGAGAATTAGAGAAGAAAAGAATGAAGGAGGTTGGGATTTGATGAAGAACATATTTGTGACAGTGAAACTCAGTCGTGGGATTTGCTGTTTATATTGTTTTCTTTCCTTCTCAAATCAACATGAGTTGTACAGACCATAATAAAAGCTTCATCTTGAGCCTGTTATTGCATCACCATTTGGCTGATGTTTCACTGCTCCATCACTGTGGGAGGTTAACACTCACTGAGGGGTGGCAGTACCCTCTGCATTTCTCTGGGAAACTCCAATGATTCATCCAAAAGTGTGAGAAGCCAAGCAGCTTTTATCACCCAGGAGACAGCTGTAACCTGACCTCAATTCATGCCAAAGAAGCCTGAGGAAAGTGCCCTGGAAGTGAACAGCCTGCTCATGACTCAAGGAACTCAAAAGTCAGAGTTCTGACCAGTATTGTTGGGGTGGGTAAAAGAACTTCACTCCCTCAGATCTGAAAGTGTCCTTGCCAGAGGAGAGGGAGACCTTATTTCAAGTGTGTTTGAATAAACATGACATACATAAACTTGATTTTCCAGGTTTTGGAGAAAGCATACATTTGTCCTCTGCATCATGAAATAATGTCCTTGGTGGCTCCTTTCAGGGCCTGTGCTGCACTCTCCTTAGTGACTATTAGCATTGGAGTTGGACAATTTAAGGGCAGGAGTGGAGACCTGCTACTTATAAAGGATGACTACACTTATTTAGGGATACTGCTCACGCTGACTCTCAGAGCAATTCTTTTGTTCCAACAGCTGTTCCCAGGGTAGGGTAATATTGGAACAGAGGCTTATGCTGCAGTATCCATTGAGTGGGACTGAGGCCCCTTCAGTAGCTGAAAATCCCCACTTCAGTGCTACTGCTTCAGCTACTGCAGCTCTTACTGTCTTCAAAAACAATGGTAAGGATTCCTTTAACCTCAGAGGAGGAATTAGCTTTTTGCAGAGACTACAAAGAATCCATAGGATACAAACATTTCTATAGTCCAGGAAGGAGTCCCACATATAAAAACAAAACTGTAATATATTTTATAAGTGATTTGCCTAAATATGTGAGGCTGTATTCACTCAGTTTCTCAAGAAGCATTTCTTGAGAAGCTACTGTGTGCCAGAGCCTCCTTAGGGGGCAGGAACTGCTTATTTATCTTCATATCAACATCCCTAGGTAAGTGCCTAGCCCATCGTATGGGCTACAGACTATGCAATGCTATTTCCCTTAGCCCCACCAGAGTTCAGGGTCAGACTGATGGGCAGGACTATGAACAGATCTTCTTTCTCTCCTTGAAGGTAACTAACCTTCCATGGGACTTGAAGCTTCAGATTTTGGCCTTAACCAAGTCAACTAGCTCAAGTCAGAGGGGCAGTGATTATTTGAATTGCCAAGGTATTACCTAATGAGAATCTTTGTGACTAAGCTCTTAAAGTTGAAACTTAAGTAACATTAGCTGAAAAACTTGTTGGATAAACATTGCTACTCCCTTGAAAATTCCGGGAGTTCCAGTTTGGTTGCTGACCATTTTTTACCATTTATCTATTTGTTTAGCACTAACGTTTCTTAAGCTTCCAATGTATATAGAATGCTATGCTGGGTTGTGGGAAATACAATGAGCTATGCTCCCTGTCTGCAAGTCGGTCACATTTTAAGTGGGGGTGCAATAAATGACAGATTCAAACCACTGAACAATTATTAACAGAGAAAAGCAACTTTTATGGGCAAAGGCTTTCGGCAACTCCAGGCACAGTCTCACCCAAGGCCTTGATTGTGGCACTGCTTCTGTCACAGAGAATAAGAGTGAAATGTTAGAAGACTGTTGAAACACTGCGGAGTTAATGTTATGTTCCTTTTCATCTTTGGGTCTTTGTACATGCTGGTTCCTTGTCTTCCCACCACTACCCCTATATCATTTATCTAATTAAAACTCATAAACATGAATGAGAAGCCCTTTTTGACCACCAGCCTACAAACAGACACACAGACACACACACACACACACACACACACACACACACACACACTGCGTTGTCCTTCCATTGAGGTACCAACAGCACACTATAATTTCTCCATTATGATAGCATTTATTACAAGGTATTATGATTTCTGTTTAACTTCTCTGTATCCCTCCTGCCTGCTACATTGTAACTTCTGTGACTGCAGGGATATATCTGTTTTGTTCACCATTATATTGGCTAGCATGTAGCAGCCATTCAATAAATACTTGCTGAATGCATGAATGAACGGCTGAATGGCAGAACCAACATTTGAGTAAAATTTTCGTGTATTGTTTACTTTGTGCTATAACTTCCTAGGTATTTTATGGATCTTCTTTCTGTGGGGTTATATATAGTATAAATTTGTTGCAATATTATATTCTTTTTAAATGCCTCAGTCACTTGTTAAATTTAGTGCTTGTTGCAGAAGGGTATAATGTTACTGATAGGAAAGCCATAGTCTTGATCCCTATATCGAGGCCAAATGGCTTCTTATCTGGAAATCTCTGCCTTAAATTGAGCAGTATCTAGATTAGATGTTTTGAAACTATGTATCACTCACTATGGTGGGCAAATAGTTCAGACAGACTAGGAGACGGGATATGAGAAACTTAGAATAAGCTACAAGAAGAATTCTAAAGACACATGACCCATTAAATTCCTTTTTCATTGAAAATCAGACCAAAATCTGTGGCAAAAACAGAAAACGTATTCCGGAAATATGGCTGTAGAACTGAAGACTAAATAGCAAGCAGTGTTTAATCTGAAGTAATGAATGTTATTTCAAGGAGCAAAGAAGCTAACACTTGCAATAAATCTTTGTTTTGAAGTATCTTTCTCAAAGGTCATCAAAATAAGTTTTAATTTAGATTCCTAAATCCAGTTTCTGCTCTGTTAGTTATTGGGGATTTTTTGAATAAATAATCTACGCAGAACTGTGGACTCTGCTCTGCTTTTTCAACCCCATGGTGTGGTCATCCAGAAAGGATTTCTTCTCCGCTCTAGGCTTAGAAATGGGGTACCTCCTGCCTGATGTATCCTATGCTTTCCAGAACCTGAAAGATTAAGATGAATCATTACAAGTGAAATGACCCTAGACAGAGAACAAAGAGGGCTGGCACATGTTTGCTGTAACATTCCGGGAGAGCTCTTCATCCCGTTTACATGTTCTTGAGAGGGTGCCTTCCGTGCTGTGATGAATGAGCCACCCAGACCTCCCGCTACCACACAGCAATTGTTTAGTCAGAGATCCTGTGCATCTGGGTCTTTTTTTTAATCAGCAGGTTCTAAATAAAAAACAAAAAACAATAACAAGCCCACCCTCTCTGAATATGACTCTCTGACTCTCTTGTGTTTCTTGTTTACATTTTATTGTGCGAATGTGATTCTGCTTCTTAGCCTAGTGCATTTGGATTTGTTGTTCACACTGAGCATAAATTGCCAAACACTCAACTTTAATCTAATTGTACATACTATAAACAGAAAATGTTGACGTTAAAAGCATTTCCATAATCACAGATTGGGTGTATGGATGAGCAAGTGGATGAGTTAGGCCTTTTGTCATCTCAGTCCATAGCTTGATCCTTCAGGTATTCAAAAGGAAACGGGGACTGTCTTCCACTGATGACCTCACTGATGATGAGGTTCATCTGCCACCATCTATAGTGAGTGAAACTTTATGGTGTAGTTGTTAAGTCTCAAATTCAGAGAGACTTAGGATCAAATCTCACTCTGCTACTTTCTAGCTATGTGACCTTGGGAAAGCCACATGGTGCCTTGAAGACTCAGTCTCCTTAACTATATTATAAGAATAATAATATTCCCTATGCCAAAGGGATCCTGTGAGATAATAACATCTTAATTGAGTTAAATTATTTAAGAGTTAAATGAGATAATGGATAAAAATCATGGCACATTTTGAGCACTTCATAAATATTAATGATAACGATCCTTATTTAAACGTGCCCTGCATTCTAAAAATGAGAAGTAACTTTCTGGCTGAAACCAACCCCTGAATGGCAACAGAGAAAGCTGTTTCAACAGGGTTGAGAAAAAAGCTGGGGGATAAAGTAATGTTTCTAATCTTAGAGTTTAAGAGAAAATACATTTTTTAATTCACTTGGTAAATTAGAGATCTTTTAGGGACACCAGAAGAAGGCACTTTCTGAAAGAGTTAAAATGATTTCCTTAGAGTAAACAAATCTCTCTCATAGAATTTTTGCTTAGACTAAGTTGATGGGACATTCATTAAGAAATAAACTTTTCATCCTCGCTTGGGTAATGCAACCAGGGAACGAGTAAATATCCCGGGAAAGCCAACTTGCTATATGCAGGTACTATTTCTTAAAAATGTTATTTTTATCTATCAAAATAATATTACTGTTATTAAGTATCATTGAGGTTCAATCCTGCGACAGAAACTGTACTTAGCTATAGGGAATCAAATATGATTGTGACATAGTTCTACCCTCAGGGGTTTTAAGTGGGAAGATAGAATATGCCATTAAAAAAAAAGTAATCCTTGGCATGGAAGGTTAAATGCCTTATAACTAACTGATGATTGATAGCAGAAGAGTGACTAATTCTCATCTAGAAAGAGAAGGCCTGGGCTCTAGTTTTGGTTCCACCACTTGTCAAGTTTGTAACCTAGGGAAATTCACTTCAATCCTTTGAACTTTCAGTTTTTCAAAGGAAATGGAGATGACGATATTTGCCCTACCATTCCCATAAGGTTGCTGTGAGGTTCAAATGAGCTAAGGTTTACGAAAACACATAATAAATTACAGCACTTCGGTGCTATTCCTTGGTGTGATCATTTTCCTTCCTCTGCCTCCTCATAGACTGAGACTCTCATAAACTGTTTTATTTTCTGTCTCAGCTTATGAAATATCTGCAAGTTATATCATTATGTGTGTGTGTGTATTGTGTGCACATTATCAAGTCTAATCAAGCCAAAGCAGCAGAACTAAACACAGATATCTGGACTCCTAAAAATCCACCACTTAATCGTGAAGACAACATTGTTAGAGAAGAAAAGATATTCTCTAAGGTTGGACCTATTTCAGAAATGAGTAGCATCACCCTTGCTTTACAATGGAGAAAACTGAGTATTGATTTATTGAACACTTATTTAATAAAGGTTTATGAAGAACCCATCCTGCACCAGGGGCCCAGGTACCAACTTAAAGAATGTGAGTGAGAAAAACAGGGAACTCAGTCCTGGCATTGACCTTTGCTGTAACTTCTGCTCATTGTAGGAATCAGCCAACTTCCTGTCCTTTAGTTTCCTCTTCTGCAAACTGAAGATTAGTTAGTTGTAGAGCATACAGTCAGTGTTATGTCTGAAAATATTGAAATACAGAGACAAAGTGAAAAAGAAGGGTATGAAACCCCTTTCCATTAGACTGTAAGAGGGATGATGATTGTTACTTTTGGGAGTTATGAGCGTGGGCAGTGGAGAGAGTGGTTTGTTTGAGGATGCCACGCTGAGCATTGGGTGGATGTGGAATTTGTGTGGGCAGGGAAGTAGAGAAGAGAGTTGGGGCAAGCTAAGACTGCCAGCTTCCAGACTGGAAGCTTCTGCGGTAGTTACGGGGAATGAGTCAGGAAATAGTTCTGTGTAAATAGTTATGAAATTTTAAAGCTAATTTTGTCATGGGCCAAAGGCATTTTTTGGGGATGATGAGAGATATCAAATTTTGTGGATGCGCCTACAAGTAGGTGATGGTTCTACACTGAAAGATTTGCCACTTTTCTTCACCCTAGAATGTTCATATTGTGCGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTATGGTTTCTTAGTGGACTGTGAGATATATTAAACATAGATAAAAGGAATATTTAACTAAAAGAGAAGCAACAGAAAGTTAATCAAATAGTATCCAAGACAGGACGGAAATGGGCTTTAGGGGAGTCCTGAGAGAAAGAGAACTCACATTCATTGAGTTCGTGTGAATTGTTTCTGGGCCCCGGGCACTGTCATATCCATGAAATAACCTTATTCTTGTCTTGAAAAGCTGTTCTCATACAGATCTGAAAACTAAGGCCCAGAGACAGTAAGCAGCTTCTGGGAATGACTATGTTGTTGAGCTCAGGTTTGAGCTATGGAGGGTATGAAGTTATTTCCTCTTAGCAACTCCATCACAGACTCAACATGCTGGGCAAACTCACTTTATCTTTAAAGAACAGTCTCTATTTGCAAAGGAGAGAACCTGCTTCCATACACTTGGGACTGTTAGAGTTGTCAGACGATGTTACCAAAGCAAAGGCACTTGAACTTAGGCCAAGGTATATGTTTCTGTAGTCACCCTGTGGTAACTACTGGGGTCAGCATTTCACAAAACCTACTTACCCTGTTTAGTTAGGAAAACCCTAGAGGTGGGGGAGTGGGAGTGAGGGTCCCCAGTCCCACTGTCATTTGGAAAAATGTCCAGATGAGAGTAGGCTGTCCACTTCCTAGAGGCAAATCTTTCTGAATCTACATAGTTTCACAGACTCACAGAACTTCAGAGCTGAAGAGACCTTCAGATAGATATTTTTCAGATAGACCTTCAGATAGACATTTTGCCGCACTGCTCAGTCTAGGTTAACGGGAAGCTAGGGCAAGAATTCACTTATGGCCCTCCCTTCTTCCTGTATTCAGTATTTTCCTGTCTGTAACATTGGGTCCATGATTAAGCTATTTAACCAGTTTCTGAATTTGTAATTTATGAAGCCAGGAAAAGGGCATTTATCACTTGAATCATCCCAGCAGCCTGTGTCAGAGTTAAGGAGGGAATTATTTTTTTTTCTAAAAATTCTGTTCTAGGCTATTTAAGGTCACTCTACTTGCCTCTTCTGGAGAGACTCGTACATGCGTTGCTGATCCCTGGGCTGAGTTCTCCCAGCCCTAGTGAACTCGGAAGTACAGGTCCAGAAGGTTCTGCTTGATGGTTCCCATCAGGGTAAAACTGAAAATAGGAAGCCGTTGGTTGCTGATTGTAAGATAAATTTGTTTAAGTAGTGTGCCAAAAGCAGTGGGTCATATGAAAAGCCACATGACCAACCAGAAATAATTGGAGCTTAAAAGATGCTAGGGTCTATGAGTAAGATTTCTTTCACCATGGGATTTAGGTAAGGCAAACTCACCCACTCACTAGTTCTTAATTCCCATTTTCTTTTTGTCCTGGAACATTTCACCTGCCCTGATGCGGCAAATTAAGTGATTGAATTAATACAGAAATGTCAGCCTTTATTGATGACAATTAGGTGTTCATATTATTTCTGTTTTATTAATAATTTATTTACCTATTCAACAAATCTTTAAAGCCTACTGTGTGCTAGATGTGGAGGAAGAAACAAGTAACACTTCCTCCGTGACAGTTTTTCTAATCCCTCTAGTGTAAATTCTCTCTCCCTTTCCTGAAACTTAGTAGTTCTTTGTTTATAGTTCTCCAATAGATTTATGCCATGTTGCCTTGTATTGTAGCAGCTTGAGAACATGTCTTACTATTTAGAACTAAGACAATTGCTTTACAAGTATTTGTCTGTACCATGATATTTAAAGTAGTGCTGGCACAGAGTATGTTGTCAGTGTTGTGGAATAAATGACTAAATGAATATTTGTTGAATTAGGTAAGAAGTTGCTTCAGCTTTGGCTGTTATGCTGCTGTAACAAACAGCTCCCAAATTTCAATAGCTCAGAACACAATGATTTATTTCTCATCTATGTTAATGCCCATAGTGAGTTAGGTGCAGCTCTGCTCCCCATCTTCTGGATTTGGGGATCTGGGTAGAAATAGCCATTAGTTGGGATTTTCTTGTGTTGGGGAACAAGAGAGATGGCAGAAACACATGATAGATCAGAAGTGGCATTCATTGGCTGGGCACGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCATAGGCAGGTGGATCACCTGAGCTCAGGAGCCCAAGATCAGCCTGGCCAACAATGGTGAAACCCCATCTCTACTAAAAATACAAAAATTAGCCAAGCACGGTGGCAGGCACCTGTATCTCAGCTACTTGGAAGGCTGAGGCAAGAGAATTGCTTGAACCCGGGAGGTGGAGGTTGCAGTGAGCTAAGATTGCGCTACCACCCTCCACCTGAGCAGCAGAGCGAGACTCTGTCAAAAAACAAACAAACAAACAAACAACATCACTTCTGCTCAAATTTCGTTGGCCCAAACTAGTCATGTAGCCACGCCTGCCGTGGAGGGCAGACAAGGATAATTCTCCCATGAGAAAGGCCATGAATCTTTGGGAATAATAATATAATTTACCAGAGAAGTCATCCTTATTTTTTAAAGAACTTAAAATTTAGTTGAGGAAGTAAGCTATACACAAAGAAATACAATAAAAAAAAGGTGCAAGCAACATGTTATAGAGGTGAGGGAGGAGAGATTTCTTTGGACTAAGATTAGTCACAGAAGGATTAATAAAAGATGTGTTCTTTAAATTGGACATGAAAAGTAAGATTTTGCCAAGTGGAACTGGACAAGAGGTGAATAGAAGAGTATTTAAAAAGATATGAAGGTACTCAAACAAAAAATGTACTAAAAAAAAGAGTGAAAAGTCCACTTTTGGTGGATAATTAGGTCCACATTTCAAAGTTGGGAATTTAGAGTCTATTAAGCAGGAAATTATAAACCACTAGAGATTTGGAAAGCTAACTAAAGGATGCAATGGAGAGAAGCTGAAAATATTTTTGAGGCTATGCAAAGAGTTCAGGAAACAGGGACTAAAGACAGAATCAGAATAGTGAAAAGTATGAACAGGACAGAACATACAGAGGCAAGATGCAAAGGAAATGTACAAAGGTTGAAAACCGATTGGTTTGGAAAGCAAAGGAGAGAGGCAGTGAAAGAAGTTGCAGATGATTATTCCATTAATGGTGGTGCCATTAATGGAATTCAAAAAATAAGAAGAGGACTGACTCATAGGAAGAGAAAATAAGTTTTGTTTGAGGTATTCTGATTTCGAGGAATTTCAGAGAGAAATGTTTAGTAGGCGTATGGAACTCTGGGAATAGAGTTTGTGGGATTGTGGTTGTGATTGAAGATGTAGTCCTGAGGGACCCCTGAAGAGGTGACAGTTGAAGCCATGAGTGCAGATGAGAATCCCAAAGGAAACTAGTGGCCAAAAGGCAGAGTCTTGGAGGGCTGCCAACATGTAGGATGTGGGAAGATGAAGACAAACCAGGGAGGGAAGCTGAAGAACCTTGACAAGGCAGAGAGGAGAACACTATAGTGTGGGATCAAGTGAGCTGAGGCAGGAGAGAGGCTGAGGAGCAGGGAGAGGTCAGCGGTGTCAAATGCTTTAGAAAGTGCTAAGAAGATGAGAATGTAGGAAGTGGTATTGAGGTTAGAGTAGGAGATCATTGGCGATGAGTAAGGAAACAACTTCAGTGAGGACTGGAGATGTTCTTGTGAGATATCTGATAACAAAAATTACAGAGATTGCATAATGGAGGATTAGTTGGAACTGGTGGAACTGAGAGTACGCTTAGTGCGATAACCTTTGAAAAGAAGAGGAACCTATTCCATTTGGGGAAGGCAGGAGAAAACTATGCACTAAGAGAGAACTTGTCCATGAGAAGGAGTGATTTTTAAGGTGCTTCTTAACAAAGTAGAGTTTAGGGAATGTATTCACTCTTTGAAATTAAAAAGCAATTGCTTATTATTGAAAACCCAGGTTAGCTATTAAAAAAAAAAAAAGAGAAAAATAAGACAAAAAAAGAAAAAAAAACCATGCATGTGTAACAAGTCAGGGGAAGCTGAGGAGACCTTCCAAACTGTACTGTATTCACTTGCATATATTCCACATCTGGCACTGGGCAGTCAAATATTCACAGGTAATAAATAGATATTAAAGAATGTATTATTGGGCATTAGGACTCATAATTTTAGAAAAATGTTTTTTGTGGCTGGGCGTGGTGGCTCACTCCTGTAATCCCAGCACTTTGGGAGGCCAAGGAGAGTGGATCAGAAGGTCAGGAGATCGACAGCATCCTGGCCAACATGGTGAAACCCCGT'

In [8]:
ref_token_id = tokenizer.pad_token_id # A token used for generating token reference
sep_token_id = tokenizer.sep_token_id # A token used as a separator between question and text and it is also added to the end of the text.
cls_token_id = tokenizer.cls_token_id # A token used for prepending to the concatenated question-text word sequence

lig = LayerIntegratedGradients(custom_forward, model.bert.embeddings)

input_ids, ref_input_ids, sep_id = construct_input_ref_pair(text, ref_token_id, sep_token_id, cls_token_id)
token_type_ids, ref_token_type_ids = construct_input_ref_token_type_pair(input_ids, sep_id)
position_ids, ref_position_ids = construct_input_ref_pos_id_pair(input_ids)
attention_mask = construct_attention_mask(input_ids)

indices = input_ids[0].detach().tolist()
all_tokens = tokenizer.convert_ids_to_tokens(indices)

In [9]:
predict(input_ids)

tensor([[-0.1817,  0.0391]], grad_fn=<AddmmBackward0>)

In [10]:
torch.cuda.empty_cache()
custom_forward(input_ids)

tensor([0.5550], grad_fn=<UnsqueezeBackward0>)

In [11]:
attributions, delta = lig.attribute(inputs=input_ids,
                                    baselines=ref_input_ids,
                                    n_steps=700,
                                    internal_batch_size=1,
                                    return_convergence_delta=True)

score = predict(input_ids)

print('Sentence: ', text)
print('Sentiment: ' + str(torch.argmax(score[0]).cpu().numpy()) + \
      ', Probability positive: ' + str(torch.softmax(score, dim = 1)[0][1].cpu().detach().numpy()))

attributions_sum = summarize_attributions(attributions)

# storing couple samples in an array for visualization purposes
score_vis = viz.VisualizationDataRecord(attributions_sum,
                                        torch.softmax(score, dim = 1)[0][1],
                                        torch.argmax(torch.softmax(score, dim = 0)[0]),
                                        1,
                                        text,
                                        attributions_sum.sum(),
                                        all_tokens,
                                        delta)

Sentence:  AGCTACTTGGGAGGTTGAGGCAGGAGAATCACTTGAACCAGAAGGCAGAGGTTGCAGTGGGCCGAGATCACGTCATTGCACCCCAGCCTGGGCAACAAGAGGGAAACTCTGTCTCAAAAGAAAAAAAAAATTAACACAGGTAAAAAGCTTAGATCAGTGCTGAGCACAATATAAACCCATTAGTGGCTAAACCATCAACAAGTGTTGGGAGCTGCTGCTATTTTTACTTTCCCTAGAATTCTATCTCTTACCTTTCACTCTTCTCACTGCCCTTATTTGCCCAGAAATCCCTTTATGTCCTGAAAAACTCAACTCTCATATTTTACTTTTAGGAAATTATCAGTTACTGCTCTAACACAGTTCTTGATGTATGCTCTTCACTCCCTGACCTTTTGCTTTGTTGATACTTTATTATTGTACTTACGACTCCATACTTAAAAAATATAATTGGTAAAAAAAAATGTAACTAGTAATAGGCAGAAAAACTGGAATTGATTCCCAGTGCCTGTTACATGACAGGGGCTCATTATATACTTGCTGAGTGAATGATGGAAGGTCAAGTGAACAAATTAGAGAAATCAGGCAGAAAATATTTCCAGGTATCTTGGGGAGTTGAGAATTAGAGAAGAAAAGAATGAAGGAGGTTGGGATTTGATGAAGAACATATTTGTGACAGTGAAACTCAGTCGTGGGATTTGCTGTTTATATTGTTTTCTTTCCTTCTCAAATCAACATGAGTTGTACAGACCATAATAAAAGCTTCATCTTGAGCCTGTTATTGCATCACCATTTGGCTGATGTTTCACTGCTCCATCACTGTGGGAGGTTAACACTCACTGAGGGGTGGCAGTACCCTCTGCATTTCTCTGGGAAACTCCAATGATTCATCCAAAAGTGTGAGAAGCCAAGCAGCTTTTATCACCCAGGAGACAGCTGTAACCTGACCTCAATTCATGCCAAAGAAGCCTGAGGAAAGTGCCCTGGAAGTG

In [12]:
print('\033[1m', 'Visualization For Score', '\033[0m')
viz.visualize_text([score_vis])

[1m Visualization For Score [0m


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
1.0,0 (0.55),AGCTACTTGGGAGGTTGAGGCAGGAGAATCACTTGAACCAGAAGGCAGAGGTTGCAGTGGGCCGAGATCACGTCATTGCACCCCAGCCTGGGCAACAAGAGGGAAACTCTGTCTCAAAAGAAAAAAAAAATTAACACAGGTAAAAAGCTTAGATCAGTGCTGAGCACAATATAAACCCATTAGTGGCTAAACCATCAACAAGTGTTGGGAGCTGCTGCTATTTTTACTTTCCCTAGAATTCTATCTCTTACCTTTCACTCTTCTCACTGCCCTTATTTGCCCAGAAATCCCTTTATGTCCTGAAAAACTCAACTCTCATATTTTACTTTTAGGAAATTATCAGTTACTGCTCTAACACAGTTCTTGATGTATGCTCTTCACTCCCTGACCTTTTGCTTTGTTGATACTTTATTATTGTACTTACGACTCCATACTTAAAAAATATAATTGGTAAAAAAAAATGTAACTAGTAATAGGCAGAAAAACTGGAATTGATTCCCAGTGCCTGTTACATGACAGGGGCTCATTATATACTTGCTGAGTGAATGATGGAAGGTCAAGTGAACAAATTAGAGAAATCAGGCAGAAAATATTTCCAGGTATCTTGGGGAGTTGAGAATTAGAGAAGAAAAGAATGAAGGAGGTTGGGATTTGATGAAGAACATATTTGTGACAGTGAAACTCAGTCGTGGGATTTGCTGTTTATATTGTTTTCTTTCCTTCTCAAATCAACATGAGTTGTACAGACCATAATAAAAGCTTCATCTTGAGCCTGTTATTGCATCACCATTTGGCTGATGTTTCACTGCTCCATCACTGTGGGAGGTTAACACTCACTGAGGGGTGGCAGTACCCTCTGCATTTCTCTGGGAAACTCCAATGATTCATCCAAAAGTGTGAGAAGCCAAGCAGCTTTTATCACCCAGGAGACAGCTGTAACCTGACCTCAATTCATGCCAAAGAAGCCTGAGGAAAGTGCCCTGGAAGTGAACAGCCTGCTCATGACTCAAGGAACTCAAAAGTCAGAGTTCTGACCAGTATTGTTGGGGTGGGTAAAAGAACTTCACTCCCTCAGATCTGAAAGTGTCCTTGCCAGAGGAGAGGGAGACCTTATTTCAAGTGTGTTTGAATAAACATGACATACATAAACTTGATTTTCCAGGTTTTGGAGAAAGCATACATTTGTCCTCTGCATCATGAAATAATGTCCTTGGTGGCTCCTTTCAGGGCCTGTGCTGCACTCTCCTTAGTGACTATTAGCATTGGAGTTGGACAATTTAAGGGCAGGAGTGGAGACCTGCTACTTATAAAGGATGACTACACTTATTTAGGGATACTGCTCACGCTGACTCTCAGAGCAATTCTTTTGTTCCAACAGCTGTTCCCAGGGTAGGGTAATATTGGAACAGAGGCTTATGCTGCAGTATCCATTGAGTGGGACTGAGGCCCCTTCAGTAGCTGAAAATCCCCACTTCAGTGCTACTGCTTCAGCTACTGCAGCTCTTACTGTCTTCAAAAACAATGGTAAGGATTCCTTTAACCTCAGAGGAGGAATTAGCTTTTTGCAGAGACTACAAAGAATCCATAGGATACAAACATTTCTATAGTCCAGGAAGGAGTCCCACATATAAAAACAAAACTGTAATATATTTTATAAGTGATTTGCCTAAATATGTGAGGCTGTATTCACTCAGTTTCTCAAGAAGCATTTCTTGAGAAGCTACTGTGTGCCAGAGCCTCCTTAGGGGGCAGGAACTGCTTATTTATCTTCATATCAACATCCCTAGGTAAGTGCCTAGCCCATCGTATGGGCTACAGACTATGCAATGCTATTTCCCTTAGCCCCACCAGAGTTCAGGGTCAGACTGATGGGCAGGACTATGAACAGATCTTCTTTCTCTCCTTGAAGGTAACTAACCTTCCATGGGACTTGAAGCTTCAGATTTTGGCCTTAACCAAGTCAACTAGCTCAAGTCAGAGGGGCAGTGATTATTTGAATTGCCAAGGTATTACCTAATGAGAATCTTTGTGACTAAGCTCTTAAAGTTGAAACTTAAGTAACATTAGCTGAAAAACTTGTTGGATAAACATTGCTACTCCCTTGAAAATTCCGGGAGTTCCAGTTTGGTTGCTGACCATTTTTTACCATTTATCTATTTGTTTAGCACTAACGTTTCTTAAGCTTCCAATGTATATAGAATGCTATGCTGGGTTGTGGGAAATACAATGAGCTATGCTCCCTGTCTGCAAGTCGGTCACATTTTAAGTGGGGGTGCAATAAATGACAGATTCAAACCACTGAACAATTATTAACAGAGAAAAGCAACTTTTATGGGCAAAGGCTTTCGGCAACTCCAGGCACAGTCTCACCCAAGGCCTTGATTGTGGCACTGCTTCTGTCACAGAGAATAAGAGTGAAATGTTAGAAGACTGTTGAAACACTGCGGAGTTAATGTTATGTTCCTTTTCATCTTTGGGTCTTTGTACATGCTGGTTCCTTGTCTTCCCACCACTACCCCTATATCATTTATCTAATTAAAACTCATAAACATGAATGAGAAGCCCTTTTTGACCACCAGCCTACAAACAGACACACAGACACACACACACACACACACACACACACACACACACACACTGCGTTGTCCTTCCATTGAGGTACCAACAGCACACTATAATTTCTCCATTATGATAGCATTTATTACAAGGTATTATGATTTCTGTTTAACTTCTCTGTATCCCTCCTGCCTGCTACATTGTAACTTCTGTGACTGCAGGGATATATCTGTTTTGTTCACCATTATATTGGCTAGCATGTAGCAGCCATTCAATAAATACTTGCTGAATGCATGAATGAACGGCTGAATGGCAGAACCAACATTTGAGTAAAATTTTCGTGTATTGTTTACTTTGTGCTATAACTTCCTAGGTATTTTATGGATCTTCTTTCTGTGGGGTTATATATAGTATAAATTTGTTGCAATATTATATTCTTTTTAAATGCCTCAGTCACTTGTTAAATTTAGTGCTTGTTGCAGAAGGGTATAATGTTACTGATAGGAAAGCCATAGTCTTGATCCCTATATCGAGGCCAAATGGCTTCTTATCTGGAAATCTCTGCCTTAAATTGAGCAGTATCTAGATTAGATGTTTTGAAACTATGTATCACTCACTATGGTGGGCAAATAGTTCAGACAGACTAGGAGACGGGATATGAGAAACTTAGAATAAGCTACAAGAAGAATTCTAAAGACACATGACCCATTAAATTCCTTTTTCATTGAAAATCAGACCAAAATCTGTGGCAAAAACAGAAAACGTATTCCGGAAATATGGCTGTAGAACTGAAGACTAAATAGCAAGCAGTGTTTAATCTGAAGTAATGAATGTTATTTCAAGGAGCAAAGAAGCTAACACTTGCAATAAATCTTTGTTTTGAAGTATCTTTCTCAAAGGTCATCAAAATAAGTTTTAATTTAGATTCCTAAATCCAGTTTCTGCTCTGTTAGTTATTGGGGATTTTTTGAATAAATAATCTACGCAGAACTGTGGACTCTGCTCTGCTTTTTCAACCCCATGGTGTGGTCATCCAGAAAGGATTTCTTCTCCGCTCTAGGCTTAGAAATGGGGTACCTCCTGCCTGATGTATCCTATGCTTTCCAGAACCTGAAAGATTAAGATGAATCATTACAAGTGAAATGACCCTAGACAGAGAACAAAGAGGGCTGGCACATGTTTGCTGTAACATTCCGGGAGAGCTCTTCATCCCGTTTACATGTTCTTGAGAGGGTGCCTTCCGTGCTGTGATGAATGAGCCACCCAGACCTCCCGCTACCACACAGCAATTGTTTAGTCAGAGATCCTGTGCATCTGGGTCTTTTTTTTAATCAGCAGGTTCTAAATAAAAAACAAAAAACAATAACAAGCCCACCCTCTCTGAATATGACTCTCTGACTCTCTTGTGTTTCTTGTTTACATTTTATTGTGCGAATGTGATTCTGCTTCTTAGCCTAGTGCATTTGGATTTGTTGTTCACACTGAGCATAAATTGCCAAACACTCAACTTTAATCTAATTGTACATACTATAAACAGAAAATGTTGACGTTAAAAGCATTTCCATAATCACAGATTGGGTGTATGGATGAGCAAGTGGATGAGTTAGGCCTTTTGTCATCTCAGTCCATAGCTTGATCCTTCAGGTATTCAAAAGGAAACGGGGACTGTCTTCCACTGATGACCTCACTGATGATGAGGTTCATCTGCCACCATCTATAGTGAGTGAAACTTTATGGTGTAGTTGTTAAGTCTCAAATTCAGAGAGACTTAGGATCAAATCTCACTCTGCTACTTTCTAGCTATGTGACCTTGGGAAAGCCACATGGTGCCTTGAAGACTCAGTCTCCTTAACTATATTATAAGAATAATAATATTCCCTATGCCAAAGGGATCCTGTGAGATAATAACATCTTAATTGAGTTAAATTATTTAAGAGTTAAATGAGATAATGGATAAAAATCATGGCACATTTTGAGCACTTCATAAATATTAATGATAACGATCCTTATTTAAACGTGCCCTGCATTCTAAAAATGAGAAGTAACTTTCTGGCTGAAACCAACCCCTGAATGGCAACAGAGAAAGCTGTTTCAACAGGGTTGAGAAAAAAGCTGGGGGATAAAGTAATGTTTCTAATCTTAGAGTTTAAGAGAAAATACATTTTTTAATTCACTTGGTAAATTAGAGATCTTTTAGGGACACCAGAAGAAGGCACTTTCTGAAAGAGTTAAAATGATTTCCTTAGAGTAAACAAATCTCTCTCATAGAATTTTTGCTTAGACTAAGTTGATGGGACATTCATTAAGAAATAAACTTTTCATCCTCGCTTGGGTAATGCAACCAGGGAACGAGTAAATATCCCGGGAAAGCCAACTTGCTATATGCAGGTACTATTTCTTAAAAATGTTATTTTTATCTATCAAAATAATATTACTGTTATTAAGTATCATTGAGGTTCAATCCTGCGACAGAAACTGTACTTAGCTATAGGGAATCAAATATGATTGTGACATAGTTCTACCCTCAGGGGTTTTAAGTGGGAAGATAGAATATGCCATTAAAAAAAAAGTAATCCTTGGCATGGAAGGTTAAATGCCTTATAACTAACTGATGATTGATAGCAGAAGAGTGACTAATTCTCATCTAGAAAGAGAAGGCCTGGGCTCTAGTTTTGGTTCCACCACTTGTCAAGTTTGTAACCTAGGGAAATTCACTTCAATCCTTTGAACTTTCAGTTTTTCAAAGGAAATGGAGATGACGATATTTGCCCTACCATTCCCATAAGGTTGCTGTGAGGTTCAAATGAGCTAAGGTTTACGAAAACACATAATAAATTACAGCACTTCGGTGCTATTCCTTGGTGTGATCATTTTCCTTCCTCTGCCTCCTCATAGACTGAGACTCTCATAAACTGTTTTATTTTCTGTCTCAGCTTATGAAATATCTGCAAGTTATATCATTATGTGTGTGTGTGTATTGTGTGCACATTATCAAGTCTAATCAAGCCAAAGCAGCAGAACTAAACACAGATATCTGGACTCCTAAAAATCCACCACTTAATCGTGAAGACAACATTGTTAGAGAAGAAAAGATATTCTCTAAGGTTGGACCTATTTCAGAAATGAGTAGCATCACCCTTGCTTTACAATGGAGAAAACTGAGTATTGATTTATTGAACACTTATTTAATAAAGGTTTATGAAGAACCCATCCTGCACCAGGGGCCCAGGTACCAACTTAAAGAATGTGAGTGAGAAAAACAGGGAACTCAGTCCTGGCATTGACCTTTGCTGTAACTTCTGCTCATTGTAGGAATCAGCCAACTTCCTGTCCTTTAGTTTCCTCTTCTGCAAACTGAAGATTAGTTAGTTGTAGAGCATACAGTCAGTGTTATGTCTGAAAATATTGAAATACAGAGACAAAGTGAAAAAGAAGGGTATGAAACCCCTTTCCATTAGACTGTAAGAGGGATGATGATTGTTACTTTTGGGAGTTATGAGCGTGGGCAGTGGAGAGAGTGGTTTGTTTGAGGATGCCACGCTGAGCATTGGGTGGATGTGGAATTTGTGTGGGCAGGGAAGTAGAGAAGAGAGTTGGGGCAAGCTAAGACTGCCAGCTTCCAGACTGGAAGCTTCTGCGGTAGTTACGGGGAATGAGTCAGGAAATAGTTCTGTGTAAATAGTTATGAAATTTTAAAGCTAATTTTGTCATGGGCCAAAGGCATTTTTTGGGGATGATGAGAGATATCAAATTTTGTGGATGCGCCTACAAGTAGGTGATGGTTCTACACTGAAAGATTTGCCACTTTTCTTCACCCTAGAATGTTCATATTGTGCGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTATGGTTTCTTAGTGGACTGTGAGATATATTAAACATAGATAAAAGGAATATTTAACTAAAAGAGAAGCAACAGAAAGTTAATCAAATAGTATCCAAGACAGGACGGAAATGGGCTTTAGGGGAGTCCTGAGAGAAAGAGAACTCACATTCATTGAGTTCGTGTGAATTGTTTCTGGGCCCCGGGCACTGTCATATCCATGAAATAACCTTATTCTTGTCTTGAAAAGCTGTTCTCATACAGATCTGAAAACTAAGGCCCAGAGACAGTAAGCAGCTTCTGGGAATGACTATGTTGTTGAGCTCAGGTTTGAGCTATGGAGGGTATGAAGTTATTTCCTCTTAGCAACTCCATCACAGACTCAACATGCTGGGCAAACTCACTTTATCTTTAAAGAACAGTCTCTATTTGCAAAGGAGAGAACCTGCTTCCATACACTTGGGACTGTTAGAGTTGTCAGACGATGTTACCAAAGCAAAGGCACTTGAACTTAGGCCAAGGTATATGTTTCTGTAGTCACCCTGTGGTAACTACTGGGGTCAGCATTTCACAAAACCTACTTACCCTGTTTAGTTAGGAAAACCCTAGAGGTGGGGGAGTGGGAGTGAGGGTCCCCAGTCCCACTGTCATTTGGAAAAATGTCCAGATGAGAGTAGGCTGTCCACTTCCTAGAGGCAAATCTTTCTGAATCTACATAGTTTCACAGACTCACAGAACTTCAGAGCTGAAGAGACCTTCAGATAGATATTTTTCAGATAGACCTTCAGATAGACATTTTGCCGCACTGCTCAGTCTAGGTTAACGGGAAGCTAGGGCAAGAATTCACTTATGGCCCTCCCTTCTTCCTGTATTCAGTATTTTCCTGTCTGTAACATTGGGTCCATGATTAAGCTATTTAACCAGTTTCTGAATTTGTAATTTATGAAGCCAGGAAAAGGGCATTTATCACTTGAATCATCCCAGCAGCCTGTGTCAGAGTTAAGGAGGGAATTATTTTTTTTTCTAAAAATTCTGTTCTAGGCTATTTAAGGTCACTCTACTTGCCTCTTCTGGAGAGACTCGTACATGCGTTGCTGATCCCTGGGCTGAGTTCTCCCAGCCCTAGTGAACTCGGAAGTACAGGTCCAGAAGGTTCTGCTTGATGGTTCCCATCAGGGTAAAACTGAAAATAGGAAGCCGTTGGTTGCTGATTGTAAGATAAATTTGTTTAAGTAGTGTGCCAAAAGCAGTGGGTCATATGAAAAGCCACATGACCAACCAGAAATAATTGGAGCTTAAAAGATGCTAGGGTCTATGAGTAAGATTTCTTTCACCATGGGATTTAGGTAAGGCAAACTCACCCACTCACTAGTTCTTAATTCCCATTTTCTTTTTGTCCTGGAACATTTCACCTGCCCTGATGCGGCAAATTAAGTGATTGAATTAATACAGAAATGTCAGCCTTTATTGATGACAATTAGGTGTTCATATTATTTCTGTTTTATTAATAATTTATTTACCTATTCAACAAATCTTTAAAGCCTACTGTGTGCTAGATGTGGAGGAAGAAACAAGTAACACTTCCTCCGTGACAGTTTTTCTAATCCCTCTAGTGTAAATTCTCTCTCCCTTTCCTGAAACTTAGTAGTTCTTTGTTTATAGTTCTCCAATAGATTTATGCCATGTTGCCTTGTATTGTAGCAGCTTGAGAACATGTCTTACTATTTAGAACTAAGACAATTGCTTTACAAGTATTTGTCTGTACCATGATATTTAAAGTAGTGCTGGCACAGAGTATGTTGTCAGTGTTGTGGAATAAATGACTAAATGAATATTTGTTGAATTAGGTAAGAAGTTGCTTCAGCTTTGGCTGTTATGCTGCTGTAACAAACAGCTCCCAAATTTCAATAGCTCAGAACACAATGATTTATTTCTCATCTATGTTAATGCCCATAGTGAGTTAGGTGCAGCTCTGCTCCCCATCTTCTGGATTTGGGGATCTGGGTAGAAATAGCCATTAGTTGGGATTTTCTTGTGTTGGGGAACAAGAGAGATGGCAGAAACACATGATAGATCAGAAGTGGCATTCATTGGCTGGGCACGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCATAGGCAGGTGGATCACCTGAGCTCAGGAGCCCAAGATCAGCCTGGCCAACAATGGTGAAACCCCATCTCTACTAAAAATACAAAAATTAGCCAAGCACGGTGGCAGGCACCTGTATCTCAGCTACTTGGAAGGCTGAGGCAAGAGAATTGCTTGAACCCGGGAGGTGGAGGTTGCAGTGAGCTAAGATTGCGCTACCACCCTCCACCTGAGCAGCAGAGCGAGACTCTGTCAAAAAACAAACAAACAAACAAACAACATCACTTCTGCTCAAATTTCGTTGGCCCAAACTAGTCATGTAGCCACGCCTGCCGTGGAGGGCAGACAAGGATAATTCTCCCATGAGAAAGGCCATGAATCTTTGGGAATAATAATATAATTTACCAGAGAAGTCATCCTTATTTTTTAAAGAACTTAAAATTTAGTTGAGGAAGTAAGCTATACACAAAGAAATACAATAAAAAAAAGGTGCAAGCAACATGTTATAGAGGTGAGGGAGGAGAGATTTCTTTGGACTAAGATTAGTCACAGAAGGATTAATAAAAGATGTGTTCTTTAAATTGGACATGAAAAGTAAGATTTTGCCAAGTGGAACTGGACAAGAGGTGAATAGAAGAGTATTTAAAAAGATATGAAGGTACTCAAACAAAAAATGTACTAAAAAAAAGAGTGAAAAGTCCACTTTTGGTGGATAATTAGGTCCACATTTCAAAGTTGGGAATTTAGAGTCTATTAAGCAGGAAATTATAAACCACTAGAGATTTGGAAAGCTAACTAAAGGATGCAATGGAGAGAAGCTGAAAATATTTTTGAGGCTATGCAAAGAGTTCAGGAAACAGGGACTAAAGACAGAATCAGAATAGTGAAAAGTATGAACAGGACAGAACATACAGAGGCAAGATGCAAAGGAAATGTACAAAGGTTGAAAACCGATTGGTTTGGAAAGCAAAGGAGAGAGGCAGTGAAAGAAGTTGCAGATGATTATTCCATTAATGGTGGTGCCATTAATGGAATTCAAAAAATAAGAAGAGGACTGACTCATAGGAAGAGAAAATAAGTTTTGTTTGAGGTATTCTGATTTCGAGGAATTTCAGAGAGAAATGTTTAGTAGGCGTATGGAACTCTGGGAATAGAGTTTGTGGGATTGTGGTTGTGATTGAAGATGTAGTCCTGAGGGACCCCTGAAGAGGTGACAGTTGAAGCCATGAGTGCAGATGAGAATCCCAAAGGAAACTAGTGGCCAAAAGGCAGAGTCTTGGAGGGCTGCCAACATGTAGGATGTGGGAAGATGAAGACAAACCAGGGAGGGAAGCTGAAGAACCTTGACAAGGCAGAGAGGAGAACACTATAGTGTGGGATCAAGTGAGCTGAGGCAGGAGAGAGGCTGAGGAGCAGGGAGAGGTCAGCGGTGTCAAATGCTTTAGAAAGTGCTAAGAAGATGAGAATGTAGGAAGTGGTATTGAGGTTAGAGTAGGAGATCATTGGCGATGAGTAAGGAAACAACTTCAGTGAGGACTGGAGATGTTCTTGTGAGATATCTGATAACAAAAATTACAGAGATTGCATAATGGAGGATTAGTTGGAACTGGTGGAACTGAGAGTACGCTTAGTGCGATAACCTTTGAAAAGAAGAGGAACCTATTCCATTTGGGGAAGGCAGGAGAAAACTATGCACTAAGAGAGAACTTGTCCATGAGAAGGAGTGATTTTTAAGGTGCTTCTTAACAAAGTAGAGTTTAGGGAATGTATTCACTCTTTGAAATTAAAAAGCAATTGCTTATTATTGAAAACCCAGGTTAGCTATTAAAAAAAAAAAAAGAGAAAAATAAGACAAAAAAAGAAAAAAAAACCATGCATGTGTAACAAGTCAGGGGAAGCTGAGGAGACCTTCCAAACTGTACTGTATTCACTTGCATATATTCCACATCTGGCACTGGGCAGTCAAATATTCACAGGTAATAAATAGATATTAAAGAATGTATTATTGGGCATTAGGACTCATAATTTTAGAAAAATGTTTTTTGTGGCTGGGCGTGGTGGCTCACTCCTGTAATCCCAGCACTTTGGGAGGCCAAGGAGAGTGGATCAGAAGGTCAGGAGATCGACAGCATCCTGGCCAACATGGTGAAACCCCGT,2.37,[CLS] AGCTAC TTGGG AGGTTGAGGCAGGAGAA TCACTTGAACC AGAAGGC AGAGGTTGC AGTGGGCC G AGATCACG TCATTGC ACCCC AGCCTGGGCAACAAG AGGGAAAC TCTGTCTC AAAAGAAAAAAAA AATTAAC ACAGG TAAAAAGC TTAGATC AGTGC TGAGC ACAA TATAAACCC ATT AGTGGC TAAACC ATCAAC AAG TGTTGGG AGCTGCTGC TATTTTTAC TTTCCC TAGAATTC TATC TCTTACC TTTCACTC TTCTCAC TGCCC TTATT TGCCC AGAAATCCC TTTATG TCCTGAAAA ACTC AACTCTC ATATT TTACTTTT AGGAAATT ATC AGTTAC TGCTC TAACACAG TTCTTG ATGTATGC TCTTC ACTCCC TGACC TTTTGC TTTGTTG ATAC TTTATT ATTGTAC TTACG ACTCC ATACTTAAAA AATAT AATTGG TAAAAAA AAATGTAAC TAGTAA TAGGC AGAAAA ACTGG AATTG ATTCCC AGTGCC TGTTAC ATGAC AGGGGC TCATT ATAT ACTTGC TGAGTGAA TGATGG AAGGTCAAG TGAAC AAATT AGAGAA ATCAGGC AGAAAATATT TCCAGG TATC TTGGGG AGTTG AGAA TTAGAG AAGAAAAG AATG AAGGAGG TTGGG ATTTGATG AAGAAC ATATTTGTG ACAGTG AAAC TCAGTC GTGGG ATTTGC TGTTTAT ATTGTTTTC TTTCC TTCTC AAATC AACATG AGTTGTAC AGACC ATAATAA AAGCTTC ATCTTG AGCC TGTTATTGC ATCACC ATTTGGC TGATGTTTC ACTGC TCCATC ACTG TGGGAGG TTAAC ACTCAC TGAGGGG TGGC AGTACCC TCTGC ATTTCTC TGGG AAACTCC AATG ATTCATCC AAAAGTGTG AGAAGCC AAGC AGCTTTT ATCACCC AGGAGAC AGC TGTAACC TGACC TCAATTC ATGCC AAAGAAGCC TGAGG AAAGTGCCC TGGAAG TGAAC AGCCTGC TCATG ACTCAAGG AACTCAAAAG TCAGAG TTCTGACC AGTATTG TTGGGG TGGG TAAAAGAAC TTCACTCCC TCAGATC TGAAAG TGTCC TTGCC AGAGGAG AGGGAGACC TTATT TCAAG TGTGTTTG AATAAACATG ACATAC ATAAACTTG ATTTTCC AGGTTTTGG AGAAAGC ATACATTTG TCCTCTGC ATCATG AAATAA TGTCC TTGGTGGC TCCTTTC AGGGCC TGTGCTGC ACTCTCC TTAGTG ACTATT AGCATTGG AGTTGG ACAATTTAA GGGC AGGAGTGG AGACC TGCTAC TTATAA AGGATG ACTAC ACTTATT TAGGG ATACTGC TCACGC TGACTCTC AGAGC AATTC TTTTG TTCCAAC AGCTG TTCCCAGGG TAGGG TAA TATTGG AAC AGAGGC TTATGC TGC AGTATCC ATTG AGTGGG ACTG AGGCCCC TTCAGTAGC TGAAAA TCCCC ACTTC AGTGCTAC TGCTTC AGCTAC TGC AGCTC TTACTGTC TTCAAAA ACAATGG TAAGG ATTCC TTTAACC TCAG AGGAGG AATTAGC TTTTTGC AGAGACTAC AAAGAA TCC ATAGG ATACAAAC ATTTC TATAGTCC AGGAAGG AGTCCC ACATAT AAAAACAAAAC TGTAA TATATTTT ATAAG TGATTTGCC TAAATATG TGAGGC TGTATTC ACTCAG TTTCTCAAG AAGC ATTTCTTG AGAAGC TACTGTG TGCC AGAGCC TCC TTAGGG GGC AGGAAC TGCTTATT TATCTTC ATATCAAC ATCCC TAGG TAAGTGCC TAGCCC ATCG TATGGGC TACAGAC TATGC AATGC TATTTCCC TTAGCCCC ACCAGAG TTCAGGG TCAGAC TGATGGGC AGGAC TATGAAC AGATC TTCTTTC TCTCC TTGAAGG TAAC TAACC TTCC ATGGG ACTTG AAGCTTC AGATT TTGGCC TTAACC AAGTCAAC TAGC TCAAG TCAG AGGGGC AGTG ATTATT TGAATTGCC AAGGTATT ACCTAA TGAGAA TCTTTGTG ACTAAGC TCTTAAAG TTGAAAC TTAAGTAAC ATTAGC TGAAAA ACTTG TTGGATAA ACATTGC TACTCCC TTGAAAA TTCCGGG AGTTCC AGTTTGG TTGC TGACC ATTTTTT ACC ATTTATC TATT TGTTTAGC ACTAACG TTTC TTAAGC TTCCAATG TATATAGAA TGCTATGC TGGG TTGTGGG AAATAC AATGAGC TATGC TCCCTGTC TGCAAG TCGG TCAC ATTTTAAG TGGGGG TGC AATAAATG ACAGATTC AAACC ACTGAAC AATTATT AACAGAG AAAAGC AACTTTT ATGGGC AAAGGC TTTCGGC AACTCC AGGC ACAGTCTC ACCC AAGGCC TTGATTG TGGCACTGC TTCTGTCAC AGAGAA TAAG AGTGAA ATG TTAGAAG ACTGTTG AAACAC TGCGG AGTTAA TGTTATG TTCC TTTTCATC TTTGGG TCTTTG TAC ATGCTGG TTCC TTGTC TTCCC ACCAC TACCCC TATATC ATTTATC TAA TTAAAAC TCATAA ACATG AATG AGAAGCCC TTTT TGACC ACCAGCC TACAAAC AGACAC ACAG ACACACACACACACACACACACACACACACACACACACAC TGCG TTGTCC TTCCATTG AGGTACC AACAGC ACAC TATAATTTC TCC ATTATG ATAGC ATTTATT ACAAGG TATT ATGATT TCTG TTTAAC TTCTCTG TATCCC TCCTGCC TGCTAC ATTGTAAC TTCTGTG ACTGC AGGG ATATATC TGTTTTG TTCACC ATTATATT GGC TAGC ATGTAGC AGCCATTC AATAAATAC TTGCTGAA TGCATG AATGAAC GGC TGAATGGC AGAACC AACATT TGAG TAAAATTTTC GTG TATTG TTTAC TTTGTGC TATAAC TTCC TAGGTATT TTATGG ATCTTC TTTC TGTGGGG TTATAT ATAG TATAAATT TGTTGC AATATT ATATTC TTTTTAA ATGCC TCAG TCACTTG TTAA ATTTAG TGCTTG TTGC AGAAGGG TATAATG TTAC TGATAGG AAAGCC ATAGTC TTGATCCC TATATCG AGGCC AAATGGC TTCTTATC TGG AAATCTC TGCC TTAAATTG AGCAGTATC TAGATT AGATG TTTTGAAAC TATGTATC ACTCAC TATGG TGGGC AAATAG TTCAGAC AGACTAGG AGACGGG ATATG AGAA ACTTAGAA TAAGCTAC AAGAAG AATTCTAA AGACAC ATGACCC ATT AAATTCC TTTTTC ATTGAAAA TCAG ACCAAAA TCTGTGGC AAAAACAG AAAACG TATTCC GG AAATATGGC TGTAG AACTGAAG ACTAA ATAGC AAGCAGTG TTTAA TCTG AAGTAA TGAA TGTTATT TCAAGG AGC AAAGAAGC TAAC ACTTGC AATAA ATCTTTG TTTTG AAGTATC TTTC TCAAAGG TCATC AAAATAAG TTTT AATTTAG ATTCC TAAATCC AGTTTC TGCTCTG TTAGTTATT GGGG ATTTTTTG AATAAATAA TCTACGC AGAAC TGTGG ACTCTGC TCTGC TTTTTC AACCCC ATGGTGTGG TCATCC AGAAAGG ATTTC TTCTCC GC TCTAGGC TTAGAA ATGGGG TACC TCCTGCC TGATG TATCC TATGC TTTCC AGAACC TGAAAG ATTAAGATG AATC ATTACAAG TGAAATG ACCCTAG ACAGAG AACAAAG AGGGCTGGC ACATG TTTGC TGTAAC ATTCC GGG AGAGC TCTTC ATCCCG TTTAC ATGTTC TTG AGAGGG TGCCTTCC GTGC TGTG ATGAATG AGCCACCC AGACC TCCCGC TACC ACACAGC AATTG TTTAG TCAGAG ATCCTGTGC ATCTGGG TCTTTTTTTT AATC AGCAGG TTCTAA ATAAAAAAC AAAAAAC AATAAC AAGCCC ACCCTCTC TGAATATG ACTCTC TGAC TCTCTTG TGTTTC TTGTTTAC ATTTTATTG TGCG AATGTG ATTC TGCTTC TTAGCC TAGTGC ATTTGG ATTTG TTGTTC ACACTGAGC ATAA ATTGCC AAACAC TCAAC TTTAA TCTAA TTGTAC ATAC TATAAAC AGAAAA TGTTG ACG TTAAAAGC ATTTCC ATAATCAC AGATTGGG TGTATGG ATG AGCAAG TGGATG AGTT AGGCC TTTTG TCATC TCAGTCC ATAGC TTGATCC TTCAGG TATTC AAAAGGAAAC GGGG ACTGTC TTCCACTG ATGACC TCACTGATG ATGAGG TTCATC TGCC ACCATC TATAGTG AGTGAAAC TTTATGGTG TAGTTG TTAAGTCTC AAATTC AGAGAGAC TTAGG ATCAAATC TCACTCTGC TACTTTC TAGCTATG TGACC TTGGG AAAGCC ACATGG TGCC TTGAAG ACTC AGTCTCC TTAAC TATATT ATAAGAATAA TAATATT CCC TATGCC AAAGGG ATCCTGTG AGATAA TAACATC TTAATTG AGTTAA ATTATT TAAG AGTTAA ATGAGATAA TGGATAAAA ATCATGGC ACATTTTG AGCAC TTCATAA ATATTAATG ATAACG ATCC TTATTTAA ACGTGCCC TGCATTC TAAAAATG AGAAG TAACTTTC TGGC TGAAACC AACCCC TGAA TGGCAAC AGAGAA AGCTGTTTC AAC AGGGTTG AGAAAA AAGC TGGGGG ATAAAGTAA TGTTTC TAA TCTTAGAG TTTAAG AGAAAATAC ATTTTTT AATTC ACTTGG TAAATT AGAG ATCTTTT AGGGACACC AGAAG AAGGC ACTTTC TGAAAGAG TTAAAA TGATTTCC TTAGAG TAAACAA ATCTCTC TCATAGAA TTTTTGC TTAGAC TAAGTTG ATGGG ACATTC ATTAAG AAATAA ACTTTTC ATCC TCGC TTGGG TAATGC AACCAGGG AACG AGTAA ATATCCC GGG AAAGCC AACTTGC TATATGC AGGTAC TATT TCTTAAAA ATGTTATT TTTATC TATC AAAATAA TATT ACTGTTATT AAGTATC ATTG AGGTTC AATCC TGCG ACAGAA ACTGTAC TTAGC TATAGGG AATC AAATATG ATTGTGAC ATAGTTC TACCC TCAGGGG TTTTAAG TGGGAAG ATAGAA TATGCC ATTAAAAAAAA AGTAA TCCTTGGC ATGGAAGG TTAAATGCC TTATAAC TAAC TGATG ATTG ATAGC AGAAGAGTG ACTAA TTCTC ATCTAG AAAGAGAA GGCC TGGGC TCTAG TTTTGG TTCC ACCAC TTGTCAAG TTTGTAACC TAGGG AAATTC ACTTC AATCC TTTG AACTTTC AGTTTT TCAAAGG AAATGG AGATG ACG ATATT TGCCC TACC ATTCCC ATAAGG TTGCTGTG AGGTTC AAATG AGCTAAGG TTTACG AAAAC ACATAA TAAATTAC AGCAC TTCGG TGC TATTCC TTGGTGTG ATCATT TTCCTTCC TCTGCC TCCTC ATAGAC TGAGAC TCTC ATAAACTG TTTTATT TTCTG TCTCAGC TTATG AAATATC TGCAAG TTATATC ATTATG TGTGTGTG TGTATTG TGTGC ACATT ATCAAG TCTAA TCAAGCC AAAGC AGCAGAAC TAAACAC AGATATC TGGACTCC TAAAAATCC ACCAC TTAATCG TGAAG ACAAC ATTG TTAGAG AAGAAAAG ATATTC TCTAAGG TTGG ACCTATT TCAGAA ATG AGTAGC ATCACCC TTGCTTTAC AATGG AGAAAAC TGAG TATTG ATTTATTG AACAC TTATT TAATAA AGGTTTATG AAGAACCC ATCC TGCACC AGGGGCCC AGGTACC AAC TTAAAGAA TGTGAGTG AGAAAA ACAGGG AACTCAG TCCTGGC ATTGACC TTTGC TGTAAC TTCTGCTC ATTGTAGG AATCAGCC AACTTCC TGTCC TTTAG TTTCCTCTTC TGCAAAC TGAAG ATT AGTTAG TTGTAG AGCATAC AGTCAGTG TTATG TCTGAAAA TATTG AAATAC AGAGACAAAG TGAAAA AGAAGGG TATG AAACCCC TTTCC ATTAGAC TGTAAG AGGG ATGATG ATTGTTAC TTTTGGG AGTTATG AGCG TGGGC AGTGG AGAGAGTGG TTTGTTTG AGGATGCC ACGC TGAGC ATTGGG TGG ATGTGG AATTTGTG TGGGCAGGG AAGTAG AGAAGAGAG TTGGGGC AAGCTAAG ACTGCC AGCTTCC AGAC TGGAAGC TTCTGC GGTAG TTAC GGGG AATGAGTC AGGAAATAG TTCTGTG TAAATAG TTATG AAATTTTAA AGCTAA TTTTG TCATGGGCC AAAGGC ATTTTTT GGGG ATGATG AGAG ATATC AAATT TTGTGG ATGCGCC TACAAG TAGG TGATGG TTCTAC ACTGAAAG ATTTGCC ACTTTTC TTCACCC TAGAATG TTCATATTG TGCG TGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTG TGTATGG TTTCTTAG TGGACTGTG AGATATATT AAACATAG ATAAAAGG AATATT TAAC TAAAAG AGAAGC AACAGAA AGTTAA TCAAATAG TATCC AAGACAGG ACGG AAATGGGC TTTAGGGG AGTCC TGAGAGAA AGAGAAC TCAC ATTCATTG AGTTCG TGTG AATTGTTTC TGGGCCCC GGGC ACTGTC ATATCC ATG AAATAACC TTATTC TTGTCTTG AAAAGC TGTTCTC ATACAGATC TGAAAAC TAAGGCCC AGAGACAG TAAGC AGCTTC TGGGAATG ACTATG TTGTTG AGCTCAGG TTTGAGC TATGG AGGG TATGAAG TTATT TCCTC TTAGC AACTCC ATCACAGAC TCAAC ATGCTGGGC AAACTCAC TTTATC TTTAA AGAAC AGTCTC TATTTGC AAAGGAG AGAACC TGCTTCC ATACAC TTGGG ACTG TTAGAG TTGTC AGACG ATGTTACC AAAGC AAAGGC ACTTGAAC TTAGGCC AAGG TATATG TTTCTGTAG TCACCC TGTGG TAACTAC TGGGG TCAGC ATTTCAC AAAACC TAC TTACCC TGTTTAG TTAGG AAAACCC TAGAGG TGGGGG AGTGGG AGTGAGGG TCCCC AGTCCC ACTGTC ATTTGG AAAA ATGTCC AGATG AGAG TAGGC TGTCC ACTTCC TAGAGGC AAATC TTTCTGAA TCTAC ATAGTTTC ACAGAC TCACAGAAC TTCAGAGC TGAAG AGACC TTC AGATAG ATATTTTTC AGATAG ACCTTC AGATAGAC ATTTTGCC GC ACTGC TCAGTC TAGG TTAAC GGGAAGC TAGGGC AAGAATTC ACTT ATGGCCC TCCC TTCTTCC TGTATTC AGTATT TTCC TGTCTG TAAC ATTGGG TCCATG ATTAAGC TATTTAACC AGTTTC TGAA TTTGTAA TTTATG AAGCC AGGAAAA GGGC ATTTATC ACTTG AATCATCCC AGCAGCC TGTG TCAGAG TTAAGG AGGG AATTATT TTTTTTTC TAAAAATTC TGTTC TAGGC TATTTAAGG TCAC TCTAC TTGCC TCTTC TGGAGAG ACTCG TAC ATGCG TTGC TGATCCC TGGGC TGAG TTCTCCC AGCCC TAGTGAAC TCGG AAGTAC AGGTCC AGAAGG TTCTGC TTGATGG TTCCC ATCAGGG TAAAAC TGAAAA TAGG AAGCCG TTGGTTGC TGATTG TAAGATAA ATTTGTTTAAG TAG TGTGCC AAAAGC AGTGGG TCATATG AAAAGCC ACATG ACCAACC AGAAATAA TTGGAGC TTAAAAG ATGC TAGGG TCTATG AGTAAG ATTTC TTTCACC ATGGG ATTTAGG TAAGGC AAAC TCACCC ACTCAC TAGTTC TTAATTCCC ATTTTCTTTT TGTCC TGGAAC ATTTC ACCTGCCC TGATGC GGC AAATTAAG TGATTG AATTAA TAC AGAAATG TCAGCC TTTATTG ATGACAA TTAGG TGTTC ATATT ATTTCTG TTTTATT AATAA TTTATT TACC TATTCAAC AAATC TTTAAAGCC TACTGTG TGCTAG ATGTGG AGGAAG AAACAAG TAAC ACTTCC TCCG TGAC AGTTTT TCTAA TCCCTCTAG TGTAAATTC TCTCTCCC TTTCC TGAAAC TTAGTAG TTCTTTG TTTAT AGTTCTCC AATAG ATTTATGCC ATGTTGCC TTGTATTG TAGC AGCTTG AGAAC ATGTC TTACTATT TAGAAC TAAG ACAATTGC TTTAC AAGTATT TGTCTG TACCATG ATATTTAA AGTAG TGCTGGC ACAGAG TATG TTGTCAGTG TTGTGG AATAAATG ACTAA ATGAATATT TGTTG AATTAGG TAAGAAG TTGC TTCAGC TTTGGC TGTT ATGCTGC TGTAAC AAAC AGCTCCC AAATT TCAATAGC TCAG AACACAATG ATTTATT TCTC ATCTATG TTAA TGCCC ATAGTG AGTTAGG TGCAGC TCTGC TCCCC ATCTTC TGGATT TGGGG ATCTGGG TAG AAATAGCC ATT AGTTGGG ATTTTCTTG TGTTGGGG AACAAG AGAGATGGC AGAAACAC ATG ATAGATC AGAAG TGGCATTC ATTGGC TGGGCACGG TGGCTCACGCCTGTAATCCCAGCACTTTGGG AGGC ATAGGC AGGTGG ATCACC TGAGC TCAGGAG CCC AAGATC AGCC TGGCCAAC AATGG TGAAACCCCATCTCTACTAAAAATACAAAAATT AGCCAAGC ACGGTGGC AGGCACC TGTATC TCAGC TACTTGG AAGGCTGAGGC AAGAGAA TTGCTTGAACCC GGGAGGTGGAGG TTGCAGTG AGCTAAG ATTGCGC TACCACCC TCCACC TGAGC AGC AGAGCGAGAC TCTG TCAAAAAAC AAACAAACAAACAAAC AACATCAC TTCTGCTC AAATT TCG TTGGCCC AAACTAG TCATG TAGCC ACGCC TGCC GTGG AGGGC AGACAAGG ATAA TTCTCCC ATGAGAA AGGCC ATGAATC TTTGGG AATAA TAATAT AATTTACC AGAG AAGTCATCC TTATTTTTT AAAGAAC TTAAAA TTTAGTTG AGGAAG TAAGC TATACAC AAAGAAATAC AATAAAAAA AAGGTGC AAGC AACATG TTATAG AGGTGAGGG AGGAGAG ATTTCTTTGG ACTAAG ATTAGTCAC AGAAGG ATTAATAA AAGATG TGTTC TTTAA ATTGG ACATG AAAAGTAAG ATTTTGCC AAG TGGAAC TGGACAAG AGGTGAA TAGAAG AGTATT TAAAAAG ATATG AAGGTAC TCAAAC AAAA AATGTAC TAAAAAA AAGAGTG AAAAG TCCAC TTTTGG TGGATAA TTAGG TCCAC ATTTCAAAG TTGGG AATTTAG AGTCTATT AAGC AGGAAATT ATAA ACCACTAG AGATTTGG AAAGC TAAC TAAAGG ATGCAATGG AGAGAAGC TGAAAA TATTTTTG AGGC TATGC AAAGAG TTCAGG AAACAGGG ACTAA AGACAGAA TCAGAA TAG TGAAAAG TATG AACAGG ACAGAAC ATAC AGAGGC AAGATGC AAAGG AAATGTAC AAAGGTTG AAAACCG ATTGG TTTGG AAAGC AAAGG AGAGAGGC AGTG AAAGAAG TTGCAGATG ATTATTCC ATTAATGG TGGTGCC ATTAATGG AATTCAAAA AATAAG AAG AGGACTGAC TCATAGG AAGAGAAAA TAAGTTTTG TTTGAGG TATTC TGATTTC GAGG AATTTC AGAG AGAAATG TTTAG TAGGCG TATGG AACTCTGGG AATAG AGTTTG TGGGATTG TGGTTG TGATTG AAGATG TAGTCC TGAGGG ACCCC TGAAG AGGTGAC AGTTG AAGCC ATGAGTGC AGATG AGAATCCC AAAGG AAACTAG TGGCC AAAAGGC AGAG TCTTGG AGGGCTGCC AACATG TAGGATG TGGGAAG ATGAAG ACAAACC AGGGAGGG AAGCTGAAG AACC TTGAC AAGGCAGAG AGGAG AACAC TATAGTG TGGG ATCAAG TGAGC TGAGGC AGGAGAG AGGCTGAGG AGCAGGG AGAGG TCAGCGG TGTC AAATGC TTTAG AAAGTGC TAAG AAGATG AGAA TGTAGG AAGTGG TATTG AGGTTAGAG TAGG AGATC ATTGGC GATG AGTAAGG AAAC AACTTC AGTGAGG ACTGG AGATG TTCTTG TGAGATATC TGATAAC AAAAATTAC AGAGATTGC ATAA TGGAGG ATT AGTTGG AAC TGGTGG AAC TGAGAG TACGC TTAG TGCG ATAACC TTTGAAAAG AAGAGG AACC TATTCC ATTTGGGG AAGGC AGGAGAAAAC TATGC ACTAAG AGAG AACTTG TCCATG AGAAGG AGTG ATTTTTAAGG TGCTTC TTAAC AAAGTAG AGTTTAGGG AATGTATTC ACTC TTTGAAATT AAAAAGC AATTGC TTATTATTG AAAACCC AGGTTAGC TATT AAAAAAAAAAAA AGAGAAAA ATAAG ACAAAA AAAGAAAAAAAA ACCATGC ATGTGTAAC AAGTC AGGGGAAGC TGAGGAG ACCTTCC AAACTGTAC TGTATTC ACTTGC ATATATTCC ACATCTGGC ACTGGGC AGTC AAATATTC ACAGG TAATAA ATAGATATT AAAGAA TGTATT ATTGGGC ATTAGG ACTC ATAATTTT AGAAAAATG TTTTTTG TGGC TGGGCGTGG TGGCTCACTCC TGTAATCCCAGCACTTTGGG AGGCCAAGG AGAG TGGATC AGAAGG TCAGGAG ATCG ACAGCATCC TGGCCAACATGGTGAAACCCC G T [SEP]
,,,,


True Label,Predicted Label,Attribution Label,Attribution Score,Word Importance
1.0,0 (0.55),AGCTACTTGGGAGGTTGAGGCAGGAGAATCACTTGAACCAGAAGGCAGAGGTTGCAGTGGGCCGAGATCACGTCATTGCACCCCAGCCTGGGCAACAAGAGGGAAACTCTGTCTCAAAAGAAAAAAAAAATTAACACAGGTAAAAAGCTTAGATCAGTGCTGAGCACAATATAAACCCATTAGTGGCTAAACCATCAACAAGTGTTGGGAGCTGCTGCTATTTTTACTTTCCCTAGAATTCTATCTCTTACCTTTCACTCTTCTCACTGCCCTTATTTGCCCAGAAATCCCTTTATGTCCTGAAAAACTCAACTCTCATATTTTACTTTTAGGAAATTATCAGTTACTGCTCTAACACAGTTCTTGATGTATGCTCTTCACTCCCTGACCTTTTGCTTTGTTGATACTTTATTATTGTACTTACGACTCCATACTTAAAAAATATAATTGGTAAAAAAAAATGTAACTAGTAATAGGCAGAAAAACTGGAATTGATTCCCAGTGCCTGTTACATGACAGGGGCTCATTATATACTTGCTGAGTGAATGATGGAAGGTCAAGTGAACAAATTAGAGAAATCAGGCAGAAAATATTTCCAGGTATCTTGGGGAGTTGAGAATTAGAGAAGAAAAGAATGAAGGAGGTTGGGATTTGATGAAGAACATATTTGTGACAGTGAAACTCAGTCGTGGGATTTGCTGTTTATATTGTTTTCTTTCCTTCTCAAATCAACATGAGTTGTACAGACCATAATAAAAGCTTCATCTTGAGCCTGTTATTGCATCACCATTTGGCTGATGTTTCACTGCTCCATCACTGTGGGAGGTTAACACTCACTGAGGGGTGGCAGTACCCTCTGCATTTCTCTGGGAAACTCCAATGATTCATCCAAAAGTGTGAGAAGCCAAGCAGCTTTTATCACCCAGGAGACAGCTGTAACCTGACCTCAATTCATGCCAAAGAAGCCTGAGGAAAGTGCCCTGGAAGTGAACAGCCTGCTCATGACTCAAGGAACTCAAAAGTCAGAGTTCTGACCAGTATTGTTGGGGTGGGTAAAAGAACTTCACTCCCTCAGATCTGAAAGTGTCCTTGCCAGAGGAGAGGGAGACCTTATTTCAAGTGTGTTTGAATAAACATGACATACATAAACTTGATTTTCCAGGTTTTGGAGAAAGCATACATTTGTCCTCTGCATCATGAAATAATGTCCTTGGTGGCTCCTTTCAGGGCCTGTGCTGCACTCTCCTTAGTGACTATTAGCATTGGAGTTGGACAATTTAAGGGCAGGAGTGGAGACCTGCTACTTATAAAGGATGACTACACTTATTTAGGGATACTGCTCACGCTGACTCTCAGAGCAATTCTTTTGTTCCAACAGCTGTTCCCAGGGTAGGGTAATATTGGAACAGAGGCTTATGCTGCAGTATCCATTGAGTGGGACTGAGGCCCCTTCAGTAGCTGAAAATCCCCACTTCAGTGCTACTGCTTCAGCTACTGCAGCTCTTACTGTCTTCAAAAACAATGGTAAGGATTCCTTTAACCTCAGAGGAGGAATTAGCTTTTTGCAGAGACTACAAAGAATCCATAGGATACAAACATTTCTATAGTCCAGGAAGGAGTCCCACATATAAAAACAAAACTGTAATATATTTTATAAGTGATTTGCCTAAATATGTGAGGCTGTATTCACTCAGTTTCTCAAGAAGCATTTCTTGAGAAGCTACTGTGTGCCAGAGCCTCCTTAGGGGGCAGGAACTGCTTATTTATCTTCATATCAACATCCCTAGGTAAGTGCCTAGCCCATCGTATGGGCTACAGACTATGCAATGCTATTTCCCTTAGCCCCACCAGAGTTCAGGGTCAGACTGATGGGCAGGACTATGAACAGATCTTCTTTCTCTCCTTGAAGGTAACTAACCTTCCATGGGACTTGAAGCTTCAGATTTTGGCCTTAACCAAGTCAACTAGCTCAAGTCAGAGGGGCAGTGATTATTTGAATTGCCAAGGTATTACCTAATGAGAATCTTTGTGACTAAGCTCTTAAAGTTGAAACTTAAGTAACATTAGCTGAAAAACTTGTTGGATAAACATTGCTACTCCCTTGAAAATTCCGGGAGTTCCAGTTTGGTTGCTGACCATTTTTTACCATTTATCTATTTGTTTAGCACTAACGTTTCTTAAGCTTCCAATGTATATAGAATGCTATGCTGGGTTGTGGGAAATACAATGAGCTATGCTCCCTGTCTGCAAGTCGGTCACATTTTAAGTGGGGGTGCAATAAATGACAGATTCAAACCACTGAACAATTATTAACAGAGAAAAGCAACTTTTATGGGCAAAGGCTTTCGGCAACTCCAGGCACAGTCTCACCCAAGGCCTTGATTGTGGCACTGCTTCTGTCACAGAGAATAAGAGTGAAATGTTAGAAGACTGTTGAAACACTGCGGAGTTAATGTTATGTTCCTTTTCATCTTTGGGTCTTTGTACATGCTGGTTCCTTGTCTTCCCACCACTACCCCTATATCATTTATCTAATTAAAACTCATAAACATGAATGAGAAGCCCTTTTTGACCACCAGCCTACAAACAGACACACAGACACACACACACACACACACACACACACACACACACACACTGCGTTGTCCTTCCATTGAGGTACCAACAGCACACTATAATTTCTCCATTATGATAGCATTTATTACAAGGTATTATGATTTCTGTTTAACTTCTCTGTATCCCTCCTGCCTGCTACATTGTAACTTCTGTGACTGCAGGGATATATCTGTTTTGTTCACCATTATATTGGCTAGCATGTAGCAGCCATTCAATAAATACTTGCTGAATGCATGAATGAACGGCTGAATGGCAGAACCAACATTTGAGTAAAATTTTCGTGTATTGTTTACTTTGTGCTATAACTTCCTAGGTATTTTATGGATCTTCTTTCTGTGGGGTTATATATAGTATAAATTTGTTGCAATATTATATTCTTTTTAAATGCCTCAGTCACTTGTTAAATTTAGTGCTTGTTGCAGAAGGGTATAATGTTACTGATAGGAAAGCCATAGTCTTGATCCCTATATCGAGGCCAAATGGCTTCTTATCTGGAAATCTCTGCCTTAAATTGAGCAGTATCTAGATTAGATGTTTTGAAACTATGTATCACTCACTATGGTGGGCAAATAGTTCAGACAGACTAGGAGACGGGATATGAGAAACTTAGAATAAGCTACAAGAAGAATTCTAAAGACACATGACCCATTAAATTCCTTTTTCATTGAAAATCAGACCAAAATCTGTGGCAAAAACAGAAAACGTATTCCGGAAATATGGCTGTAGAACTGAAGACTAAATAGCAAGCAGTGTTTAATCTGAAGTAATGAATGTTATTTCAAGGAGCAAAGAAGCTAACACTTGCAATAAATCTTTGTTTTGAAGTATCTTTCTCAAAGGTCATCAAAATAAGTTTTAATTTAGATTCCTAAATCCAGTTTCTGCTCTGTTAGTTATTGGGGATTTTTTGAATAAATAATCTACGCAGAACTGTGGACTCTGCTCTGCTTTTTCAACCCCATGGTGTGGTCATCCAGAAAGGATTTCTTCTCCGCTCTAGGCTTAGAAATGGGGTACCTCCTGCCTGATGTATCCTATGCTTTCCAGAACCTGAAAGATTAAGATGAATCATTACAAGTGAAATGACCCTAGACAGAGAACAAAGAGGGCTGGCACATGTTTGCTGTAACATTCCGGGAGAGCTCTTCATCCCGTTTACATGTTCTTGAGAGGGTGCCTTCCGTGCTGTGATGAATGAGCCACCCAGACCTCCCGCTACCACACAGCAATTGTTTAGTCAGAGATCCTGTGCATCTGGGTCTTTTTTTTAATCAGCAGGTTCTAAATAAAAAACAAAAAACAATAACAAGCCCACCCTCTCTGAATATGACTCTCTGACTCTCTTGTGTTTCTTGTTTACATTTTATTGTGCGAATGTGATTCTGCTTCTTAGCCTAGTGCATTTGGATTTGTTGTTCACACTGAGCATAAATTGCCAAACACTCAACTTTAATCTAATTGTACATACTATAAACAGAAAATGTTGACGTTAAAAGCATTTCCATAATCACAGATTGGGTGTATGGATGAGCAAGTGGATGAGTTAGGCCTTTTGTCATCTCAGTCCATAGCTTGATCCTTCAGGTATTCAAAAGGAAACGGGGACTGTCTTCCACTGATGACCTCACTGATGATGAGGTTCATCTGCCACCATCTATAGTGAGTGAAACTTTATGGTGTAGTTGTTAAGTCTCAAATTCAGAGAGACTTAGGATCAAATCTCACTCTGCTACTTTCTAGCTATGTGACCTTGGGAAAGCCACATGGTGCCTTGAAGACTCAGTCTCCTTAACTATATTATAAGAATAATAATATTCCCTATGCCAAAGGGATCCTGTGAGATAATAACATCTTAATTGAGTTAAATTATTTAAGAGTTAAATGAGATAATGGATAAAAATCATGGCACATTTTGAGCACTTCATAAATATTAATGATAACGATCCTTATTTAAACGTGCCCTGCATTCTAAAAATGAGAAGTAACTTTCTGGCTGAAACCAACCCCTGAATGGCAACAGAGAAAGCTGTTTCAACAGGGTTGAGAAAAAAGCTGGGGGATAAAGTAATGTTTCTAATCTTAGAGTTTAAGAGAAAATACATTTTTTAATTCACTTGGTAAATTAGAGATCTTTTAGGGACACCAGAAGAAGGCACTTTCTGAAAGAGTTAAAATGATTTCCTTAGAGTAAACAAATCTCTCTCATAGAATTTTTGCTTAGACTAAGTTGATGGGACATTCATTAAGAAATAAACTTTTCATCCTCGCTTGGGTAATGCAACCAGGGAACGAGTAAATATCCCGGGAAAGCCAACTTGCTATATGCAGGTACTATTTCTTAAAAATGTTATTTTTATCTATCAAAATAATATTACTGTTATTAAGTATCATTGAGGTTCAATCCTGCGACAGAAACTGTACTTAGCTATAGGGAATCAAATATGATTGTGACATAGTTCTACCCTCAGGGGTTTTAAGTGGGAAGATAGAATATGCCATTAAAAAAAAAGTAATCCTTGGCATGGAAGGTTAAATGCCTTATAACTAACTGATGATTGATAGCAGAAGAGTGACTAATTCTCATCTAGAAAGAGAAGGCCTGGGCTCTAGTTTTGGTTCCACCACTTGTCAAGTTTGTAACCTAGGGAAATTCACTTCAATCCTTTGAACTTTCAGTTTTTCAAAGGAAATGGAGATGACGATATTTGCCCTACCATTCCCATAAGGTTGCTGTGAGGTTCAAATGAGCTAAGGTTTACGAAAACACATAATAAATTACAGCACTTCGGTGCTATTCCTTGGTGTGATCATTTTCCTTCCTCTGCCTCCTCATAGACTGAGACTCTCATAAACTGTTTTATTTTCTGTCTCAGCTTATGAAATATCTGCAAGTTATATCATTATGTGTGTGTGTGTATTGTGTGCACATTATCAAGTCTAATCAAGCCAAAGCAGCAGAACTAAACACAGATATCTGGACTCCTAAAAATCCACCACTTAATCGTGAAGACAACATTGTTAGAGAAGAAAAGATATTCTCTAAGGTTGGACCTATTTCAGAAATGAGTAGCATCACCCTTGCTTTACAATGGAGAAAACTGAGTATTGATTTATTGAACACTTATTTAATAAAGGTTTATGAAGAACCCATCCTGCACCAGGGGCCCAGGTACCAACTTAAAGAATGTGAGTGAGAAAAACAGGGAACTCAGTCCTGGCATTGACCTTTGCTGTAACTTCTGCTCATTGTAGGAATCAGCCAACTTCCTGTCCTTTAGTTTCCTCTTCTGCAAACTGAAGATTAGTTAGTTGTAGAGCATACAGTCAGTGTTATGTCTGAAAATATTGAAATACAGAGACAAAGTGAAAAAGAAGGGTATGAAACCCCTTTCCATTAGACTGTAAGAGGGATGATGATTGTTACTTTTGGGAGTTATGAGCGTGGGCAGTGGAGAGAGTGGTTTGTTTGAGGATGCCACGCTGAGCATTGGGTGGATGTGGAATTTGTGTGGGCAGGGAAGTAGAGAAGAGAGTTGGGGCAAGCTAAGACTGCCAGCTTCCAGACTGGAAGCTTCTGCGGTAGTTACGGGGAATGAGTCAGGAAATAGTTCTGTGTAAATAGTTATGAAATTTTAAAGCTAATTTTGTCATGGGCCAAAGGCATTTTTTGGGGATGATGAGAGATATCAAATTTTGTGGATGCGCCTACAAGTAGGTGATGGTTCTACACTGAAAGATTTGCCACTTTTCTTCACCCTAGAATGTTCATATTGTGCGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTATGGTTTCTTAGTGGACTGTGAGATATATTAAACATAGATAAAAGGAATATTTAACTAAAAGAGAAGCAACAGAAAGTTAATCAAATAGTATCCAAGACAGGACGGAAATGGGCTTTAGGGGAGTCCTGAGAGAAAGAGAACTCACATTCATTGAGTTCGTGTGAATTGTTTCTGGGCCCCGGGCACTGTCATATCCATGAAATAACCTTATTCTTGTCTTGAAAAGCTGTTCTCATACAGATCTGAAAACTAAGGCCCAGAGACAGTAAGCAGCTTCTGGGAATGACTATGTTGTTGAGCTCAGGTTTGAGCTATGGAGGGTATGAAGTTATTTCCTCTTAGCAACTCCATCACAGACTCAACATGCTGGGCAAACTCACTTTATCTTTAAAGAACAGTCTCTATTTGCAAAGGAGAGAACCTGCTTCCATACACTTGGGACTGTTAGAGTTGTCAGACGATGTTACCAAAGCAAAGGCACTTGAACTTAGGCCAAGGTATATGTTTCTGTAGTCACCCTGTGGTAACTACTGGGGTCAGCATTTCACAAAACCTACTTACCCTGTTTAGTTAGGAAAACCCTAGAGGTGGGGGAGTGGGAGTGAGGGTCCCCAGTCCCACTGTCATTTGGAAAAATGTCCAGATGAGAGTAGGCTGTCCACTTCCTAGAGGCAAATCTTTCTGAATCTACATAGTTTCACAGACTCACAGAACTTCAGAGCTGAAGAGACCTTCAGATAGATATTTTTCAGATAGACCTTCAGATAGACATTTTGCCGCACTGCTCAGTCTAGGTTAACGGGAAGCTAGGGCAAGAATTCACTTATGGCCCTCCCTTCTTCCTGTATTCAGTATTTTCCTGTCTGTAACATTGGGTCCATGATTAAGCTATTTAACCAGTTTCTGAATTTGTAATTTATGAAGCCAGGAAAAGGGCATTTATCACTTGAATCATCCCAGCAGCCTGTGTCAGAGTTAAGGAGGGAATTATTTTTTTTTCTAAAAATTCTGTTCTAGGCTATTTAAGGTCACTCTACTTGCCTCTTCTGGAGAGACTCGTACATGCGTTGCTGATCCCTGGGCTGAGTTCTCCCAGCCCTAGTGAACTCGGAAGTACAGGTCCAGAAGGTTCTGCTTGATGGTTCCCATCAGGGTAAAACTGAAAATAGGAAGCCGTTGGTTGCTGATTGTAAGATAAATTTGTTTAAGTAGTGTGCCAAAAGCAGTGGGTCATATGAAAAGCCACATGACCAACCAGAAATAATTGGAGCTTAAAAGATGCTAGGGTCTATGAGTAAGATTTCTTTCACCATGGGATTTAGGTAAGGCAAACTCACCCACTCACTAGTTCTTAATTCCCATTTTCTTTTTGTCCTGGAACATTTCACCTGCCCTGATGCGGCAAATTAAGTGATTGAATTAATACAGAAATGTCAGCCTTTATTGATGACAATTAGGTGTTCATATTATTTCTGTTTTATTAATAATTTATTTACCTATTCAACAAATCTTTAAAGCCTACTGTGTGCTAGATGTGGAGGAAGAAACAAGTAACACTTCCTCCGTGACAGTTTTTCTAATCCCTCTAGTGTAAATTCTCTCTCCCTTTCCTGAAACTTAGTAGTTCTTTGTTTATAGTTCTCCAATAGATTTATGCCATGTTGCCTTGTATTGTAGCAGCTTGAGAACATGTCTTACTATTTAGAACTAAGACAATTGCTTTACAAGTATTTGTCTGTACCATGATATTTAAAGTAGTGCTGGCACAGAGTATGTTGTCAGTGTTGTGGAATAAATGACTAAATGAATATTTGTTGAATTAGGTAAGAAGTTGCTTCAGCTTTGGCTGTTATGCTGCTGTAACAAACAGCTCCCAAATTTCAATAGCTCAGAACACAATGATTTATTTCTCATCTATGTTAATGCCCATAGTGAGTTAGGTGCAGCTCTGCTCCCCATCTTCTGGATTTGGGGATCTGGGTAGAAATAGCCATTAGTTGGGATTTTCTTGTGTTGGGGAACAAGAGAGATGGCAGAAACACATGATAGATCAGAAGTGGCATTCATTGGCTGGGCACGGTGGCTCACGCCTGTAATCCCAGCACTTTGGGAGGCATAGGCAGGTGGATCACCTGAGCTCAGGAGCCCAAGATCAGCCTGGCCAACAATGGTGAAACCCCATCTCTACTAAAAATACAAAAATTAGCCAAGCACGGTGGCAGGCACCTGTATCTCAGCTACTTGGAAGGCTGAGGCAAGAGAATTGCTTGAACCCGGGAGGTGGAGGTTGCAGTGAGCTAAGATTGCGCTACCACCCTCCACCTGAGCAGCAGAGCGAGACTCTGTCAAAAAACAAACAAACAAACAAACAACATCACTTCTGCTCAAATTTCGTTGGCCCAAACTAGTCATGTAGCCACGCCTGCCGTGGAGGGCAGACAAGGATAATTCTCCCATGAGAAAGGCCATGAATCTTTGGGAATAATAATATAATTTACCAGAGAAGTCATCCTTATTTTTTAAAGAACTTAAAATTTAGTTGAGGAAGTAAGCTATACACAAAGAAATACAATAAAAAAAAGGTGCAAGCAACATGTTATAGAGGTGAGGGAGGAGAGATTTCTTTGGACTAAGATTAGTCACAGAAGGATTAATAAAAGATGTGTTCTTTAAATTGGACATGAAAAGTAAGATTTTGCCAAGTGGAACTGGACAAGAGGTGAATAGAAGAGTATTTAAAAAGATATGAAGGTACTCAAACAAAAAATGTACTAAAAAAAAGAGTGAAAAGTCCACTTTTGGTGGATAATTAGGTCCACATTTCAAAGTTGGGAATTTAGAGTCTATTAAGCAGGAAATTATAAACCACTAGAGATTTGGAAAGCTAACTAAAGGATGCAATGGAGAGAAGCTGAAAATATTTTTGAGGCTATGCAAAGAGTTCAGGAAACAGGGACTAAAGACAGAATCAGAATAGTGAAAAGTATGAACAGGACAGAACATACAGAGGCAAGATGCAAAGGAAATGTACAAAGGTTGAAAACCGATTGGTTTGGAAAGCAAAGGAGAGAGGCAGTGAAAGAAGTTGCAGATGATTATTCCATTAATGGTGGTGCCATTAATGGAATTCAAAAAATAAGAAGAGGACTGACTCATAGGAAGAGAAAATAAGTTTTGTTTGAGGTATTCTGATTTCGAGGAATTTCAGAGAGAAATGTTTAGTAGGCGTATGGAACTCTGGGAATAGAGTTTGTGGGATTGTGGTTGTGATTGAAGATGTAGTCCTGAGGGACCCCTGAAGAGGTGACAGTTGAAGCCATGAGTGCAGATGAGAATCCCAAAGGAAACTAGTGGCCAAAAGGCAGAGTCTTGGAGGGCTGCCAACATGTAGGATGTGGGAAGATGAAGACAAACCAGGGAGGGAAGCTGAAGAACCTTGACAAGGCAGAGAGGAGAACACTATAGTGTGGGATCAAGTGAGCTGAGGCAGGAGAGAGGCTGAGGAGCAGGGAGAGGTCAGCGGTGTCAAATGCTTTAGAAAGTGCTAAGAAGATGAGAATGTAGGAAGTGGTATTGAGGTTAGAGTAGGAGATCATTGGCGATGAGTAAGGAAACAACTTCAGTGAGGACTGGAGATGTTCTTGTGAGATATCTGATAACAAAAATTACAGAGATTGCATAATGGAGGATTAGTTGGAACTGGTGGAACTGAGAGTACGCTTAGTGCGATAACCTTTGAAAAGAAGAGGAACCTATTCCATTTGGGGAAGGCAGGAGAAAACTATGCACTAAGAGAGAACTTGTCCATGAGAAGGAGTGATTTTTAAGGTGCTTCTTAACAAAGTAGAGTTTAGGGAATGTATTCACTCTTTGAAATTAAAAAGCAATTGCTTATTATTGAAAACCCAGGTTAGCTATTAAAAAAAAAAAAAGAGAAAAATAAGACAAAAAAAGAAAAAAAAACCATGCATGTGTAACAAGTCAGGGGAAGCTGAGGAGACCTTCCAAACTGTACTGTATTCACTTGCATATATTCCACATCTGGCACTGGGCAGTCAAATATTCACAGGTAATAAATAGATATTAAAGAATGTATTATTGGGCATTAGGACTCATAATTTTAGAAAAATGTTTTTTGTGGCTGGGCGTGGTGGCTCACTCCTGTAATCCCAGCACTTTGGGAGGCCAAGGAGAGTGGATCAGAAGGTCAGGAGATCGACAGCATCCTGGCCAACATGGTGAAACCCCGT,2.37,[CLS] AGCTAC TTGGG AGGTTGAGGCAGGAGAA TCACTTGAACC AGAAGGC AGAGGTTGC AGTGGGCC G AGATCACG TCATTGC ACCCC AGCCTGGGCAACAAG AGGGAAAC TCTGTCTC AAAAGAAAAAAAA AATTAAC ACAGG TAAAAAGC TTAGATC AGTGC TGAGC ACAA TATAAACCC ATT AGTGGC TAAACC ATCAAC AAG TGTTGGG AGCTGCTGC TATTTTTAC TTTCCC TAGAATTC TATC TCTTACC TTTCACTC TTCTCAC TGCCC TTATT TGCCC AGAAATCCC TTTATG TCCTGAAAA ACTC AACTCTC ATATT TTACTTTT AGGAAATT ATC AGTTAC TGCTC TAACACAG TTCTTG ATGTATGC TCTTC ACTCCC TGACC TTTTGC TTTGTTG ATAC TTTATT ATTGTAC TTACG ACTCC ATACTTAAAA AATAT AATTGG TAAAAAA AAATGTAAC TAGTAA TAGGC AGAAAA ACTGG AATTG ATTCCC AGTGCC TGTTAC ATGAC AGGGGC TCATT ATAT ACTTGC TGAGTGAA TGATGG AAGGTCAAG TGAAC AAATT AGAGAA ATCAGGC AGAAAATATT TCCAGG TATC TTGGGG AGTTG AGAA TTAGAG AAGAAAAG AATG AAGGAGG TTGGG ATTTGATG AAGAAC ATATTTGTG ACAGTG AAAC TCAGTC GTGGG ATTTGC TGTTTAT ATTGTTTTC TTTCC TTCTC AAATC AACATG AGTTGTAC AGACC ATAATAA AAGCTTC ATCTTG AGCC TGTTATTGC ATCACC ATTTGGC TGATGTTTC ACTGC TCCATC ACTG TGGGAGG TTAAC ACTCAC TGAGGGG TGGC AGTACCC TCTGC ATTTCTC TGGG AAACTCC AATG ATTCATCC AAAAGTGTG AGAAGCC AAGC AGCTTTT ATCACCC AGGAGAC AGC TGTAACC TGACC TCAATTC ATGCC AAAGAAGCC TGAGG AAAGTGCCC TGGAAG TGAAC AGCCTGC TCATG ACTCAAGG AACTCAAAAG TCAGAG TTCTGACC AGTATTG TTGGGG TGGG TAAAAGAAC TTCACTCCC TCAGATC TGAAAG TGTCC TTGCC AGAGGAG AGGGAGACC TTATT TCAAG TGTGTTTG AATAAACATG ACATAC ATAAACTTG ATTTTCC AGGTTTTGG AGAAAGC ATACATTTG TCCTCTGC ATCATG AAATAA TGTCC TTGGTGGC TCCTTTC AGGGCC TGTGCTGC ACTCTCC TTAGTG ACTATT AGCATTGG AGTTGG ACAATTTAA GGGC AGGAGTGG AGACC TGCTAC TTATAA AGGATG ACTAC ACTTATT TAGGG ATACTGC TCACGC TGACTCTC AGAGC AATTC TTTTG TTCCAAC AGCTG TTCCCAGGG TAGGG TAA TATTGG AAC AGAGGC TTATGC TGC AGTATCC ATTG AGTGGG ACTG AGGCCCC TTCAGTAGC TGAAAA TCCCC ACTTC AGTGCTAC TGCTTC AGCTAC TGC AGCTC TTACTGTC TTCAAAA ACAATGG TAAGG ATTCC TTTAACC TCAG AGGAGG AATTAGC TTTTTGC AGAGACTAC AAAGAA TCC ATAGG ATACAAAC ATTTC TATAGTCC AGGAAGG AGTCCC ACATAT AAAAACAAAAC TGTAA TATATTTT ATAAG TGATTTGCC TAAATATG TGAGGC TGTATTC ACTCAG TTTCTCAAG AAGC ATTTCTTG AGAAGC TACTGTG TGCC AGAGCC TCC TTAGGG GGC AGGAAC TGCTTATT TATCTTC ATATCAAC ATCCC TAGG TAAGTGCC TAGCCC ATCG TATGGGC TACAGAC TATGC AATGC TATTTCCC TTAGCCCC ACCAGAG TTCAGGG TCAGAC TGATGGGC AGGAC TATGAAC AGATC TTCTTTC TCTCC TTGAAGG TAAC TAACC TTCC ATGGG ACTTG AAGCTTC AGATT TTGGCC TTAACC AAGTCAAC TAGC TCAAG TCAG AGGGGC AGTG ATTATT TGAATTGCC AAGGTATT ACCTAA TGAGAA TCTTTGTG ACTAAGC TCTTAAAG TTGAAAC TTAAGTAAC ATTAGC TGAAAA ACTTG TTGGATAA ACATTGC TACTCCC TTGAAAA TTCCGGG AGTTCC AGTTTGG TTGC TGACC ATTTTTT ACC ATTTATC TATT TGTTTAGC ACTAACG TTTC TTAAGC TTCCAATG TATATAGAA TGCTATGC TGGG TTGTGGG AAATAC AATGAGC TATGC TCCCTGTC TGCAAG TCGG TCAC ATTTTAAG TGGGGG TGC AATAAATG ACAGATTC AAACC ACTGAAC AATTATT AACAGAG AAAAGC AACTTTT ATGGGC AAAGGC TTTCGGC AACTCC AGGC ACAGTCTC ACCC AAGGCC TTGATTG TGGCACTGC TTCTGTCAC AGAGAA TAAG AGTGAA ATG TTAGAAG ACTGTTG AAACAC TGCGG AGTTAA TGTTATG TTCC TTTTCATC TTTGGG TCTTTG TAC ATGCTGG TTCC TTGTC TTCCC ACCAC TACCCC TATATC ATTTATC TAA TTAAAAC TCATAA ACATG AATG AGAAGCCC TTTT TGACC ACCAGCC TACAAAC AGACAC ACAG ACACACACACACACACACACACACACACACACACACACAC TGCG TTGTCC TTCCATTG AGGTACC AACAGC ACAC TATAATTTC TCC ATTATG ATAGC ATTTATT ACAAGG TATT ATGATT TCTG TTTAAC TTCTCTG TATCCC TCCTGCC TGCTAC ATTGTAAC TTCTGTG ACTGC AGGG ATATATC TGTTTTG TTCACC ATTATATT GGC TAGC ATGTAGC AGCCATTC AATAAATAC TTGCTGAA TGCATG AATGAAC GGC TGAATGGC AGAACC AACATT TGAG TAAAATTTTC GTG TATTG TTTAC TTTGTGC TATAAC TTCC TAGGTATT TTATGG ATCTTC TTTC TGTGGGG TTATAT ATAG TATAAATT TGTTGC AATATT ATATTC TTTTTAA ATGCC TCAG TCACTTG TTAA ATTTAG TGCTTG TTGC AGAAGGG TATAATG TTAC TGATAGG AAAGCC ATAGTC TTGATCCC TATATCG AGGCC AAATGGC TTCTTATC TGG AAATCTC TGCC TTAAATTG AGCAGTATC TAGATT AGATG TTTTGAAAC TATGTATC ACTCAC TATGG TGGGC AAATAG TTCAGAC AGACTAGG AGACGGG ATATG AGAA ACTTAGAA TAAGCTAC AAGAAG AATTCTAA AGACAC ATGACCC ATT AAATTCC TTTTTC ATTGAAAA TCAG ACCAAAA TCTGTGGC AAAAACAG AAAACG TATTCC GG AAATATGGC TGTAG AACTGAAG ACTAA ATAGC AAGCAGTG TTTAA TCTG AAGTAA TGAA TGTTATT TCAAGG AGC AAAGAAGC TAAC ACTTGC AATAA ATCTTTG TTTTG AAGTATC TTTC TCAAAGG TCATC AAAATAAG TTTT AATTTAG ATTCC TAAATCC AGTTTC TGCTCTG TTAGTTATT GGGG ATTTTTTG AATAAATAA TCTACGC AGAAC TGTGG ACTCTGC TCTGC TTTTTC AACCCC ATGGTGTGG TCATCC AGAAAGG ATTTC TTCTCC GC TCTAGGC TTAGAA ATGGGG TACC TCCTGCC TGATG TATCC TATGC TTTCC AGAACC TGAAAG ATTAAGATG AATC ATTACAAG TGAAATG ACCCTAG ACAGAG AACAAAG AGGGCTGGC ACATG TTTGC TGTAAC ATTCC GGG AGAGC TCTTC ATCCCG TTTAC ATGTTC TTG AGAGGG TGCCTTCC GTGC TGTG ATGAATG AGCCACCC AGACC TCCCGC TACC ACACAGC AATTG TTTAG TCAGAG ATCCTGTGC ATCTGGG TCTTTTTTTT AATC AGCAGG TTCTAA ATAAAAAAC AAAAAAC AATAAC AAGCCC ACCCTCTC TGAATATG ACTCTC TGAC TCTCTTG TGTTTC TTGTTTAC ATTTTATTG TGCG AATGTG ATTC TGCTTC TTAGCC TAGTGC ATTTGG ATTTG TTGTTC ACACTGAGC ATAA ATTGCC AAACAC TCAAC TTTAA TCTAA TTGTAC ATAC TATAAAC AGAAAA TGTTG ACG TTAAAAGC ATTTCC ATAATCAC AGATTGGG TGTATGG ATG AGCAAG TGGATG AGTT AGGCC TTTTG TCATC TCAGTCC ATAGC TTGATCC TTCAGG TATTC AAAAGGAAAC GGGG ACTGTC TTCCACTG ATGACC TCACTGATG ATGAGG TTCATC TGCC ACCATC TATAGTG AGTGAAAC TTTATGGTG TAGTTG TTAAGTCTC AAATTC AGAGAGAC TTAGG ATCAAATC TCACTCTGC TACTTTC TAGCTATG TGACC TTGGG AAAGCC ACATGG TGCC TTGAAG ACTC AGTCTCC TTAAC TATATT ATAAGAATAA TAATATT CCC TATGCC AAAGGG ATCCTGTG AGATAA TAACATC TTAATTG AGTTAA ATTATT TAAG AGTTAA ATGAGATAA TGGATAAAA ATCATGGC ACATTTTG AGCAC TTCATAA ATATTAATG ATAACG ATCC TTATTTAA ACGTGCCC TGCATTC TAAAAATG AGAAG TAACTTTC TGGC TGAAACC AACCCC TGAA TGGCAAC AGAGAA AGCTGTTTC AAC AGGGTTG AGAAAA AAGC TGGGGG ATAAAGTAA TGTTTC TAA TCTTAGAG TTTAAG AGAAAATAC ATTTTTT AATTC ACTTGG TAAATT AGAG ATCTTTT AGGGACACC AGAAG AAGGC ACTTTC TGAAAGAG TTAAAA TGATTTCC TTAGAG TAAACAA ATCTCTC TCATAGAA TTTTTGC TTAGAC TAAGTTG ATGGG ACATTC ATTAAG AAATAA ACTTTTC ATCC TCGC TTGGG TAATGC AACCAGGG AACG AGTAA ATATCCC GGG AAAGCC AACTTGC TATATGC AGGTAC TATT TCTTAAAA ATGTTATT TTTATC TATC AAAATAA TATT ACTGTTATT AAGTATC ATTG AGGTTC AATCC TGCG ACAGAA ACTGTAC TTAGC TATAGGG AATC AAATATG ATTGTGAC ATAGTTC TACCC TCAGGGG TTTTAAG TGGGAAG ATAGAA TATGCC ATTAAAAAAAA AGTAA TCCTTGGC ATGGAAGG TTAAATGCC TTATAAC TAAC TGATG ATTG ATAGC AGAAGAGTG ACTAA TTCTC ATCTAG AAAGAGAA GGCC TGGGC TCTAG TTTTGG TTCC ACCAC TTGTCAAG TTTGTAACC TAGGG AAATTC ACTTC AATCC TTTG AACTTTC AGTTTT TCAAAGG AAATGG AGATG ACG ATATT TGCCC TACC ATTCCC ATAAGG TTGCTGTG AGGTTC AAATG AGCTAAGG TTTACG AAAAC ACATAA TAAATTAC AGCAC TTCGG TGC TATTCC TTGGTGTG ATCATT TTCCTTCC TCTGCC TCCTC ATAGAC TGAGAC TCTC ATAAACTG TTTTATT TTCTG TCTCAGC TTATG AAATATC TGCAAG TTATATC ATTATG TGTGTGTG TGTATTG TGTGC ACATT ATCAAG TCTAA TCAAGCC AAAGC AGCAGAAC TAAACAC AGATATC TGGACTCC TAAAAATCC ACCAC TTAATCG TGAAG ACAAC ATTG TTAGAG AAGAAAAG ATATTC TCTAAGG TTGG ACCTATT TCAGAA ATG AGTAGC ATCACCC TTGCTTTAC AATGG AGAAAAC TGAG TATTG ATTTATTG AACAC TTATT TAATAA AGGTTTATG AAGAACCC ATCC TGCACC AGGGGCCC AGGTACC AAC TTAAAGAA TGTGAGTG AGAAAA ACAGGG AACTCAG TCCTGGC ATTGACC TTTGC TGTAAC TTCTGCTC ATTGTAGG AATCAGCC AACTTCC TGTCC TTTAG TTTCCTCTTC TGCAAAC TGAAG ATT AGTTAG TTGTAG AGCATAC AGTCAGTG TTATG TCTGAAAA TATTG AAATAC AGAGACAAAG TGAAAA AGAAGGG TATG AAACCCC TTTCC ATTAGAC TGTAAG AGGG ATGATG ATTGTTAC TTTTGGG AGTTATG AGCG TGGGC AGTGG AGAGAGTGG TTTGTTTG AGGATGCC ACGC TGAGC ATTGGG TGG ATGTGG AATTTGTG TGGGCAGGG AAGTAG AGAAGAGAG TTGGGGC AAGCTAAG ACTGCC AGCTTCC AGAC TGGAAGC TTCTGC GGTAG TTAC GGGG AATGAGTC AGGAAATAG TTCTGTG TAAATAG TTATG AAATTTTAA AGCTAA TTTTG TCATGGGCC AAAGGC ATTTTTT GGGG ATGATG AGAG ATATC AAATT TTGTGG ATGCGCC TACAAG TAGG TGATGG TTCTAC ACTGAAAG ATTTGCC ACTTTTC TTCACCC TAGAATG TTCATATTG TGCG TGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTG TGTATGG TTTCTTAG TGGACTGTG AGATATATT AAACATAG ATAAAAGG AATATT TAAC TAAAAG AGAAGC AACAGAA AGTTAA TCAAATAG TATCC AAGACAGG ACGG AAATGGGC TTTAGGGG AGTCC TGAGAGAA AGAGAAC TCAC ATTCATTG AGTTCG TGTG AATTGTTTC TGGGCCCC GGGC ACTGTC ATATCC ATG AAATAACC TTATTC TTGTCTTG AAAAGC TGTTCTC ATACAGATC TGAAAAC TAAGGCCC AGAGACAG TAAGC AGCTTC TGGGAATG ACTATG TTGTTG AGCTCAGG TTTGAGC TATGG AGGG TATGAAG TTATT TCCTC TTAGC AACTCC ATCACAGAC TCAAC ATGCTGGGC AAACTCAC TTTATC TTTAA AGAAC AGTCTC TATTTGC AAAGGAG AGAACC TGCTTCC ATACAC TTGGG ACTG TTAGAG TTGTC AGACG ATGTTACC AAAGC AAAGGC ACTTGAAC TTAGGCC AAGG TATATG TTTCTGTAG TCACCC TGTGG TAACTAC TGGGG TCAGC ATTTCAC AAAACC TAC TTACCC TGTTTAG TTAGG AAAACCC TAGAGG TGGGGG AGTGGG AGTGAGGG TCCCC AGTCCC ACTGTC ATTTGG AAAA ATGTCC AGATG AGAG TAGGC TGTCC ACTTCC TAGAGGC AAATC TTTCTGAA TCTAC ATAGTTTC ACAGAC TCACAGAAC TTCAGAGC TGAAG AGACC TTC AGATAG ATATTTTTC AGATAG ACCTTC AGATAGAC ATTTTGCC GC ACTGC TCAGTC TAGG TTAAC GGGAAGC TAGGGC AAGAATTC ACTT ATGGCCC TCCC TTCTTCC TGTATTC AGTATT TTCC TGTCTG TAAC ATTGGG TCCATG ATTAAGC TATTTAACC AGTTTC TGAA TTTGTAA TTTATG AAGCC AGGAAAA GGGC ATTTATC ACTTG AATCATCCC AGCAGCC TGTG TCAGAG TTAAGG AGGG AATTATT TTTTTTTC TAAAAATTC TGTTC TAGGC TATTTAAGG TCAC TCTAC TTGCC TCTTC TGGAGAG ACTCG TAC ATGCG TTGC TGATCCC TGGGC TGAG TTCTCCC AGCCC TAGTGAAC TCGG AAGTAC AGGTCC AGAAGG TTCTGC TTGATGG TTCCC ATCAGGG TAAAAC TGAAAA TAGG AAGCCG TTGGTTGC TGATTG TAAGATAA ATTTGTTTAAG TAG TGTGCC AAAAGC AGTGGG TCATATG AAAAGCC ACATG ACCAACC AGAAATAA TTGGAGC TTAAAAG ATGC TAGGG TCTATG AGTAAG ATTTC TTTCACC ATGGG ATTTAGG TAAGGC AAAC TCACCC ACTCAC TAGTTC TTAATTCCC ATTTTCTTTT TGTCC TGGAAC ATTTC ACCTGCCC TGATGC GGC AAATTAAG TGATTG AATTAA TAC AGAAATG TCAGCC TTTATTG ATGACAA TTAGG TGTTC ATATT ATTTCTG TTTTATT AATAA TTTATT TACC TATTCAAC AAATC TTTAAAGCC TACTGTG TGCTAG ATGTGG AGGAAG AAACAAG TAAC ACTTCC TCCG TGAC AGTTTT TCTAA TCCCTCTAG TGTAAATTC TCTCTCCC TTTCC TGAAAC TTAGTAG TTCTTTG TTTAT AGTTCTCC AATAG ATTTATGCC ATGTTGCC TTGTATTG TAGC AGCTTG AGAAC ATGTC TTACTATT TAGAAC TAAG ACAATTGC TTTAC AAGTATT TGTCTG TACCATG ATATTTAA AGTAG TGCTGGC ACAGAG TATG TTGTCAGTG TTGTGG AATAAATG ACTAA ATGAATATT TGTTG AATTAGG TAAGAAG TTGC TTCAGC TTTGGC TGTT ATGCTGC TGTAAC AAAC AGCTCCC AAATT TCAATAGC TCAG AACACAATG ATTTATT TCTC ATCTATG TTAA TGCCC ATAGTG AGTTAGG TGCAGC TCTGC TCCCC ATCTTC TGGATT TGGGG ATCTGGG TAG AAATAGCC ATT AGTTGGG ATTTTCTTG TGTTGGGG AACAAG AGAGATGGC AGAAACAC ATG ATAGATC AGAAG TGGCATTC ATTGGC TGGGCACGG TGGCTCACGCCTGTAATCCCAGCACTTTGGG AGGC ATAGGC AGGTGG ATCACC TGAGC TCAGGAG CCC AAGATC AGCC TGGCCAAC AATGG TGAAACCCCATCTCTACTAAAAATACAAAAATT AGCCAAGC ACGGTGGC AGGCACC TGTATC TCAGC TACTTGG AAGGCTGAGGC AAGAGAA TTGCTTGAACCC GGGAGGTGGAGG TTGCAGTG AGCTAAG ATTGCGC TACCACCC TCCACC TGAGC AGC AGAGCGAGAC TCTG TCAAAAAAC AAACAAACAAACAAAC AACATCAC TTCTGCTC AAATT TCG TTGGCCC AAACTAG TCATG TAGCC ACGCC TGCC GTGG AGGGC AGACAAGG ATAA TTCTCCC ATGAGAA AGGCC ATGAATC TTTGGG AATAA TAATAT AATTTACC AGAG AAGTCATCC TTATTTTTT AAAGAAC TTAAAA TTTAGTTG AGGAAG TAAGC TATACAC AAAGAAATAC AATAAAAAA AAGGTGC AAGC AACATG TTATAG AGGTGAGGG AGGAGAG ATTTCTTTGG ACTAAG ATTAGTCAC AGAAGG ATTAATAA AAGATG TGTTC TTTAA ATTGG ACATG AAAAGTAAG ATTTTGCC AAG TGGAAC TGGACAAG AGGTGAA TAGAAG AGTATT TAAAAAG ATATG AAGGTAC TCAAAC AAAA AATGTAC TAAAAAA AAGAGTG AAAAG TCCAC TTTTGG TGGATAA TTAGG TCCAC ATTTCAAAG TTGGG AATTTAG AGTCTATT AAGC AGGAAATT ATAA ACCACTAG AGATTTGG AAAGC TAAC TAAAGG ATGCAATGG AGAGAAGC TGAAAA TATTTTTG AGGC TATGC AAAGAG TTCAGG AAACAGGG ACTAA AGACAGAA TCAGAA TAG TGAAAAG TATG AACAGG ACAGAAC ATAC AGAGGC AAGATGC AAAGG AAATGTAC AAAGGTTG AAAACCG ATTGG TTTGG AAAGC AAAGG AGAGAGGC AGTG AAAGAAG TTGCAGATG ATTATTCC ATTAATGG TGGTGCC ATTAATGG AATTCAAAA AATAAG AAG AGGACTGAC TCATAGG AAGAGAAAA TAAGTTTTG TTTGAGG TATTC TGATTTC GAGG AATTTC AGAG AGAAATG TTTAG TAGGCG TATGG AACTCTGGG AATAG AGTTTG TGGGATTG TGGTTG TGATTG AAGATG TAGTCC TGAGGG ACCCC TGAAG AGGTGAC AGTTG AAGCC ATGAGTGC AGATG AGAATCCC AAAGG AAACTAG TGGCC AAAAGGC AGAG TCTTGG AGGGCTGCC AACATG TAGGATG TGGGAAG ATGAAG ACAAACC AGGGAGGG AAGCTGAAG AACC TTGAC AAGGCAGAG AGGAG AACAC TATAGTG TGGG ATCAAG TGAGC TGAGGC AGGAGAG AGGCTGAGG AGCAGGG AGAGG TCAGCGG TGTC AAATGC TTTAG AAAGTGC TAAG AAGATG AGAA TGTAGG AAGTGG TATTG AGGTTAGAG TAGG AGATC ATTGGC GATG AGTAAGG AAAC AACTTC AGTGAGG ACTGG AGATG TTCTTG TGAGATATC TGATAAC AAAAATTAC AGAGATTGC ATAA TGGAGG ATT AGTTGG AAC TGGTGG AAC TGAGAG TACGC TTAG TGCG ATAACC TTTGAAAAG AAGAGG AACC TATTCC ATTTGGGG AAGGC AGGAGAAAAC TATGC ACTAAG AGAG AACTTG TCCATG AGAAGG AGTG ATTTTTAAGG TGCTTC TTAAC AAAGTAG AGTTTAGGG AATGTATTC ACTC TTTGAAATT AAAAAGC AATTGC TTATTATTG AAAACCC AGGTTAGC TATT AAAAAAAAAAAA AGAGAAAA ATAAG ACAAAA AAAGAAAAAAAA ACCATGC ATGTGTAAC AAGTC AGGGGAAGC TGAGGAG ACCTTCC AAACTGTAC TGTATTC ACTTGC ATATATTCC ACATCTGGC ACTGGGC AGTC AAATATTC ACAGG TAATAA ATAGATATT AAAGAA TGTATT ATTGGGC ATTAGG ACTC ATAATTTT AGAAAAATG TTTTTTG TGGC TGGGCGTGG TGGCTCACTCC TGTAATCCCAGCACTTTGGG AGGCCAAGG AGAG TGGATC AGAAGG TCAGGAG ATCG ACAGCATCC TGGCCAACATGGTGAAACCCC G T [SEP]
,,,,


In [13]:
df = dataframe_creation(attributions_sum, all_tokens, 101086907, 1)
bed_file_creation(df, './67718')

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_neg['score']= df_neg['score']*mult*(-1)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df_pos['score']= df_pos['score']*mult
