In [1]:
# Third-party packages used by this notebook; uncomment the line below to
# install them when running on a fresh runtime.
#!pip install -qq transformers genomic-benchmarks datasets

In [2]:
### Parameters
import os

MODEL_NAME = "simecek/DNADeberta2" #DebertaSmall trained for 30 epochs
TOKENIZER_NAME = "armheb/DNA_bert_6"
K = 6        # k-mer length
STRIDE = K   # step between consecutive k-mers; only 1 and K have an implementation

# if less than 1, only this fraction of each dataset is used
DATASET_THINING = 1

# Benchmarks live in `.genomic_benchmarks` inside the current user's home
# directory: /root/.genomic_benchmarks when running as root, or
# /home/jovyan/.genomic_benchmarks on INFRA HUB. Deriving the path from the
# home directory covers both without editing this cell.
BENCHMARKS_FOLDER = os.path.join(os.path.expanduser('~'), '.genomic_benchmarks')

# (dataset name, dataset version) pairs to fine-tune on
DATASETS = [('demo_coding_vs_intergenomic_seqs', 0),
 ('demo_human_or_worm', 0), ('human_enhancers_cohn', 0), ('human_enhancers_ensembl', 0),
 ('human_ensembl_regulatory', 0), ('human_nontata_promoters', 0), ('human_ocr_ensembl', 0)]

BATCH_SIZE = 32
LEARNING_RATE = 8e-5
EPOCHS = 4
RUNS = 5     # number of independent fine-tuning runs per dataset

# do not forget to attach drive
OUTPUT_PATH = 'drive/MyDrive/genomic_benchmarks/DNADebertaSmall.csv'

## Download benchmark datasets and tokenizer

In [3]:
from genomic_benchmarks.loc2seq import download_dataset
from genomic_benchmarks.data_check.info import is_downloaded
from pathlib import Path
from tqdm.autonotebook import tqdm

# Folder the benchmark files are read from later on.
benchmark_root = Path(BENCHMARKS_FOLDER)

# Fetch every configured benchmark that is not available locally yet.
for dataset_name, dataset_version in tqdm(DATASETS):
    if is_downloaded(dataset_name):
        continue
    download_dataset(dataset_name, version=dataset_version)

  from tqdm.autonotebook import tqdm


  0%|          | 0/7 [00:00<?, ?it/s]

Downloading...
From: https://drive.google.com/uc?id=1cpXg0ULuTGF7h1_HTYvc6p8M-ee43t-v
To: /root/.genomic_benchmarks/demo_coding_vs_intergenomic_seqs.zip

  0%|          | 0.00/33.9M [00:00<?, ?B/s][A
100%|██████████| 33.9M/33.9M [00:00<00:00, 133MB/s] 
Downloading...
From: https://drive.google.com/uc?id=1JW0-eTB-rJXvFcglqBo3pFZi1kyIWC3X
To: /root/.genomic_benchmarks/demo_human_or_worm.zip

  0%|          | 0.00/28.9M [00:00<?, ?B/s][A
100%|██████████| 28.9M/28.9M [00:00<00:00, 169MB/s]
Downloading...
From: https://drive.google.com/uc?id=176563cDPQ5Y094WyoSBF02QjoVQhWuCh
To: /root/.genomic_benchmarks/human_enhancers_cohn.zip

  0%|          | 0.00/11.9M [00:00<?, ?B/s][A
100%|██████████| 11.9M/11.9M [00:00<00:00, 52.2MB/s]
Downloading...
From: https://drive.google.com/uc?id=1gZBEV_RGxJE8EON5OObdrp5Tp8JL0Fxb
To: /root/.genomic_benchmarks/human_enhancers_ensembl.zip

  0%|          | 0.00/51.1M [00:00<?, ?B/s][A
  9%|▉         | 4.72M/51.1M [00:00<00:02, 20.9MB/s][A
100%|██████████| 

In [4]:
from transformers import AutoTokenizer

# Load the pretrained tokenizer identified by TOKENIZER_NAME.
tokenizer = AutoTokenizer.from_pretrained(TOKENIZER_NAME)

Downloading:   0%|          | 0.00/40.0 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/1.08k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/28.0k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/112 [00:00<?, ?B/s]

In [5]:
def kmers_strideK(s, k=K):
    """Split `s` into consecutive, non-overlapping k-mers.

    Windows start at 0, k, 2k, ...; a trailing remainder shorter than `k`
    is dropped.
    """
    pieces = []
    for start in range(0, len(s), k):
        end = start + k
        if end <= len(s):
            pieces.append(s[start:end])
    return pieces

def kmers_stride1(s, k=K):
    """Return every overlapping k-mer of `s` (sliding window moved by one)."""
    n_windows = len(s) - k + 1
    windows = []
    for start in range(n_windows):
        windows.append(s[start:start + k])
    return windows

# Select the k-mer splitter that matches the configured STRIDE. Only strides
# 1 and K are implemented, so any other value is rejected instead of being
# silently treated as stride K.
if STRIDE == 1:
    kmers = kmers_stride1
elif STRIDE == K:
    kmers = kmers_strideK
else:
    raise ValueError(f"Unsupported STRIDE={STRIDE!r}: expected 1 or K={K!r}")

# function used for the actual tokenization
def tok_func(x):
    """Tokenize one record.

    The sequence in x["seq"] is split into k-mers, the k-mers are joined with
    single spaces, and the resulting string is passed to `tokenizer`.
    """
    kmer_list = kmers(x["seq"])
    sentence = " ".join(kmer_list)
    return tokenizer(sentence)

# example
tok_func({'seq': 'ATGGAAAGAGGCACCATTCT'})

{'input_ids': [2, 501, 835, 650, 3], 'token_type_ids': [0, 0, 0, 0, 0], 'attention_mask': [1, 1, 1, 1, 1]}

## Looping through datasets, fine-tuning the model for each of them, logging metrics

In [6]:
import pandas as pd
import numpy as np
from random import random, randrange
from transformers import AutoModelForSequenceClassification
from transformers import TrainingArguments, Trainer
from datasets import Dataset, DatasetDict, load_metric

def compute_metrics_binary(eval_preds):
    """Score predictions with the "glue"/"mrpc" metric.

    `eval_preds` unpacks into (logits, labels); the predicted class is the
    argmax of the logits over the last axis.
    """
    logits, labels = eval_preds
    predicted = np.argmax(logits, axis=-1)
    mrpc_metric = load_metric("glue", "mrpc")
    return mrpc_metric.compute(predictions=predicted, references=labels)

def compute_metrics_multi(eval_preds):
    """Score predictions with the "accuracy" metric.

    `eval_preds` unpacks into (logits, labels); the predicted class is the
    argmax of the logits over the last axis.
    """
    logits, labels = eval_preds
    predicted = np.argmax(logits, axis=-1)
    accuracy_metric = load_metric("accuracy")
    return accuracy_metric.compute(predictions=predicted, references=labels)

# One (dataset_name, max_accuracy, max_f1, train_runtime) tuple per fine-tuning run.
outputs = []

# With DATASET_THINING falsy or exactly 1 every sequence is kept; otherwise
# each sequence is kept independently with probability DATASET_THINING.
keep_all = not DATASET_THINING or DATASET_THINING == 1

for dataset_name, dataset_version in tqdm(DATASETS):

    dataset_dir = benchmark_root / dataset_name

    # Class names are the sub-folders of train/. Only directories are taken, so
    # stray files are not mistaken for classes, and the full folder name is
    # used because it is needed again below to build the per-class paths.
    # Sorting fixes the class -> integer id mapping.
    labels = sorted(x.name for x in (dataset_dir / 'train').iterdir() if x.is_dir())

    tmp_dict = {}

    for split in ['train', 'test']:
        for nlabel, label in enumerate(labels):
            for f in (dataset_dir / split / label).glob('*.txt'):
                if keep_all or random() < DATASET_THINING:
                    # The split is part of the key so that identical file names
                    # in train and test cannot overwrite each other.
                    tmp_dict[f"{split} {label} {f.stem}"] = (split, nlabel, f.read_text())

    # One row per sequence: split name, integer class id, raw sequence.
    df = pd.DataFrame.from_dict(tmp_dict).T.rename(columns = {0: "dset", 1: "cat", 2: "seq"})

    ds = Dataset.from_pandas(df)

    # Tokenize each sequence; the raw text and the pandas index column are dropped.
    tok_ds = ds.map(tok_func, batched=False, remove_columns=['__index_level_0__', 'seq'])
    tok_ds = tok_ds.rename_columns({'cat':'labels'})

    dds = DatasetDict({
        'train': tok_ds.filter(lambda x: x["dset"] == "train").remove_columns('dset'),
        'test':  tok_ds.filter(lambda x: x["dset"] == "test").remove_columns('dset')
    })

    # Two-class datasets use the binary metric function, all others the multi-class one.
    compute_metrics = compute_metrics_binary if len(labels) == 2 else compute_metrics_multi

    for _ in range(RUNS):

        # Every run starts again from the pretrained checkpoint.
        model_cls = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME, num_labels=len(labels))

        # A new random seed is drawn for each run.
        args = TrainingArguments('outputs', learning_rate=LEARNING_RATE, warmup_ratio=0.1, lr_scheduler_type='cosine', fp16=True,
            evaluation_strategy="epoch", per_device_train_batch_size=BATCH_SIZE, per_device_eval_batch_size=BATCH_SIZE*2,
            num_train_epochs=EPOCHS, weight_decay=0.01, save_steps=100000, report_to='none', seed=randrange(1,10001))

        trainer = Trainer(model_cls, args, train_dataset=dds['train'], eval_dataset=dds['test'],
                          tokenizer=tokenizer, compute_metrics=compute_metrics)
        trainer.train()

        # NOTE(review): the maxima below are taken over the per-epoch evaluations
        # on the test split, i.e. the best epoch is selected on test data.
        max_accuracy = max([x['eval_accuracy'] for x in trainer.state.log_history if 'eval_accuracy' in x])
        max_f1 = max([x['eval_f1'] for x in trainer.state.log_history if 'eval_f1' in x]) if len(labels) == 2 else np.nan
        train_runtime = max([x['train_runtime'] for x in trainer.state.log_history if 'train_runtime' in x])

        outputs.append((dataset_name, max_accuracy, max_f1, train_runtime))




  0%|          | 0/7 [00:00<?, ?it/s]



  0%|          | 0/100000 [00:00<?, ?ex/s]

  0%|          | 0/100 [00:00<?, ?ba/s]

  0%|          | 0/100 [00:00<?, ?ba/s]

Downloading:   0%|          | 0.00/704 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/178M [00:00<?, ?B/s]

Some weights of the model checkpoint at simecek/DNADeberta2 were not used when initializing DebertaForSequenceClassification: ['cls.predictions.transform.LayerNorm.bias', 'cls.predictions.decoder.bias', 'cls.predictions.decoder.weight', 'cls.predictions.bias', 'cls.predictions.transform.dense.bias', 'cls.predictions.transform.LayerNorm.weight', 'cls.predictions.transform.dense.weight']
- This IS expected if you are initializing DebertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing DebertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Some weights of DebertaForSequenceClassification were not initialized from the model checkpoint at simecek/DNADe

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.2496,0.274902,0.90892,0.906898
2,0.1884,0.241844,0.9116,0.909914
3,0.1256,0.253503,0.916,0.914987
4,0.0841,0.291718,0.92124,0.921432


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Downloading builder script:   0%|          | 0.00/1.84k [00:00<?, ?B/s]

***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.2482,0.23066,0.90592,0.90616
2,0.1935,0.233084,0.9196,0.920947
3,0.1131,0.242231,0.92172,0.922828
4,0.075,0.286372,0.92328,0.923329


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.2488,0.254195,0.90532,0.90612
2,0.1907,0.229334,0.91528,0.914438
3,0.1196,0.265294,0.9208,0.922322
4,0.0785,0.296843,0.92128,0.920983


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.2485,0.229064,0.91144,0.911149
2,0.181,0.221114,0.92128,0.92222
3,0.1194,0.258664,0.92228,0.922451
4,0.067,0.308995,0.92196,0.921901


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.2558,0.285462,0.90196,0.897082
2,0.1943,0.235917,0.91424,0.916569
3,0.1249,0.254168,0.92228,0.923495
4,0.0813,0.29139,0.92164,0.921949


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




  0%|          | 0/100000 [00:00<?, ?ex/s]

  0%|          | 0/100 [00:00<?, ?ba/s]

  0%|          | 0/100 [00:00<?, ?ba/s]

loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 0,
  "pooler_dropout": 0,
  "pooler_hidden_act": "gelu",
  "pooler_hidden_size": 768,
  "pos_att_type": null,
  "position_biased_input": true,
  "relative_attention": false,
  "torch_dtype": "float32",
  "transformers_version": "4.20.1

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.1818,0.171567,0.93212,0.929064
2,0.1448,0.159869,0.94176,0.942061
3,0.0784,0.187243,0.94644,0.945827
4,0.0434,0.206986,0.94724,0.947043


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.1962,0.233153,0.93596,0.934426
2,0.1414,0.153688,0.94204,0.941547
3,0.0794,0.178838,0.94592,0.945387
4,0.0456,0.203719,0.94764,0.947487


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.1915,0.188075,0.93144,0.928291
2,0.1303,0.171263,0.9422,0.942738
3,0.0795,0.179461,0.94576,0.945985
4,0.0435,0.209647,0.94576,0.945886


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.1789,0.184636,0.94132,0.941153
2,0.1358,0.189402,0.94436,0.944491
3,0.078,0.170827,0.94756,0.947301
4,0.0376,0.211498,0.94696,0.946977


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.1853,0.179087,0.935,0.935132
2,0.1361,0.155031,0.94468,0.944607
3,0.0747,0.18424,0.94708,0.947196
4,0.0385,0.220063,0.94672,0.94663


***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64
***** Running Evaluation *****
  Num examples = 25000
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




  0%|          | 0/27791 [00:00<?, ?ex/s]

  0%|          | 0/28 [00:00<?, ?ba/s]

  0%|          | 0/28 [00:00<?, ?ba/s]

loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 0,
  "pooler_dropout": 0,
  "pooler_hidden_act": "gelu",
  "pooler_hidden_size": 768,
  "pos_att_type": null,
  "position_biased_input": true,
  "relative_attention": false,
  "torch_dtype": "float32",
  "transformers_version": "4.20.1

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5707,0.546654,0.72179,0.716694
2,0.5145,0.562476,0.720783,0.733736
3,0.4331,0.605278,0.719056,0.726457
4,0.2086,0.817298,0.714018,0.718914


***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5693,0.558367,0.704519,0.662391
2,0.5097,0.545964,0.72251,0.732594
3,0.4439,0.633791,0.714306,0.715494
4,0.2232,0.79863,0.708837,0.714387


***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5795,0.569647,0.7192,0.71439
2,0.5152,0.566718,0.711572,0.737971
3,0.4429,0.646737,0.715026,0.731343
4,0.2377,0.795977,0.712003,0.718526


***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5787,0.566443,0.695164,0.746953
2,0.5004,0.581057,0.720207,0.700831
3,0.437,0.679821,0.717329,0.728954
4,0.2073,0.835557,0.713155,0.715651


***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5755,0.552271,0.705815,0.744819
2,0.5155,0.576543,0.717904,0.708333
3,0.4491,0.661373,0.714594,0.724315
4,0.2307,0.810464,0.707542,0.711035


***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64
***** Running Evaluation *****
  Num examples = 6948
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




  0%|          | 0/123872 [00:00<?, ?ex/s]

  0%|          | 0/124 [00:00<?, ?ba/s]

  0%|          | 0/124 [00:00<?, ?ba/s]

loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 0,
  "pooler_dropout": 0,
  "pooler_hidden_act": "gelu",
  "pooler_hidden_size": 768,
  "pos_att_type": null,
  "position_biased_input": true,
  "relative_attention": false,
  "torch_dtype": "float32",
  "transformers_version": "4.20.1

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4403,0.436928,0.799613,0.819813
2,0.3491,0.38561,0.832967,0.827928
3,0.2102,0.410586,0.856151,0.860165
4,0.1095,0.514475,0.859057,0.86268


***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4288,0.406576,0.816242,0.820434
2,0.3433,0.380862,0.837262,0.8443
3,0.2171,0.39164,0.856183,0.857308
4,0.1122,0.522764,0.856248,0.860631


***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4323,0.406869,0.815531,0.822869
2,0.3466,0.392856,0.835034,0.831891
3,0.2142,0.419164,0.849629,0.855655
4,0.1191,0.521445,0.855893,0.859305


***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4359,0.414115,0.818082,0.818258
2,0.3516,0.367747,0.838909,0.838903
3,0.207,0.408807,0.854924,0.855022
4,0.1153,0.524112,0.857798,0.861352


***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4347,0.409562,0.813529,0.821379
2,0.3447,0.378843,0.839361,0.837285
3,0.2066,0.376809,0.85896,0.85955
4,0.1226,0.511397,0.858767,0.86285


***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64
***** Running Evaluation *****
  Num examples = 30970
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




  0%|          | 0/231348 [00:00<?, ?ex/s]

  0%|          | 0/232 [00:00<?, ?ba/s]

  0%|          | 0/232 [00:00<?, ?ba/s]

loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_2": 2
  },
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 0,
  "pooler_dropout": 0,
  "pooler_hidden_act": "gelu",
  "pooler_hidden_size": 

Epoch,Training Loss,Validation Loss,Accuracy
1,0.2538,0.252627,0.909189
2,0.2322,0.236055,0.912169
3,0.206,0.24368,0.910991
4,0.1788,0.265509,0.908426


***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64


Downloading builder script:   0%|          | 0.00/1.65k [00:00<?, ?B/s]

***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1

Epoch,Training Loss,Validation Loss,Accuracy
1,0.2415,0.247953,0.910523
2,0.2258,0.236542,0.908374
3,0.206,0.239453,0.911095
4,0.1838,0.264993,0.907768


***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "

Epoch,Training Loss,Validation Loss,Accuracy
1,0.2459,0.248227,0.909085
2,0.2263,0.266836,0.903886
3,0.1982,0.251565,0.910246
4,0.1703,0.27749,0.906451


***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "

Epoch,Training Loss,Validation Loss,Accuracy
1,0.254,0.245608,0.910731
2,0.2252,0.246663,0.908981
3,0.1998,0.253547,0.907577
4,0.1837,0.265639,0.907491


***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "id2label": {
    "0": "LABEL_0",
    "1": "LABEL_1",
    "2": "LABEL_2"
  },
  "initializer_range": 0.02,
  "

Epoch,Training Loss,Validation Loss,Accuracy
1,0.2467,0.237024,0.910038
2,0.2377,0.237873,0.90808
3,0.2061,0.255706,0.911008
4,0.1843,0.270093,0.908738


***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64
***** Running Evaluation *****
  Num examples = 57713
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




  0%|          | 0/36131 [00:00<?, ?ex/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

  0%|          | 0/37 [00:00<?, ?ba/s]

loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 0,
  "pooler_dropout": 0,
  "pooler_hidden_act": "gelu",
  "pooler_hidden_size": 768,
  "pos_att_type": null,
  "position_biased_input": true,
  "relative_attention": false,
  "torch_dtype": "float32",
  "transformers_version": "4.20.1

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4185,0.33077,0.87547,0.87868
2,0.2442,0.31204,0.875913,0.888469
3,0.1421,0.326835,0.888975,0.89551
4,0.078,0.44965,0.887204,0.895946


***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.42,0.312261,0.865729,0.873157
2,0.2693,0.295829,0.880341,0.890885
3,0.1756,0.304966,0.890635,0.898354
4,0.1139,0.374522,0.890082,0.898642


***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4111,0.319148,0.874696,0.886185
2,0.2549,0.296505,0.883994,0.886849
3,0.1423,0.305077,0.893735,0.900083
4,0.086,0.405583,0.888089,0.896531


***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4206,0.378005,0.816028,0.847355
2,0.2659,0.324672,0.881669,0.892875
3,0.1679,0.32354,0.888311,0.896247
4,0.1043,0.397501,0.889196,0.897217


***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 51

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.4176,0.302508,0.876024,0.880699
2,0.257,0.271242,0.887093,0.889968
3,0.149,0.320363,0.891964,0.89886
4,0.0868,0.418245,0.890525,0.898073


***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64
***** Running Evaluation *****
  Num examples = 9034
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




  0%|          | 0/139804 [00:00<?, ?ex/s]

  0%|          | 0/140 [00:00<?, ?ba/s]

  0%|          | 0/140 [00:00<?, ?ba/s]

loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings": 512,
  "max_relative_positions": -1,
  "model_type": "deberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 0,
  "pooler_dropout": 0,
  "pooler_hidden_act": "gelu",
  "pooler_hidden_size": 768,
  "pos_att_type": null,
  "position_biased_input": true,
  "relative_attention": false,
  "torch_dtype": "float32",
  "transformers_version": "4.20.1

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5668,0.547972,0.717126,0.723154
2,0.5042,0.534007,0.725853,0.726009
3,0.3923,0.611526,0.722333,0.714366
4,0.284,0.727793,0.719959,0.719718


***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5684,0.586724,0.703679,0.680428
2,0.4979,0.554899,0.722333,0.7291
3,0.3994,0.593006,0.725738,0.724604
4,0.2771,0.718765,0.721675,0.719929


***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5722,0.560723,0.709058,0.731682
2,0.5147,0.540454,0.727255,0.727559
3,0.4026,0.571875,0.727226,0.733225
4,0.2899,0.687319,0.723478,0.727815


***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5745,0.551974,0.717327,0.708417
2,0.4999,0.567157,0.717527,0.690201
3,0.3841,0.606409,0.722362,0.706952
4,0.2621,0.720666,0.72282,0.721913


***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)


loading configuration file https://huggingface.co/simecek/DNADeberta2/resolve/main/config.json from cache at /root/.cache/huggingface/transformers/eaa84554db67bd0bd1237534157006a6e5a26745104c342ca1a8117c146aa517.c7f87ccb839059561ef6996c9f8559644ce254107c992b74bd0b46fbe8c80d51
Model config DebertaConfig {
  "_name_or_path": "simecek/DNADeberta2",
  "architectures": [
    "DebertaForMaskedLM"
  ],
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_range": 0.02,
  "intermediate_size": 3072,
  "layer_norm_eps": 1e-07,
  "max_position_embeddings"

Epoch,Training Loss,Validation Loss,Accuracy,F1
1,0.5717,0.587351,0.699617,0.72698
2,0.5068,0.554235,0.721332,0.718204
3,0.3904,0.597719,0.726825,0.729196
4,0.2804,0.705646,0.724279,0.725575


***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64
***** Running Evaluation *****
  Num examples = 34952
  Batch size = 64


Training completed. Do not forget to share your model on huggingface.co/models =)




## Outputs

In [7]:
# Turn the collected result records into a table with named columns.
# `outputs` is filled in by an earlier cell (not shown here); presumably each
# record carries these four fields in this order -- verify against that cell.
outputs_df = pd.DataFrame(
    data=outputs,
    columns=[
        'dataset',
        'accuracy',
        'f1',
        'train_runtime',
    ],
)
outputs_df

Unnamed: 0,dataset,accuracy,f1,train_runtime
0,demo_coding_vs_intergenomic_seqs,0.92124,0.921432,537.8861
1,demo_coding_vs_intergenomic_seqs,0.92328,0.923329,540.8948
2,demo_coding_vs_intergenomic_seqs,0.92128,0.922322,534.4755
3,demo_coding_vs_intergenomic_seqs,0.92228,0.922451,527.3855
4,demo_coding_vs_intergenomic_seqs,0.92228,0.923495,525.9056
5,demo_human_or_worm,0.94724,0.947043,528.9461
6,demo_human_or_worm,0.94764,0.947487,529.3401
7,demo_human_or_worm,0.94576,0.945985,532.4752
8,demo_human_or_worm,0.94756,0.947301,528.2359
9,demo_human_or_worm,0.94708,0.947196,529.8365


In [8]:
# Per-dataset summary: mean and standard error of the mean ('sem') of every
# reported column, computed across the rows that share a dataset name.
outputs_df.groupby('dataset').agg(
    {metric: ['mean', 'sem'] for metric in ('accuracy', 'f1', 'train_runtime')}
)

Unnamed: 0_level_0,accuracy,accuracy,f1,f1,train_runtime,train_runtime
Unnamed: 0_level_1,mean,sem,mean,sem,mean,sem
dataset,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2
demo_coding_vs_intergenomic_seqs,0.922072,0.000379,0.922606,0.000374,533.3095,2.913358
demo_human_or_worm,0.947056,0.00034,0.947002,0.000264,529.76676,0.725933
human_enhancers_cohn,0.720322,0.000838,0.739215,0.002887,172.3664,1.177469
human_enhancers_ensembl,0.857591,0.000662,0.861363,0.00066,757.75812,6.871512
human_ensembl_regulatory,0.91105,0.000317,,,1798.63176,8.539986
human_nontata_promoters,0.890901,0.00089,0.89815,0.000715,186.04308,0.531168
human_ocr_ensembl,0.725698,0.000775,0.727889,0.001883,840.8682,1.99188


In [9]:
# Save the per-run results table to OUTPUT_PATH as CSV (index column omitted).
#
# DataFrame.to_csv does not create missing directories, so make sure the target
# folder exists before writing; otherwise the export fails at the very last
# step of the run. Only the last directory level is created (no parents=True):
# if the levels above it are missing as well (e.g. the drive is not attached),
# mkdir still raises instead of silently writing the file somewhere unintended.
Path(OUTPUT_PATH).parent.mkdir(exist_ok=True)
outputs_df.to_csv(OUTPUT_PATH, index=False)