In [1]:
import os
import traceback

import torch

from transformers import set_seed

# NOTE(review): the star import is kept first so the explicit imports below still
# take precedence over any same-named symbols it may bring in.
from functions import *
from utils.telegram import sendMessage

from config import get_model_config
from functions import get_roberta_finetuned_results

In [2]:
# Set the TOKENIZERS_PARALLELISM switch to 'false' for this process
# (presumably to silence the tokenizers fork/parallelism warning — confirm).
os.environ['TOKENIZERS_PARALLELISM'] = 'false'

# Single source of truth for the seed so the seeding calls below cannot drift apart.
SEED = 42

# Seed through transformers' helper, then explicitly seed the current CUDA
# device and all CUDA devices.
set_seed(SEED)
torch.cuda.manual_seed(SEED)
torch.cuda.manual_seed_all(SEED)

# Request deterministic cuDNN algorithms and switch off the cuDNN autotuner,
# which could otherwise pick different kernels from run to run.
torch.backends.cudnn.deterministic = True
torch.backends.cudnn.benchmark = False

# Use the GPU when one is visible to PyTorch, otherwise fall back to the CPU.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

In [3]:
# Dataset names to process, in run order. Each name is handed to the model-config
# lookup and the prediction helper, and is embedded in the output file name.
datasets = [
    'btc_news', 'eth_news',
    'reddit_r_bitcoin', 'reddit_r_ethereum',
    'btc_tweets', 'eth_tweets',
]

In [4]:
# Folder (relative to the working directory) under which the prediction loop
# stores its parquet files.
directory = 'results'

# exist_ok=True makes the call a no-op when the folder is already there and
# removes the gap between a separate existence check and the creation. If the
# path exists but is not a directory this raises immediately instead of failing
# later when the first result is written.
os.makedirs(directory, exist_ok=True)

In [None]:
def _notify(message):
    """Send a Telegram status message without letting a delivery failure stop the run.

    Any exception raised by ``sendMessage`` is printed to the notebook output
    and otherwise ignored, so the remaining datasets are still processed.
    """
    try:
        sendMessage(message)
    except Exception as notify_error:
        # Notifications are best-effort: report locally and carry on.
        print(f'Could not send notification: {notify_error!r}')


# Compute and store predictions for every configured dataset. A failure on one
# dataset is reported (notebook output + Telegram) and the loop continues with
# the next one.
for DATASET_NAME in datasets:

    print(f'\nCalculating predictions on {DATASET_NAME} dataset\n')

    try:
        model_config = get_model_config(DATASET_NAME)
        predictions = get_roberta_finetuned_results(DATASET_NAME, **model_config)
        # Write into the folder prepared earlier in the notebook rather than a
        # second hard-coded copy of its name.
        predictions.to_parquet(
            f'{directory}/{DATASET_NAME}_roberta_finetuned.parquet.gzip',
            compression='gzip',
        )
    except Exception as e:
        # Keep the full traceback in the notebook output; the Telegram message
        # only carries str(e), which can be empty or ambiguous.
        traceback.print_exc()
        _notify(f'RoBERTa {DATASET_NAME} prediction calculation returned error: {e} \U0001F614')
    else:
        # Reported outside the try body so a notification problem is never
        # mistaken for a failed prediction run.
        _notify(f'RoBERTa {DATASET_NAME} predictions successfully calculated and saved. \U0001F389')
