In [1]:
from __future__ import absolute_import, division, print_function

import argparse
import sys
import csv
import logging
import os
import random
import sys

import numpy as np
import torch
from torch.utils.data import (DataLoader, RandomSampler, SequentialSampler,
                              TensorDataset)
from torch.utils.data.distributed import DistributedSampler
from tqdm import tqdm, trange
from transformers import BertForSequenceClassification, BertConfig,BertTokenizer
from transformers import LongformerForSequenceClassification, LongformerConfig,LongformerTokenizer

from transformers import BigBirdForSequenceClassification, BigBirdConfig,BigBirdTokenizer

from sklearn.metrics import classification_report

import random

csv.field_size_limit(sys.maxsize)
logging.basicConfig(format = '%(asctime)s - %(levelname)s - %(name)s -   %(message)s',
                    datefmt = '%m/%d/%Y %H:%M:%S',
                    level = logging.INFO)
logger = logging.getLogger(__name__)



In [2]:
class InputExample(object):
    """A single training/test example for simple sequence classification."""

    def __init__(self, guid, text_a, text_b=None, label=None):
        """Constructs a InputExample.
        Args:
            guid: Unique id for the example.
            text_a: string. The untokenized text of the first sequence. For single
            sequence tasks, only this sequence must be specified.
            text_b: (Optional) string. The untokenized text of the second sequence.
            Only must be specified for sequence pair tasks.
            label: (Optional) string. The label of the example. This should be
            specified for train and dev examples, but not for test examples.
        """
        self.guid = guid
        self.text_a = text_a
        self.text_b = text_b
        self.label = label

In [3]:
class InputFeatures(object):
    """A single set of features of data."""

    def __init__(self, input_ids, input_mask, segment_ids, label_id):
        self.input_ids = input_ids
        self.input_mask = input_mask
        self.segment_ids = segment_ids
        self.label_id = label_id

In [4]:
class DataProcessor(object):
    """Base class for data converters for sequence classification data sets."""

    def get_train_examples(self, data_dir):
        """Gets a collection of `InputExample`s for the train set."""
        raise NotImplementedError()

    def get_dev_examples(self, data_dir):
        """Gets a collection of `InputExample`s for the dev set."""
        raise NotImplementedError()

    def get_labels(self):
        """Gets the list of labels for this data set."""
        raise NotImplementedError()

    @classmethod
    def _read_tsv(cls, input_file, quotechar=None):
        """Reads a tab separated value file."""
        with open(input_file, "r") as f:
            reader = csv.reader(f, delimiter="\t", quotechar=quotechar)
            lines = []
            for line in reader:
                if sys.version_info[0] == 2:
                    line = list(unicode(cell, 'utf-8') for cell in line)
                lines.append(line)
            return lines

In [5]:
def get_tp_fp_fn(logits, labels):
    assert labels.shape[1] == 1
    labels = labels.squeeze()
    predictions = np.argmax(logits, axis=1)
    labels, predictions = labels.astype(int), predictions.astype(int)
    tp = np.sum(np.logical_and(predictions == 1, labels == 1))
    fp = np.sum(np.logical_and(predictions == 1, labels == 0))
    fn = np.sum(np.logical_and(predictions == 0, labels == 1))
    return tp, fp, fn

def compute_metrics(tp, fp, fn):
  precision = tp / (tp + fp + np.finfo(float).eps)
  recall = tp / (tp + fn + np.finfo(float).eps)
  f1 = 2 * precision * recall / (precision + recall + np.finfo(float).eps)
  return precision, recall, f1

class CLPsychProcessor(DataProcessor):
    """Processor for the CLPsych data set."""

    def get_train_examples(self, data_dir):
        """See base class."""
        return self._create_examples(
            # self._read_tsv(os.path.join(data_dir, "User_Posts_Processed_Train_Final.tsv")), "train")
            self._read_tsv(os.path.join(data_dir, "User_Posts_Processed_Train_Final.tsv")), "train")

    def get_dev_examples(self, data_dir):
        """See base class."""
        return self._create_examples(
            # self._read_tsv(os.path.join(data_dir, "User_Posts_Processed_Dev_Final.tsv")), "dev")
            self._read_tsv(os.path.join(data_dir, "User_Posts_Processed_Dev_Final.tsv")), "dev")


    def get_test_examples(self, data_dir):
        """See base class."""
        return self._create_examples_test(
            # self._read_tsv(os.path.join(data_dir, "User_Posts_Processed_Test_Final.tsv")), "test")
            self._read_tsv(os.path.join(data_dir, "Full_Test_Data.tsv")), "test")


    def get_labels(self):
        """See base class."""
        return ["a", "b", "c", "d"]

    def _create_examples_test(self, lines, set_type):
        """Creates examples for the training and dev sets."""
        examples = []
        random.seed(9001)
        req = list()
        for i in range(0, len(lines)):
            req.append(i)
        req_final = random.sample(req, len(lines))
        for i in req_final:
            if i == 0:
                continue
            guid = lines[i][0]
            text_a = lines[i][1]
            text_b = None
            examples.append(
                InputExample(guid=guid, text_a=text_a, text_b=text_b))
        return examples

    def _create_examples(self, lines, set_type):
        """Creates examples for the training and dev sets."""
        examples = []
        random.seed(9001)
        req = list()
        for i in range(0, len(lines)):
            req.append(i)
        req_final = random.sample(req, len(lines))	
        for i in req_final:
            if i == 0:
                continue
            guid = lines[i][0]
            text_a = lines[i][1]
            text_b = None
            label = lines[i][2]
            examples.append(
                InputExample(guid=guid, text_a=text_a, text_b=text_b, label=label))
        return examples
         

In [6]:
def convert_examples_to_features(examples, label_list, max_seq_length, tokenizer):
    """Loads a data file into a list of `InputBatch`s."""

    label_map = {label : i for i, label in enumerate(label_list)}

    features = []
    for (ex_index, example) in enumerate(examples):
        tokens_a = tokenizer.tokenize(example.text_a)

        tokens_b = None
        if example.text_b:
            tokens_b = tokenizer.tokenize(example.text_b)
            # Modifies `tokens_a` and `tokens_b` in place so that the total
            # length is less than the specified length.
            # Account for [CLS], [SEP], [SEP] with "- 3"
            _truncate_seq_pair(tokens_a, tokens_b, max_seq_length - 3)
        else:
            # Account for [CLS] and [SEP] with "- 2"
            if len(tokens_a) > max_seq_length - 2:
                tokens_a = tokens_a[:(max_seq_length - 2)]

        # The convention in BERT is:
        # (a) For sequence pairs:
        #  tokens:   [CLS] is this jack ##son ##ville ? [SEP] no it is not . [SEP]
        #  type_ids: 0   0  0    0    0     0       0 0    1  1  1  1   1 1
        # (b) For single sequences:
        #  tokens:   [CLS] the dog is hairy . [SEP]
        #  type_ids: 0   0   0   0  0     0 0
        #
        # Where "type_ids" are used to indicate whether this is the first
        # sequence or the second sequence. The embedding vectors for `type=0` and
        # `type=1` were learned during pre-training and are added to the wordpiece
        # embedding vector (and position vector). This is not *strictly* necessary
        # since the [SEP] token unambigiously separates the sequences, but it makes
        # it easier for the model to learn the concept of sequences.
        #
        # For classification tasks, the first vector (corresponding to [CLS]) is
        # used as as the "sentence vector". Note that this only makes sense because
        # the entire model is fine-tuned.
        tokens = ["[CLS]"] + tokens_a + ["[SEP]"]
        segment_ids = [0] * len(tokens)

        if tokens_b:
            tokens += tokens_b + ["[SEP]"]
            segment_ids += [1] * (len(tokens_b) + 1)

        input_ids = tokenizer.convert_tokens_to_ids(tokens)

        # The mask has 1 for real tokens and 0 for padding tokens. Only real
        # tokens are attended to.
        input_mask = [1] * len(input_ids)

        # Zero-pad up to the sequence length.
        padding = [0] * (max_seq_length - len(input_ids))
        input_ids += padding
        input_mask += padding
        segment_ids += padding

        assert len(input_ids) == max_seq_length
        assert len(input_mask) == max_seq_length
        assert len(segment_ids) == max_seq_length

        label_id = None
        if(example.label is not None):
            label_id = label_map[example.label]
        #if ex_index < 5:
        #    logger.info("*** Example ***")
        #    logger.info("guid: %s" % (example.guid))
        #    logger.info("tokens: %s" % " ".join(
        #            [str(x) for x in tokens]))
        #    logger.info("input_ids: %s" % " ".join([str(x) for x in input_ids]))
        #    logger.info("input_mask: %s" % " ".join([str(x) for x in input_mask]))
        #    logger.info(
        #            "segment_ids: %s" % " ".join([str(x) for x in segment_ids]))
        #    logger.info("label: %s (id = %d)" % (example.label, label_id))

        features.append(
                InputFeatures(input_ids=input_ids,
                              input_mask=input_mask,
                              segment_ids=segment_ids,
                              label_id=label_id))
    return features

In [7]:
def _truncate_seq_pair(tokens_a, tokens_b, max_length):
    """Truncates a sequence pair in place to the maximum length."""

    # This is a simple heuristic which will always truncate the longer sequence
    # one token at a time. This makes more sense than truncating an equal percent
    # of tokens from each, since if one sequence is very short then each token
    # that's truncated likely contains more information than a longer sequence.
    while True:
        total_length = len(tokens_a) + len(tokens_b)
        if total_length <= max_length:
            break
        if len(tokens_a) > len(tokens_b):
            tokens_a.pop()
        else:
            tokens_b.pop()

In [8]:
def accuracy(out, labels):
    outputs = np.argmax(out, axis=-1)
    pred.extend(outputs)
    true.extend(labels)
    return np.sum(outputs == labels)


In [9]:
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
n_gpu = torch.cuda.device_count()
logger.info("device: {} n_gpu: {}, distributed training: {}, 16-bits training: {}".format(
    device, n_gpu, False, False))

05/22/2022 00:25:03 - INFO - __main__ -   device: cuda n_gpu: 1, distributed training: False, 16-bits training: False


In [10]:
seed = 42
random.seed(seed)
np.random.seed(seed)
torch.manual_seed(seed)
torch.cuda.manual_seed_all(seed)

# training

In [11]:
from transformers import LongformerTokenizer as tokenizer
tokenizer = tokenizer.from_pretrained('allenai/longformer-base-4096', do_lower_case=True)

In [12]:
train_examples = None
num_train_optimization_steps = None
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/task_a'
batch_size = 16
epochs = 75
max_seq_length = 384

processor = CLPsychProcessor()

train_examples = processor.get_train_examples(data_dir)
validation_examples = processor.get_dev_examples(data_dir)

num_train_optimization_steps = int(
    len(train_examples) / batch_size ) * epochs
        

In [13]:
optimizer = AdamW(model.parameters(),
                  lr = 2e-5, 
                  eps = 1e-8 
                )

NameError: name 'AdamW' is not defined

In [None]:
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

train_features = convert_examples_to_features(
    train_examples, label_list, max_seq_length, tokenizer)
logger.info("***** Running training *****")
logger.info("  Num examples = %d", len(train_examples))
logger.info("  Batch size = %d", batch_size)
logger.info("  Num steps = %d", num_train_optimization_steps)
all_input_ids = torch.tensor([f.input_ids for f in train_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in train_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in train_features], dtype=torch.long)
all_label_ids = torch.tensor([f.label_id for f in train_features], dtype=torch.long)
train_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)

In [15]:
train_sampler = RandomSampler(train_data)
train_dataloader = DataLoader(train_data, sampler=train_sampler, batch_size=batch_size)

In [16]:
# Total number of training steps is number of batches * number of epochs.
total_steps = len(train_dataloader) * epochs

# Create the learning rate scheduler.
scheduler = get_linear_schedule_with_warmup(optimizer, 
                                            num_warmup_steps = 0, # Default value in run_glue.py
                                            num_training_steps = total_steps)
scheduler

NameError: name 'get_linear_schedule_with_warmup' is not defined

In [15]:
for ep in trange(int(epochs), desc="Epoch"):
    model.train()
    tr_loss = 0
    nb_tr_examples, nb_tr_steps = 0, 0
    for step, batch in enumerate(train_dataloader):
        batch = tuple(t.to(device) for t in batch)
        input_ids, input_mask, segment_ids, label_ids = batch
        outputs = model(input_ids, 
            token_type_ids=None, 
            attention_mask=input_mask, 
            labels=label_ids)

        # The call to `model` always returns a tuple, so we need to pull the 
        # loss value out of the tuple.
        loss = outputs[0]

        # Accumulate the training loss over all of the batches so that we can
        # calculate the average loss at the end. `loss` is a Tensor containing a
        # single value; the `.item()` function just returns the Python value 
        # from the tensor.

        tr_loss += loss.item()
        loss.backward()
        torch.nn.utils.clip_grad_norm_(model.parameters(), 1.0)
        nb_tr_examples += input_ids.size(0)
        nb_tr_steps += 1
        
        optimizer.step()
        scheduler.step()
        global_step += 1

    eval_examples = processor.get_dev_examples(data_dir)
    eval_features = convert_examples_to_features(
        eval_examples, label_list, max_seq_length, tokenizer)
    print("\n")
    print("Running evaluation for epoch: {}".format(ep))
    all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
    all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
    all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
    all_label_ids = torch.tensor([f.label_id for f in eval_features], dtype=torch.long)
    eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
    
    # Run prediction for full data
    eval_sampler = SequentialSampler(eval_data)
    eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)

    model.eval()
    eval_loss, eval_accuracy = 0, 0
    nb_eval_steps, nb_eval_examples = 0, 0

    for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
        input_ids = input_ids.to(device)
        input_mask = input_mask.to(device)
        segment_ids = segment_ids.to(device)
        label_ids = label_ids.to(device)

        with torch.no_grad():
            outputs = model(input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask)

        # Get the "logits" output by the model. The "logits" are the output
        # values prior to applying an activation function like the softmax.
        logits = outputs[0]

        # Move logits and labels to CPU
        logits = logits.detach().cpu().numpy()
        label_ids = label_ids.to('cpu').numpy()
        tmp_eval_accuracy = accuracy(logits, label_ids)

        eval_accuracy += tmp_eval_accuracy

        nb_eval_examples += input_ids.size(0)
        nb_eval_steps += 1

    eval_accuracy = eval_accuracy / nb_eval_examples
    loss = tr_loss/nb_tr_steps
    result = {'eval_accuracy': eval_accuracy,
              'global_step': global_step,
              'loss': loss}

    for key in sorted(result.keys()):
        print(key, str(result[key]))
    print()

Epoch:   0%|          | 0/75 [00:00<?, ?it/s]


NameError: name 'train_dataloader' is not defined

In [27]:
pred = list()
true = list()
eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()
for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)


model.eval()

eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)

    with torch.no_grad():
        outputs = model(input_ids, 
                        token_type_ids=None, 
                        attention_mask=input_mask)

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    logits = outputs[0]

    # Move logits and labels to CPU
    logits = logits.detach().cpu().numpy()
    
    outputs = np.argmax(logits, axis=1)
    complete_logits.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1
    
eval_accuracy = eval_accuracy / nb_eval_examples
loss = tr_loss/nb_tr_steps
result = {'eval_accuracy': eval_accuracy,
          'global_step': global_step,
          'loss': loss}
#     with torch.no_grad():
#         tmp_eval_loss = model(input_ids, segment_ids, input_mask, label_ids)
#         logits = model(input_ids, segment_ids, input_mask)

#     logits = logits.detach().cpu().numpy()
#     outputs = np.argmax(logits, axis=1)
#     complete_outputs.extend(outputs)
#     label_ids = label_ids.to('cpu').numpy()
#     complete_label_ids.extend(label_ids)
#     tmp_eval_accuracy = accuracy(logits, label_ids)

#     eval_loss += tmp_eval_loss.mean().item()
#     eval_accuracy += tmp_eval_accuracy

#     nb_eval_examples += input_ids.size(0)
#     nb_eval_steps += 1



for i in range(len(complete_logits)):
    print(complete_outputs[i], complete_logits[i])

02/22/2022 23:47:47 - INFO - __main__ -   ***** Running evaluation *****
02/22/2022 23:47:47 - INFO - __main__ -     Num examples = 125
02/22/2022 23:47:47 - INFO - __main__ -     Batch size = 16


RuntimeError: CUDA error: device-side assert triggered
CUDA kernel errors might be asynchronously reported at some other API call,so the stacktrace below might be incorrect.
For debugging consider passing CUDA_LAUNCH_BLOCKING=1.

In [26]:
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/longformer_1024"


In [None]:
model_to_save = model.module if hasattr(model, 'module') else model  # Only save the model it-self
output_model_file = os.path.join(output_dir, "longformer.bin")
torch.save(model_to_save.state_dict(), output_model_file)
output_config_file = os.path.join(output_dir, "config.json")
with open(output_config_file, 'w') as f:
    f.write(model_to_save.config.to_json_string())	

In [None]:
output_file = os.path.join(output_dir, "longformer_a.csv")
outcsv = open(output_file,'w', encoding = 'utf8', newline='')
writer = csv.writer(outcsv,quotechar = '"')
writer.writerow(["User","results"])
for user,pred in zip(complete_user_ids, complete_outputs):
    writer.writerow([user,pred])
outcsv.close()

In [24]:
from pytorch_pretrained_bert.modeling import BertForSequenceClassification, BertConfig
# output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/01022022_expert_1000"
output_model_file = os.path.join(output_dir, "pytorch_model.bin")
output_config_file = os.path.join(output_dir, "config.json")
config = BertConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model = BertForSequenceClassification.from_pretrained("bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model.to(device)

02/02/2022 12:40:46 - INFO - pytorch_pretrained_bert.modeling -   Better speed can be achieved with apex installed from https://www.github.com/nvidia/apex .
02/02/2022 12:40:50 - INFO - pytorch_pretrained_bert.modeling -   loading archive file https://s3.amazonaws.com/models.huggingface.co/bert/bert-base-uncased.tar.gz from cache at /home/yy452/.pytorch_pretrained_bert/9c41111e2de84547a463fd39217199738d1e3deb72d4fec4399e6e241983c6f0.ae3cef932725ca7a30cdcb93fc6e09150a55e2a130ec7af63975a16c153ae2ba
02/02/2022 12:40:50 - INFO - pytorch_pretrained_bert.modeling -   extracting archive file /home/yy452/.pytorch_pretrained_bert/9c41111e2de84547a463fd39217199738d1e3deb72d4fec4399e6e241983c6f0.ae3cef932725ca7a30cdcb93fc6e09150a55e2a130ec7af63975a16c153ae2ba to temp dir /tmp/tmpzlszxjsa
02/02/2022 12:40:54 - INFO - pytorch_pretrained_bert.modeling -   Model config {
  "attention_probs_dropout_prob": 0.1,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 768,
  "initializer_r

BertForSequenceClassification(
  (bert): BertModel(
    (embeddings): BertEmbeddings(
      (word_embeddings): Embedding(30522, 768, padding_idx=0)
      (position_embeddings): Embedding(512, 768)
      (token_type_embeddings): Embedding(2, 768)
      (LayerNorm): BertLayerNorm()
      (dropout): Dropout(p=0.1, inplace=False)
    )
    (encoder): BertEncoder(
      (layer): ModuleList(
        (0): BertLayer(
          (attention): BertAttention(
            (self): BertSelfAttention(
              (query): Linear(in_features=768, out_features=768, bias=True)
              (key): Linear(in_features=768, out_features=768, bias=True)
              (value): Linear(in_features=768, out_features=768, bias=True)
              (dropout): Dropout(p=0.1, inplace=False)
            )
            (output): BertSelfOutput(
              (dense): Linear(in_features=768, out_features=768, bias=True)
              (LayerNorm): BertLayerNorm()
              (dropout): Dropout(p=0.1, inplace=False)
   

## load longformer model

In [17]:
from transformers import LongformerForSequenceClassification, LongformerConfig
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/longformer_2048_2"
output_model_file = os.path.join(output_dir, "longformer.bin")
output_config_file = os.path.join(output_dir, "config.json")
config = LongformerConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model_lf = LongformerForSequenceClassification.from_pretrained("allenai/longformer-base-4096", state_dict=model_state_dict, num_labels=4)
model_lf.to(device)

LongformerForSequenceClassification(
  (longformer): LongformerModel(
    (embeddings): LongformerEmbeddings(
      (word_embeddings): Embedding(50265, 768, padding_idx=1)
      (position_embeddings): Embedding(4098, 768, padding_idx=1)
      (token_type_embeddings): Embedding(1, 768)
      (LayerNorm): LayerNorm((768,), eps=1e-05, elementwise_affine=True)
      (dropout): Dropout(p=0.1, inplace=False)
    )
    (encoder): LongformerEncoder(
      (layer): ModuleList(
        (0): LongformerLayer(
          (attention): LongformerAttention(
            (self): LongformerSelfAttention(
              (query): Linear(in_features=768, out_features=768, bias=True)
              (key): Linear(in_features=768, out_features=768, bias=True)
              (value): Linear(in_features=768, out_features=768, bias=True)
              (query_global): Linear(in_features=768, out_features=768, bias=True)
              (key_global): Linear(in_features=768, out_features=768, bias=True)
              (val

## load bert model

In [14]:
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bert_expert"
output_model_file = os.path.join(output_dir, "bert.bin")
output_config_file = os.path.join(output_dir, "config.json")
config = BertConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model = BertForSequenceClassification.from_pretrained("bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model.to(device)

BertForSequenceClassification(
  (bert): BertModel(
    (embeddings): BertEmbeddings(
      (word_embeddings): Embedding(30522, 768, padding_idx=0)
      (position_embeddings): Embedding(512, 768)
      (token_type_embeddings): Embedding(2, 768)
      (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)
      (dropout): Dropout(p=0.1, inplace=False)
    )
    (encoder): BertEncoder(
      (layer): ModuleList(
        (0): BertLayer(
          (attention): BertAttention(
            (self): BertSelfAttention(
              (query): Linear(in_features=768, out_features=768, bias=True)
              (key): Linear(in_features=768, out_features=768, bias=True)
              (value): Linear(in_features=768, out_features=768, bias=True)
              (dropout): Dropout(p=0.1, inplace=False)
            )
            (output): BertSelfOutput(
              (dense): Linear(in_features=768, out_features=768, bias=True)
              (LayerNorm): LayerNorm((768,), eps=1e-12, element

In [26]:
pred = list()
true = list()
eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()
for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)

model.eval()
model2.eval()
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)

    with torch.no_grad():
        logits1 = model(input_ids, segment_ids, input_mask)
        logits2 = model2(input_ids, segment_ids, input_mask)

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
#     logits1 = outputs[0]
#     logits2 = outputs2[0]
    
    

    # Move logits and labels to CPU
    logits1 = logits1.detach().cpu().numpy()
    logits2 = logits2.detach().cpu().numpy()
    
    logits = (logits1 + logits2)/2.0
    
    outputs = np.argmax(logits, axis=1)
    complete_logits.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1

# eval_accuracy = eval_accuracy / nb_eval_examples
# loss = tr_loss/nb_tr_steps
# result = {'eval_accuracy': eval_accuracy,
#           'global_step': global_step,
#           'loss': loss}

# for i in range(len(complete_logits)):
#     print(complete_outputs[i], complete_logits[i])

02/02/2022 12:41:06 - INFO - __main__ -   ***** Running evaluation *****
02/02/2022 12:41:06 - INFO - __main__ -     Num examples = 125
02/02/2022 12:41:06 - INFO - __main__ -     Batch size = 16


RuntimeError: CUDA error: device-side assert triggered
CUDA kernel errors might be asynchronously reported at some other API call,so the stacktrace below might be incorrect.
For debugging consider passing CUDA_LAUNCH_BLOCKING=1.

# test multimodel

In [11]:
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 16
epochs = 75
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None
models = {}
dataloaders = {}

In [12]:
# load bert
from transformers import BertTokenizer, BertForSequenceClassification, BertConfig
model_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bert_expert"
output_model_file = os.path.join(model_dir, "bert.bin")
output_config_file = os.path.join(model_dir, "config.json")
config = BertConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model_bert = BertForSequenceClassification.from_pretrained("bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model_bert.to(device)
model_bert.eval()
token_bert = BertTokenizer.from_pretrained('bert-base-uncased', do_lower_case=True)
models["bert"]= model_bert

eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, 384, token_bert)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)

dataloaders["bert"] =  eval_dataloader


05/21/2022 16:42:24 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 16:42:24 - INFO - __main__ -     Num examples = 125
05/21/2022 16:42:24 - INFO - __main__ -     Batch size = 16


In [13]:
# load longformer
from transformers import LongformerForSequenceClassification, LongformerConfig, LongformerTokenizer
model_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_expert"
output_model_file = os.path.join(model_dir, "model.bin")
output_config_file = os.path.join(model_dir, "config.json")
config = LongformerConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model_lf = LongformerForSequenceClassification.from_pretrained("allenai/longformer-base-4096", state_dict=model_state_dict, num_labels=4)
model_lf.to(device)
model_lf.eval()
models["longformer"] = model_lf
tokenizer_lf = LongformerTokenizer.from_pretrained('allenai/longformer-base-4096', do_lower_case=True)

eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, 2048, tokenizer_lf)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)


dataloaders["longformer"] =  eval_dataloader


05/21/2022 16:42:32 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 16:42:32 - INFO - __main__ -     Num examples = 125
05/21/2022 16:42:32 - INFO - __main__ -     Batch size = 16


In [53]:
# load mentalbert
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'

from transformers import AutoModelForSequenceClassification, AutoConfig, AutoTokenizer
model_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/mentalbert_expert"
output_model_file = os.path.join(model_dir, "mentalbert.bin")
output_config_file = os.path.join(model_dir, "config.json")
config = AutoConfig.from_pretrained(output_config_file)
model_state_dict = torch.load(output_model_file)
model_lf = AutoModelForSequenceClassification.from_pretrained("mental/mental-bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model_lf.to(device)
model_lf.eval()
models["mentalbert"] = model_lf
tokenizer = AutoTokenizer.from_pretrained('mental/mental-bert-base-uncased', do_lower_case=True)

eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, 512, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)


dataloaders["mentalbert"] =  eval_dataloader


Token indices sequence length is longer than the specified maximum sequence length for this model (1100 > 512). Running this sequence through the model will result in indexing errors
05/21/2022 17:01:33 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 17:01:33 - INFO - __main__ -     Num examples = 125
05/21/2022 17:01:33 - INFO - __main__ -     Batch size = 16


In [18]:
# load bigbird
model_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a/bird_addexpert"
output_model_file = os.path.join(model_dir, "longformer.bin")
output_config_file = os.path.join(model_dir, "config.json")
config = BigBirdConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model_lf = BigBirdForSequenceClassification.from_pretrained("google/bigbird-roberta-base", state_dict=model_state_dict, num_labels=4)
model_lf.to(device)
model_lf.eval()
models["bigbird"] = model_lf
tokenizer_lf = BigBirdTokenizer.from_pretrained('google/bigbird-roberta-base', do_lower_case=True)

eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, 1024, tokenizer_lf)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)


dataloaders["bigbird"] =  eval_dataloader


05/21/2022 16:47:26 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 16:47:26 - INFO - __main__ -     Num examples = 125
05/21/2022 16:47:26 - INFO - __main__ -     Batch size = 16


In [54]:
combined_model = {0:"mentalbert", 1:"bigbird"}
model_logits = {}

for i in range(2):
    complete_logits = []
    complete_outputs = list()
    pred = list()
    true = list()   
    eval_loss, eval_accuracy = 0, 0
    nb_eval_steps, nb_eval_examples = 0, 0
    complete_label_ids = list()
    for input_ids, input_mask, segment_ids, label_ids in dataloaders[combined_model[i]]:
        input_ids = input_ids.to(device)
        input_mask = input_mask.to(device)
        segment_ids = segment_ids.to(device)
        label_ids = label_ids.to(device)
        outputs_models = []

        model = models[combined_model[i]]
        with torch.no_grad():
            outputs = model(input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask)

        # Get the "logits" output by the model. The "logits" are the output
        # values prior to applying an activation function like the softmax.
        logits = outputs[0]

        # Move logits and labels to CPU
        logits = logits.detach().cpu().numpy()

        outputs = np.argmax(logits, axis=1)
        complete_logits.append(logits)
        complete_outputs.extend(outputs)
        label_ids = label_ids.to('cpu').numpy()
        complete_label_ids.extend(label_ids)
        tmp_eval_accuracy = accuracy(logits, label_ids)

        eval_accuracy += tmp_eval_accuracy

        nb_eval_examples += input_ids.size(0)
        nb_eval_steps += 1
    model_logits[combined_model[i]] = complete_logits
    

In [81]:
combined_logits = []
x = 0.1
y = 0.9
for i, batch in enumerate(model_logits["mentalbert"]):
    for j in range(len(batch)):
        combined_logits.append(x * batch[j] + y * model_logits["bigbird"][i][j])

In [82]:
complete_outputs = []
for i in combined_logits:
    complete_outputs.append(np.argmax(i))
    
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/combines"
output_file = os.path.join(output_dir, "mentalbert_bigbird.csv")
outcsv = open(output_file,'w', encoding = 'utf8', newline='')
writer = csv.writer(outcsv,quotechar = '"')
writer.writerow(["User","results"])
for user,pred in zip(complete_user_ids, complete_outputs):
    writer.writerow([user,pred])
outcsv.close()

In [83]:
%%bash
python /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/umd_reddit_suicidewatch_dataset_v2/scripts/evaluation.py -gold /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/umd_reddit_suicidewatch_dataset_v2/crowd/test/crowd_test_A.csv -pred /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/combines/mentalbert_bigbird.csv -out /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/combines/mentalbert_bigbird



******************************************
*********  EVALUATING PREDICTIONS ********
******************************************

Evaluating /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/combines/mentalbert_bigbird.csv and writing output to /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/combines/mentalbert_bigbird


In [84]:
# bigbird 10 + mental
tokenizer = BigBirdTokenizer.from_pretrained('google/bigbird-roberta-base', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()


batch_size = 8
epochs = 75
max_seq_length = 1024
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bigbird_10fold"

    bigbird_model = "BigBird_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bigbird_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = BigBirdConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model =BigBirdForSequenceClassification.from_pretrained("google/bigbird-roberta-base", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)

from transformers import AutoTokenizer
from transformers import AutoModelForSequenceClassification, AutoConfig
tokenizer = AutoTokenizer.from_pretrained('mental/mental-bert-base-uncased', do_lower_case=True)
max_seq_length = 512
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'


eval_examples_mental = processor.get_test_examples(data_dir)
eval_features_mental = convert_examples_to_features(
    eval_examples_mental, label_list, max_seq_length, tokenizer)
	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids_mental = torch.tensor([f.input_ids for f in eval_features_mental], dtype=torch.long)
all_input_mask_mental = torch.tensor([f.input_mask for f in eval_features_mental], dtype=torch.long)
all_segment_ids_mental = torch.tensor([f.segment_ids for f in eval_features_mental], dtype=torch.long)
all_label_ids_mental = torch.tensor([0 for f in eval_features_mental], dtype=torch.long)

eval_data_mental = TensorDataset(all_input_ids_mental, all_input_mask_mental, all_segment_ids_mental, all_label_ids_mental)
# Run prediction for full data
eval_sampler_mental = SequentialSampler(eval_data_mental)
eval_dataloader_mental = DataLoader(eval_data_mental, sampler=eval_sampler_mental, batch_size=batch_size)

mental_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/mentalbert_expert"
bert_model = "mentalbert.bin"
output_model_file = os.path.join(mental_dir, bert_model)
output_config_file = os.path.join(mental_dir, "config.json")
config = AutoConfig.from_pretrained(output_config_file)
model_state_dict = torch.load(output_model_file)
model = AutoModelForSequenceClassification.from_pretrained("mental/mental-bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model.to(device)
model.eval()
models.append(model)

# model.eval()
pred = list()
true = list()   
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)
    outputs_models = []
    logits = None
    with torch.no_grad():
        for i in range(k):
            outputs_models.append(models[i](input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask))

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    for i, outputs in enumerate(outputs_models):
        logits_new = outputs[0]

        # Move logits and labels to CPU
        logits_new = logits_new.detach().cpu().numpy()
        if i == 0:
            logits = logits_new
        else:
            logits = (logits * i + logits_new)/(i+1)
    outputs = np.argmax(logits, axis=1)
    complete_logits.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1
    
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits_mental = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader_mental:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)

    with torch.no_grad():
        outputs = models[-1](input_ids, 
                        token_type_ids=None, 
                        attention_mask=input_mask)

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    logits = outputs[0]

    # Move logits and labels to CPU
    logits = logits.detach().cpu().numpy()
    
    outputs = np.argmax(logits, axis=1)
    complete_logits_mental.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1

05/21/2022 17:22:35 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 17:22:35 - INFO - __main__ -     Num examples = 125
05/21/2022 17:22:35 - INFO - __main__ -     Batch size = 8


KeyboardInterrupt: 

In [87]:
# longformer 10 + mental
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold"

tokenizer = LongformerTokenizer.from_pretrained('allenai/longformer-base-4096', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 2048
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    # output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/01022022_expert_1000"
    bigbird_model = "longformer_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bigbird_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = LongformerConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = LongformerForSequenceClassification.from_pretrained("allenai/longformer-base-4096", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)
    

from transformers import AutoTokenizer
from transformers import AutoModelForSequenceClassification, AutoConfig
tokenizer = AutoTokenizer.from_pretrained('mental/mental-bert-base-uncased', do_lower_case=True)
max_seq_length = 512
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'


eval_examples_mental = processor.get_test_examples(data_dir)
eval_features_mental = convert_examples_to_features(
    eval_examples_mental, label_list, max_seq_length, tokenizer)
	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids_mental = torch.tensor([f.input_ids for f in eval_features_mental], dtype=torch.long)
all_input_mask_mental = torch.tensor([f.input_mask for f in eval_features_mental], dtype=torch.long)
all_segment_ids_mental = torch.tensor([f.segment_ids for f in eval_features_mental], dtype=torch.long)
all_label_ids_mental = torch.tensor([0 for f in eval_features_mental], dtype=torch.long)

eval_data_mental = TensorDataset(all_input_ids_mental, all_input_mask_mental, all_segment_ids_mental, all_label_ids_mental)
# Run prediction for full data
eval_sampler_mental = SequentialSampler(eval_data_mental)
eval_dataloader_mental = DataLoader(eval_data_mental, sampler=eval_sampler_mental, batch_size=batch_size)

mental_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/mentalbert_expert"
bert_model = "mentalbert.bin"
output_model_file = os.path.join(mental_dir, bert_model)
output_config_file = os.path.join(mental_dir, "config.json")
config = AutoConfig.from_pretrained(output_config_file)
model_state_dict = torch.load(output_model_file)
model = AutoModelForSequenceClassification.from_pretrained("mental/mental-bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model.to(device)
model.eval()
models.append(model)

# model.eval()
pred = list()
true = list()   
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)
    outputs_models = []
    logits = None
    with torch.no_grad():
        for i in range(k):
            outputs_models.append(models[i](input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask))

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    for i, outputs in enumerate(outputs_models):
        logits_new = outputs[0]

        # Move logits and labels to CPU
        logits_new = logits_new.detach().cpu().numpy()
        if i == 0:
            logits = logits_new
        else:
            logits = (logits * i + logits_new)/(i+1)
    outputs = np.argmax(logits, axis=1)
    complete_logits.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1
    
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits_mental = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader_mental:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)

    with torch.no_grad():
        outputs = models[-1](input_ids, 
                        token_type_ids=None, 
                        attention_mask=input_mask)

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    logits = outputs[0]

    # Move logits and labels to CPU
    logits = logits.detach().cpu().numpy()
    
    outputs = np.argmax(logits, axis=1)
    complete_logits_mental.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1

05/21/2022 17:27:32 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 17:27:32 - INFO - __main__ -     Num examples = 125
05/21/2022 17:27:32 - INFO - __main__ -     Batch size = 8
Token indices sequence length is longer than the specified maximum sequence length for this model (1100 > 512). Running this sequence through the model will result in indexing errors
05/21/2022 17:28:31 - INFO - __main__ -   ***** Running evaluation *****
05/21/2022 17:28:31 - INFO - __main__ -     Num examples = 125
05/21/2022 17:28:31 - INFO - __main__ -     Batch size = 8


In [11]:
# longformer 10 + bert
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold"

tokenizer = LongformerTokenizer.from_pretrained('allenai/longformer-base-4096', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 2048
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    # output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/01022022_expert_1000"
    bigbird_model = "longformer_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bigbird_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = LongformerConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = LongformerForSequenceClassification.from_pretrained("allenai/longformer-base-4096", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)
    

from transformers import AutoTokenizer
from transformers import AutoModelForSequenceClassification, AutoConfig
tokenizer = AutoTokenizer.from_pretrained('mental/mental-bert-base-uncased', do_lower_case=True)
max_seq_length = 512
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'


eval_examples_mental = processor.get_test_examples(data_dir)
eval_features_mental = convert_examples_to_features(
    eval_examples_mental, label_list, max_seq_length, tokenizer)
	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids_mental = torch.tensor([f.input_ids for f in eval_features_mental], dtype=torch.long)
all_input_mask_mental = torch.tensor([f.input_mask for f in eval_features_mental], dtype=torch.long)
all_segment_ids_mental = torch.tensor([f.segment_ids for f in eval_features_mental], dtype=torch.long)
all_label_ids_mental = torch.tensor([0 for f in eval_features_mental], dtype=torch.long)

eval_data_mental = TensorDataset(all_input_ids_mental, all_input_mask_mental, all_segment_ids_mental, all_label_ids_mental)
# Run prediction for full data
eval_sampler_mental = SequentialSampler(eval_data_mental)
eval_dataloader_mental = DataLoader(eval_data_mental, sampler=eval_sampler_mental, batch_size=batch_size)

model_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bert_expert"
output_model_file = os.path.join(model_dir, "bert.bin")
output_config_file = os.path.join(model_dir, "config.json")
config = BertConfig.from_json_file(output_config_file)
model_state_dict = torch.load(output_model_file)
model_bert = BertForSequenceClassification.from_pretrained("bert-base-uncased", state_dict=model_state_dict, num_labels=4)
model_bert.to(device)
model_bert.eval()
token_bert = BertTokenizer.from_pretrained('bert-base-uncased', do_lower_case=True)
models.append(model_bert)

# model.eval()
pred = list()
true = list()   
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)
    outputs_models = []
    logits = None
    with torch.no_grad():
        for i in range(k):
            outputs_models.append(models[i](input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask))

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    for i, outputs in enumerate(outputs_models):
        logits_new = outputs[0]

        # Move logits and labels to CPU
        logits_new = logits_new.detach().cpu().numpy()
        if i == 0:
            logits = logits_new
        else:
            logits = (logits * i + logits_new)/(i+1)
    outputs = np.argmax(logits, axis=1)
    complete_logits.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1
    
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits_mental = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader_mental:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)

    with torch.no_grad():
        outputs = models[-1](input_ids, 
                        token_type_ids=None, 
                        attention_mask=input_mask)

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    logits = outputs[0]

    # Move logits and labels to CPU
    logits = logits.detach().cpu().numpy()
    
    outputs = np.argmax(logits, axis=1)
    complete_logits_mental.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1

05/22/2022 00:25:13 - INFO - __main__ -   ***** Running evaluation *****
05/22/2022 00:25:13 - INFO - __main__ -     Num examples = 125
05/22/2022 00:25:13 - INFO - __main__ -     Batch size = 8
Token indices sequence length is longer than the specified maximum sequence length for this model (1100 > 512). Running this sequence through the model will result in indexing errors
05/22/2022 00:30:47 - INFO - __main__ -   ***** Running evaluation *****
05/22/2022 00:30:47 - INFO - __main__ -     Num examples = 125
05/22/2022 00:30:47 - INFO - __main__ -     Batch size = 8


NameError: name 'mental_dir' is not defined

In [18]:
# two 10fold
tokenizer = BigBirdTokenizer.from_pretrained('google/bigbird-roberta-base', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 1024
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bigbird_10fold"

    bigbird_model = "BigBird_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bigbird_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = BigBirdConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model =BigBirdForSequenceClassification.from_pretrained("google/bigbird-roberta-base", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)
    
    
from transformers import AutoTokenizer
from transformers import AutoModelForSequenceClassification, AutoConfig
tokenizer = AutoTokenizer.from_pretrained('mental/mental-bert-base-uncased', do_lower_case=True)
max_seq_length = 512
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'


eval_examples_mental = processor.get_test_examples(data_dir)
eval_features_mental = convert_examples_to_features(
    eval_examples_mental, label_list, max_seq_length, tokenizer)
	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids_mental = torch.tensor([f.input_ids for f in eval_features_mental], dtype=torch.long)
all_input_mask_mental = torch.tensor([f.input_mask for f in eval_features_mental], dtype=torch.long)
all_segment_ids_mental = torch.tensor([f.segment_ids for f in eval_features_mental], dtype=torch.long)
all_label_ids_mental = torch.tensor([0 for f in eval_features_mental], dtype=torch.long)

eval_data_mental = TensorDataset(all_input_ids_mental, all_input_mask_mental, all_segment_ids_mental, all_label_ids_mental)
# Run prediction for full data
eval_sampler_mental = SequentialSampler(eval_data_mental)
eval_dataloader_mental = DataLoader(eval_data_mental, sampler=eval_sampler_mental, batch_size=batch_size)

for i in range(k):
    output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/mentalbert_10fold"

    bigbird_model = "mentalbert_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bigbird_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = AutoConfig.from_pretrained(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = AutoModelForSequenceClassification.from_pretrained("mental/mental-bert-base-uncased", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)

# model.eval()
pred = list()
true = list()   
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)
    outputs_models = []
    logits = None
    with torch.no_grad():
        for i in range(k):
            outputs_models.append(models[i](input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask))

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    for i, outputs in enumerate(outputs_models):
        logits_new = outputs[0]

        # Move logits and labels to CPU
        logits_new = logits_new.detach().cpu().numpy()
        if i == 0:
            logits = logits_new
        else:
            logits = (logits * i + logits_new)/(i+1)
    outputs = np.argmax(logits, axis=1)
    complete_logits.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1
    
eval_loss, eval_accuracy = 0, 0
nb_eval_steps, nb_eval_examples = 0, 0
complete_label_ids = list()
complete_outputs = list()
complete_logits_mental = []
for input_ids, input_mask, segment_ids, label_ids in eval_dataloader_mental:
    input_ids = input_ids.to(device)
    input_mask = input_mask.to(device)
    segment_ids = segment_ids.to(device)
    label_ids = label_ids.to(device)
    outputs_models = []
    logits = None
    with torch.no_grad():
        for i in range(10,20):
            outputs_models.append(models[i](input_ids, 
                            token_type_ids=None, 
                            attention_mask=input_mask))

    # Get the "logits" output by the model. The "logits" are the output
    # values prior to applying an activation function like the softmax.
    for i, outputs in enumerate(outputs_models):
        logits_new = outputs[0]

        # Move logits and labels to CPU
        logits_new = logits_new.detach().cpu().numpy()
        if i == 0:
            logits = logits_new
        else:
            logits = (logits * i + logits_new)/(i+1)
    outputs = np.argmax(logits, axis=1)
    complete_logits_mental.append(logits)
    complete_outputs.extend(outputs)
    label_ids = label_ids.to('cpu').numpy()
    complete_label_ids.extend(label_ids)
    tmp_eval_accuracy = accuracy(logits, label_ids)

    eval_accuracy += tmp_eval_accuracy

    nb_eval_examples += input_ids.size(0)
    nb_eval_steps += 1

03/20/2022 22:46:28 - INFO - __main__ -   ***** Running evaluation *****
03/20/2022 22:46:28 - INFO - __main__ -     Num examples = 125
03/20/2022 22:46:28 - INFO - __main__ -     Batch size = 8
Token indices sequence length is longer than the specified maximum sequence length for this model (1100 > 512). Running this sequence through the model will result in indexing errors
03/20/2022 22:46:49 - INFO - __main__ -   ***** Running evaluation *****
03/20/2022 22:46:49 - INFO - __main__ -     Num examples = 125
03/20/2022 22:46:49 - INFO - __main__ -     Batch size = 8


In [96]:
combined_logits = []
x = 0.5
y = 0.5
for i, batch in enumerate(complete_logits):
    for j in range(len(batch)):
        combined_logits.append(x * batch[j] + y * complete_logits_mental[i][j])

In [97]:
complete_outputs = []
for i in combined_logits:
    complete_outputs.append(np.argmax(i))
    
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/combines"
output_file = os.path.join(output_dir, "mentalbert_longformer10.csv")
outcsv = open(output_file,'w', encoding = 'utf8', newline='')
writer = csv.writer(outcsv,quotechar = '"')
writer.writerow(["User","results"])
for user,pred in zip(complete_user_ids, complete_outputs):
    writer.writerow([user,pred])
outcsv.close()

# test 10_fold hard voting

In [15]:
#bert
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bert_10fold"

tokenizer = BertTokenizer.from_pretrained('bert-base-uncased', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 384
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    # output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/01022022_expert_1000"
    bert_model = "bert_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bert_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = BertConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = BertForSequenceClassification.from_pretrained("bert-base-uncased", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)


03/02/2022 11:00:47 - INFO - __main__ -   ***** Running evaluation *****
03/02/2022 11:00:47 - INFO - __main__ -     Num examples = 125
03/02/2022 11:00:47 - INFO - __main__ -     Batch size = 8


In [22]:
#mentalbert
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/mentalbert_10fold"

tokenizer = BertTokenizer.from_pretrained('bert-base-uncased', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 512
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    # output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/01022022_expert_1000"
    bert_model = "mentalbert_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bert_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = BertConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = BertForSequenceClassification.from_pretrained("mental/mental-bert-base-uncased", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)


03/02/2022 11:22:24 - INFO - __main__ -   ***** Running evaluation *****
03/02/2022 11:22:24 - INFO - __main__ -     Num examples = 125
03/02/2022 11:22:24 - INFO - __main__ -     Batch size = 8


In [66]:
#longformer
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold"

tokenizer = LongformerTokenizer.from_pretrained('allenai/longformer-base-4096', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 2048
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    bert_model = "longformer_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bert_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = LongformerConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = LongformerForSequenceClassification.from_pretrained("allenai/longformer-base-4096", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)


03/03/2022 11:31:20 - INFO - __main__ -   ***** Running evaluation *****
03/03/2022 11:31:20 - INFO - __main__ -     Num examples = 125
03/03/2022 11:31:20 - INFO - __main__ -     Batch size = 8


In [11]:
#bigbird
output_dir = "/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/bigbird_10fold"

tokenizer = BigBirdTokenizer.from_pretrained('google/bigbird-roberta-base', do_lower_case=True)
processor = CLPsychProcessor()
global_step = 0
nb_tr_steps = 0
tr_loss = 0
label_list = processor.get_labels()

batch_size = 8
epochs = 75
max_seq_length = 1024
data_dir = '/home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/Dataset/add_expert/emoticons_add'
complete_logits = None


eval_examples = processor.get_test_examples(data_dir)
eval_features = convert_examples_to_features(
    eval_examples, label_list, max_seq_length, tokenizer)
complete_user_ids = list()

for example in eval_examples:
    complete_user_ids.append(example.guid)	
logger.info("***** Running evaluation *****")
logger.info("  Num examples = %d", len(eval_examples))
logger.info("  Batch size = %d", batch_size)
all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
all_label_ids = torch.tensor([0 for f in eval_features], dtype=torch.long)

eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids)
# Run prediction for full data
eval_sampler = SequentialSampler(eval_data)
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=batch_size)
models = []

k=10
for i in range(k):
    bert_model = "BigBird_{}.bin".format(i+1)
    output_model_file = os.path.join(output_dir, bert_model)
    output_config_file = os.path.join(output_dir, "config.json")
    config = BigBirdConfig.from_json_file(output_config_file)
    model_state_dict = torch.load(output_model_file)
    model = BigBirdForSequenceClassification.from_pretrained("google/bigbird-roberta-base", state_dict=model_state_dict, num_labels=4)
    model.to(device)
    model.eval()
    models.append(model)


03/02/2022 08:55:28 - INFO - __main__ -   ***** Running evaluation *****
03/02/2022 08:55:28 - INFO - __main__ -     Num examples = 125
03/02/2022 08:55:28 - INFO - __main__ -     Batch size = 8


In [67]:
# hard voting
complete_labels = []
for i in range(k):
    pred = list()
    true = list()   
    eval_loss, eval_accuracy = 0, 0
    nb_eval_steps, nb_eval_examples = 0, 0
    complete_label_ids = list()
    complete_outputs = list()


    for input_ids, input_mask, segment_ids, label_ids in eval_dataloader:
        input_ids = input_ids.to(device)
        input_mask = input_mask.to(device)
        segment_ids = segment_ids.to(device)
        label_ids = label_ids.to(device)
        logits = None
        with torch.no_grad():
            outputs = models[i](input_ids, 
                                token_type_ids=None, 
                                attention_mask=input_mask)

        # Get the "logits" output by the model. The "logits" are the output
        # values prior to applying an activation function like the softmax.
        logits = outputs[0]

        # Move logits and labels to CPU
        logits = logits.detach().cpu().numpy()
            
        outputs = np.argmax(logits, axis=1)
        complete_outputs.extend(outputs)
        label_ids = label_ids.to('cpu').numpy()
        complete_label_ids.extend(label_ids)
        tmp_eval_accuracy = accuracy(logits, label_ids)

        eval_accuracy += tmp_eval_accuracy

        nb_eval_examples += input_ids.size(0)
        nb_eval_steps += 1

    complete_labels.append(complete_outputs)
complete_labels

[[3,
  2,
  0,
  2,
  2,
  3,
  3,
  2,
  2,
  2,
  0,
  3,
  2,
  3,
  3,
  3,
  3,
  2,
  3,
  2,
  3,
  0,
  2,
  2,
  0,
  2,
  2,
  3,
  0,
  3,
  2,
  3,
  3,
  3,
  2,
  2,
  0,
  2,
  1,
  0,
  3,
  3,
  2,
  0,
  0,
  2,
  0,
  2,
  3,
  0,
  3,
  1,
  0,
  2,
  2,
  2,
  3,
  0,
  2,
  3,
  0,
  0,
  0,
  3,
  3,
  3,
  0,
  0,
  2,
  2,
  3,
  0,
  2,
  2,
  3,
  3,
  1,
  2,
  2,
  2,
  3,
  0,
  0,
  2,
  2,
  0,
  3,
  3,
  3,
  3,
  3,
  2,
  3,
  2,
  3,
  0,
  3,
  3,
  2,
  0,
  0,
  3,
  2,
  2,
  3,
  3,
  3,
  2,
  2,
  0,
  3,
  2,
  0,
  3,
  0,
  0,
  0,
  2,
  3,
  2,
  2,
  1,
  2,
  0,
  0],
 [3,
  1,
  0,
  2,
  1,
  3,
  2,
  3,
  3,
  0,
  0,
  3,
  2,
  2,
  3,
  2,
  2,
  3,
  2,
  3,
  2,
  0,
  0,
  2,
  2,
  3,
  2,
  3,
  0,
  2,
  3,
  3,
  2,
  3,
  1,
  3,
  0,
  0,
  2,
  0,
  3,
  3,
  2,
  0,
  2,
  2,
  0,
  2,
  2,
  0,
  3,
  2,
  0,
  2,
  2,
  2,
  3,
  0,
  2,
  2,
  1,
  0,
  0,
  3,
  0,
  3,
  0,
  0,
  0,
  2,
  3,
  1,
  2,
  2,
  3,

In [68]:
hard_voted_id = []
for i in range(len(complete_labels[0])):
    curr_user = []
    for j in range(len(complete_labels)):
        curr_user.append(complete_labels[j][i])
    hard_voted_id.append(max(curr_user, key=curr_user.count))

# output_file = os.path.join(output_dir, "avg_results.csv")
# outcsv = open(output_file,'w', encoding = 'utf8', newline='')
# writer = csv.writer(outcsv,quotechar = '"')
# writer.writerow(["User","results"])
# for user,pred in zip(complete_user_ids, complete_outputs):
#     writer.writerow([user,pred])
# outcsv.close()

hard_voted_id

[3,
 1,
 0,
 2,
 2,
 3,
 3,
 2,
 2,
 2,
 0,
 3,
 3,
 3,
 3,
 3,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 2,
 3,
 0,
 2,
 2,
 3,
 2,
 3,
 3,
 3,
 0,
 2,
 2,
 0,
 3,
 3,
 2,
 0,
 0,
 2,
 2,
 2,
 3,
 0,
 3,
 2,
 0,
 2,
 2,
 2,
 3,
 0,
 2,
 3,
 0,
 0,
 0,
 3,
 3,
 3,
 0,
 0,
 3,
 2,
 3,
 2,
 2,
 2,
 3,
 3,
 1,
 2,
 2,
 2,
 3,
 0,
 0,
 3,
 3,
 0,
 3,
 3,
 3,
 2,
 3,
 0,
 3,
 2,
 3,
 0,
 2,
 3,
 2,
 2,
 0,
 3,
 3,
 2,
 3,
 3,
 3,
 2,
 1,
 0,
 3,
 2,
 2,
 3,
 0,
 0,
 0,
 3,
 3,
 2,
 2,
 2,
 0,
 0,
 0]

In [69]:
output_file = os.path.join(output_dir, "hardvote_results.csv")
outcsv = open(output_file,'w', encoding = 'utf8', newline='')
writer = csv.writer(outcsv,quotechar = '"')
writer.writerow(["User","results"])
for i in range(len(complete_user_ids)):
    writer.writerow([complete_user_ids[i],hard_voted_id[i]])
outcsv.close()

In [70]:
%%bash
python /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/umd_reddit_suicidewatch_dataset_v2/scripts/evaluation.py -gold /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/umd_reddit_suicidewatch_dataset_v2/crowd/test/crowd_test_A.csv -pred /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold/results_avg.csv -out /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold/results_avg



******************************************
*********  EVALUATING PREDICTIONS ********
******************************************

Evaluating /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold/hardvote_results.csv and writing output to /home/yy452/rds/rds-gvdd-Yuap0gjVpKM/yy452/CLPsych2019_12/output/task_a_emoji/longformer_10fold/hardvote_results
