In [5]:
# Follow tutorial from here: https://huggingface.co/docs/transformers/v4.17.0/en/tasks/language_modeling
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
import numpy as np
from sklearn.model_selection import train_test_split
import json
import torch
import datasets
from transformers import AutoTokenizer, DataCollatorWithPadding, AutoModelForCausalLM, TrainingArguments, Trainer, DataCollatorForLanguageModeling

# hyperparams
# checkpoint = "EleutherAI/gpt-j-6B"
checkpoint = "EleutherAI/gpt-neo-2.7B"
tokenizer = AutoTokenizer.from_pretrained(checkpoint)
tokenizer.pad_token = tokenizer.eos_token

# load model
checkpoint_dir = f'./title-{checkpoint.replace("/", "__")}/checkpoint-50'
mod = AutoModelForCausalLM.from_pretrained(
    # checkpoint,
    checkpoint_dir,
    # revision="float16",
    # torch_dtype=torch.float16,
    # low_cpu_mem_usage=True
)
# mod = mod.half()

In [6]:
# decode some examples
s = '2020:'
eos_token_id = tokenizer('\n')['input_ids'][0]
inputs = tokenizer(s, return_tensors='pt')
outputs = mod.generate(
    **inputs,
    do_sample=True,
    eos_token_id=eos_token_id,
    num_return_sequences=30,
)
tokenizer.batch_decode(outputs, skip_special_tokens=True)

Setting `pad_token_id` to `eos_token_id`:198 for open-end generation.


['2020: An algorithm for dimensioning time series\n\n\n\n\n\n\n\n\n\n\n',
 '2020: A deep learning for the analysis of large scale healthcare-specific problems using large-scale mathematical',
 '2020: A Supervised Neural Network for Mult-Image Supervised Learning\n\n\n\n\n\n',
 '2020: High Order Nonlinear Framework for the analysis of nonlinear Interaction networks in Neural Networks\n',
 '2020: The Dual-observational-based AI for non-object-based nonlinear classification',
 '2020: A linearization-based deep learning approach for differential diagnosis of severe COVID-19 pneumonia',
 '2020: A study of the cognitive architecture of rational argumentation\n\n\n\n\n\n\n\n',
 '2020: A comparative Study\n\n\n\n\n\n\n\n\n\n\n\n\n\n\n',
 '2020: A Deep Learning Approach to Appraisal of the Adversarial Robustness of Sal',
 '2020: Distual-limb segmentation for patients with stroke using deep CNN\n\n\n\n',
 '2020: A note on the Adversarial Robustness of Neural Networks\n\n\n\n\n',
 '2020: $\\beta$