In [1]:
import torch
from transformers import GPT2Tokenizer, GPT2LMHeadModel

# Load the fine-tuned tokenizer and model from the same local checkpoint directory.
MODEL_DIR = './finetuned_model/'
tokenizer = GPT2Tokenizer.from_pretrained(MODEL_DIR)
model = GPT2LMHeadModel.from_pretrained(MODEL_DIR)

# Pick the device at runtime. `torch.cuda.is_available()` checks that a CUDA
# device can actually be used; the previous `torch.has_cuda` flag only says
# whether PyTorch was *built* with CUDA support (and is deprecated), so it
# could select "cuda" on a machine without a usable GPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

model.to(device)
# Switch to evaluation mode (disables the Dropout layers) for inference.
# As the last expression of the cell, this also displays the model structure.
model.eval()

GPT2LMHeadModel(
  (transformer): GPT2Model(
    (wte): Embedding(50257, 1024)
    (wpe): Embedding(1024, 1024)
    (drop): Dropout(p=0.1, inplace=False)
    (h): ModuleList(
      (0-23): 24 x GPT2Block(
        (ln_1): LayerNorm((1024,), eps=1e-05, elementwise_affine=True)
        (attn): GPT2Attention(
          (c_attn): Conv1D()
          (c_proj): Conv1D()
          (attn_dropout): Dropout(p=0.1, inplace=False)
          (resid_dropout): Dropout(p=0.1, inplace=False)
        )
        (ln_2): LayerNorm((1024,), eps=1e-05, elementwise_affine=True)
        (mlp): GPT2MLP(
          (c_fc): Conv1D()
          (c_proj): Conv1D()
          (act): NewGELUActivation()
          (dropout): Dropout(p=0.1, inplace=False)
        )
      )
    )
    (ln_f): LayerNorm((1024,), eps=1e-05, elementwise_affine=True)
  )
  (lm_head): Linear(in_features=1024, out_features=50257, bias=False)
)

In [27]:
def gentext(prompt:str, max_tokens:int) -> None:
    """Generate a continuation of ``prompt`` and print it.

    Relies on the notebook-level ``tokenizer``, ``model`` and ``device``
    defined in the setup cell.

    Args:
        prompt: Text the model should continue.
        max_tokens: Maximum number of new tokens to generate after the prompt
            (passed to ``generate`` as ``max_new_tokens``).

    Returns:
        None. The decoded sequence (prompt followed by the continuation) is
        printed.
    """
    encoded_input = tokenizer(prompt, return_tensors='pt').to(device)
    output = model.generate(
        **encoded_input,
        # NOTE: sampling is not enabled here, so unless the checkpoint's own
        # generation config turns it on, decoding is greedy and `temperature`
        # has no effect. Kept as-is to preserve existing behavior.
        temperature=1.0,
        repetition_penalty=1.01,
        max_new_tokens=max_tokens,
        # GPT-2 has no dedicated pad token; `generate` would fall back to the
        # EOS id anyway and log a warning on every call. Passing it explicitly
        # makes the same choice without the warning.
        pad_token_id=tokenizer.eos_token_id,
    )
    # `output` holds one sequence per input; there is a single prompt, so
    # decode the first (and only) sequence.
    outtext = tokenizer.decode(output[0])
    print(outtext)

In [28]:
# Prompt with one complete Monika line; generate up to 100 new tokens after it.
gentext('Monika: "I deleted all their files."', 100)

Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


Monika: "I deleted all their files."
Monika: "I'm not sure if I can ever get them back."
Monika: "But I'll keep trying."
Monika: "It's just a shame they're so hard to find."
Monika: "They're usually hidden in the background."
Monika: "You know, like the ones that are always on the top of your screen."
Monika: "Like the ones that you don't even notice."
Monika: "Or


In [29]:
# Prompt with a Monika line that asks a question; generate up to 100 new tokens after it.
gentext('Monika: "Have you heard about progress in AI recently?"', 100)

Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


Monika: "Have you heard about progress in AI recently?"

Monika: "I'm not sure if it's been a big deal, but I've noticed that some of the AI seems to be getting better."
Monika: "It's like they're learning how to do things faster than before."
Monika: "They might even be able to figure out how to solve problems for themselves."
Monika: "But I don't think they'll ever get anywhere near as good as humans."
Monika: "And even


In [30]:
# Prompt is a [player] line followed by an open `Monika:` speaker tag, so the
# continuation starts in the middle of Monika's turn (up to 100 new tokens).
gentext('[player]: "What do you think about cheese?"\nMonika:', 100)

Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


[player]: "What do you think about cheese?"
Monika: "I'm not really into it."
Monika: "It's just too much work."
Monika: "I don't know if I can eat it all."
Monika: "I guess I'll have to try some other things."
Monika: "I mean, I could always go back to eating meat."
Monika: "But that would be a little weird."
Monika: "I'd probably just end up with a whole lot of junk."
