In [None]:
!pip install transformers

In [None]:
from transformers import pipeline, set_seed
import random

In [None]:
# Fix the seed handed to transformers' set_seed so that the stochastic steps
# later in the notebook (training, sampled generation) are repeatable.
SEED = 42
set_seed(SEED)

In [None]:
# Load the raw training corpus as a list of lines (line terminators removed).
# The encoding is given explicitly so the result does not depend on the
# platform's default locale encoding.
with open("mywords.txt", "r", encoding="utf-8") as f:
    texts = f.read().splitlines()

In [None]:
from transformers import (
    AutoModelForCausalLM,
    AutoModelWithLMHead,  # no longer used here; kept importable for any other cell that references it
    AutoTokenizer,
    DataCollatorForLanguageModeling,
    TextDataset,
    Trainer,
    TrainingArguments,
)

# Start from the pretrained DialoGPT checkpoint. AutoModelForCausalLM is the
# supported class for decoder-only language models; AutoModelWithLMHead is
# deprecated in transformers.
tokenizer = AutoTokenizer.from_pretrained("microsoft/DialoGPT-medium")
model = AutoModelForCausalLM.from_pretrained("microsoft/DialoGPT-medium")

# Build the training set from mywords.txt using blocks of 128 tokens.
# NOTE(review): TextDataset is flagged as deprecated in recent transformers
# releases in favour of the `datasets` library; migrating would add a new
# dependency, so it is kept as-is here.
train_dataset = TextDataset(
    tokenizer=tokenizer,
    file_path="mywords.txt",
    block_size=128,
)

# mlm=False: collate batches for causal (next-token) language modelling
# rather than masked language modelling.
data_collator = DataCollatorForLanguageModeling(
    tokenizer=tokenizer,
    mlm=False,
)

training_args = TrainingArguments(
    output_dir="./models",
    overwrite_output_dir=True,
    num_train_epochs=1,
    per_device_train_batch_size=32,
    save_steps=1000,
    save_total_limit=2,
    prediction_loss_only=True,
)

trainer = Trainer(
    model=model,
    args=training_args,
    data_collator=data_collator,
    train_dataset=train_dataset,
)

trainer.train()

# Persist the final weights and the tokenizer files into output_dir itself.
# Checkpoints written during training land in checkpoint-* subfolders (and only
# when a save step is reached), so without this explicit save there is no model
# that can be loaded directly from "./models" afterwards.
trainer.save_model(training_args.output_dir)
tokenizer.save_pretrained(training_args.output_dir)


In [None]:
# Build the generation pipeline from the model and tokenizer fine-tuned earlier
# in this notebook. The previous value 'path/to/fine-tuned/model' was a
# placeholder path that does not exist, so the cell failed on a fresh run.
# Training normally leaves the network in training mode; switch to eval mode so
# dropout is disabled while sampling.
model.eval()
generator = pipeline('text-generation', model=model, tokenizer=tokenizer)

def generate_response(prompt, length=50):
    """Sample one piece of text for ``prompt`` from the module-level ``generator``.

    Args:
        prompt: Text handed to the text-generation pipeline.
        length: Forwarded to the pipeline as ``max_length``.
            NOTE(review): in transformers this limit normally counts the
            prompt tokens as well as the generated ones; confirm for the
            installed version.

    Returns:
        The ``generated_text`` field of the first candidate, with leading and
        trailing whitespace removed.
        NOTE(review): with the pipeline defaults this presumably still starts
        with the prompt itself; verify before treating it as a bare reply.
    """
    candidates = generator(
        prompt,
        max_length=length,
        do_sample=True,
        temperature=0.7,
    )
    first_candidate = candidates[0]
    return first_candidate['generated_text'].strip()

In [None]:
# Smoke test: send a single greeting through generate_response and show the
# text that comes back.
prompt = "Hi, how are you doing today?"
response = generate_response(prompt=prompt)
print(response)