In [None]:
!pip install -q transformers sentencepiece tqdm

import pathlib
import re

import torch
from tqdm.auto import tqdm
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline

# Load the model, preferring the first GPU and falling back to CPU when no
# CUDA device is available (pipeline convention: 0 = first GPU, -1 = CPU).
MODEL_ID   = "milyiyo/paraphraser-german-mt5-small"
DEVICE     = 0 if torch.cuda.is_available() else -1
tokenizer  = AutoTokenizer.from_pretrained(MODEL_ID)
model      = AutoModelForSeq2SeqLM.from_pretrained(MODEL_ID)
# The pipeline places `model` on DEVICE itself, so no explicit .to(...) call
# is needed. Sampling (instead of greedy decoding) is enabled so repeated
# calls on the same text can yield different paraphrases.
paraphraser= pipeline("text2text-generation", model=model, tokenizer=tokenizer,
                      device=DEVICE, do_sample=True, temperature=0.9, top_p=0.95,
                      max_length=512)

# Grab the first 3 templates by file name. glob() yields entries in
# filesystem order, which is not stable across machines, so sort before
# slicing to make the selection reproducible.
SRC_DIR    = pathlib.Path("data/golden_dataset_anonymized_granular")
examples   = sorted(SRC_DIR.glob("*.txt"))[:3]

# Print each selected template next to one sampled paraphrase of it.
for p in examples:
    # Decode explicitly as UTF-8: the platform default encoding (e.g. cp1252
    # on Windows) can mis-decode umlauts/ß in German text.
    # NOTE(review): assumes the templates are stored as UTF-8 — confirm.
    text = p.read_text(encoding="utf-8")
    print(f"\n📄 {p.name} (orig):\n{text}\n")
    # The pipeline returns a list with one dict per requested sequence; only
    # one sequence is requested, so take the first entry's generated text.
    out = paraphraser("paraphrase: " + text, num_return_sequences=1)[0]["generated_text"]
    print(f"✏️ paraphrase:\n{out}\n{'—'*60}")
