In [4]:
import torch
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM

# 1. 加载预训练翻译模型（中英互译）
model_name = "t5-base"  # 轻量版T5，可替换为"t5-base"（效果更好）
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSeq2SeqLM.from_pretrained(model_name)

# 2. 定义翻译任务（T5需要明确指令）
# 英译中："translate English to Chinese: 文本"
# 中译英："translate Chinese to English: 文本"
task = "translate English to Chinese: "
text = "Hugging Face Transformers is a powerful library for natural language processing."

# 3. 编码（拼接任务指令+文本）
inputs = tokenizer(
    task + text,
    return_tensors="pt",
    padding=True,
    truncation=True,
    max_length=512
)

# 4. 生成翻译结果
with torch.no_grad():
    outputs = model.generate(
        **inputs,
        max_new_tokens=100,
        num_beams=4,  # 束搜索（提升翻译准确性）
        early_stopping=True  # 生成EOS时停止
    )

# 5. 解码
translation = tokenizer.decode(outputs[0], skip_special_tokens=True)
print(f"原文：{text}")
print(f"译文：{translation}")

原文：Hugging Face Transformers is a powerful library for natural language processing.
译文：Chinesisch Hugging Face Transformers ist eine leistungsstarke Bibliothek für die Verarbeitung natürlicher Sprachen.
