In [1]:
from transformers import MT5ForConditionalGeneration, MT5Tokenizer
import torch
import tqdm as notebook_tqdm

# Inference target: CPU. Replace the string with "cuda" to run on a GPU.
device = torch.device("cpu")

# Directory that both the tokenizer and the model are loaded from.
model_path = "../Trained_model_v2/"

# Tokenizer first, then the model; the model is moved onto `device` in a
# separate step so the load and the placement read as two distinct actions.
tokenizer = MT5Tokenizer.from_pretrained(model_path)
model = MT5ForConditionalGeneration.from_pretrained(model_path)
model = model.to(device)

# Translation function
def translate_nepali_to_english(texts, batch_size=None, max_length=300, num_beams=4):
    """Translate one or more Nepali strings to English.

    Relies on the module-level ``tokenizer``, ``model`` and ``device``.

    Args:
        texts: A single string, or an iterable of strings.
        batch_size: Maximum number of sentences tokenized and generated per
            call to ``model.generate``. ``None`` (the default) sends all
            inputs as one batch, which matches the previous behaviour; pass a
            positive integer to bound memory use on long input lists.
        max_length: Token limit used both to truncate each encoded input and
            to cap the length of the generated output.
        num_beams: Beam width passed to ``model.generate``.

    Returns:
        A list of decoded strings, in input order. Empty input yields ``[]``
        without touching the tokenizer or the model.

    Raises:
        ValueError: If ``batch_size`` is given and is smaller than 1.
    """
    if batch_size is not None and batch_size < 1:
        raise ValueError("batch_size must be a positive integer or None")

    if isinstance(texts, str):
        texts = [texts]
    else:
        # Materialise generators/tuples so the input can be measured and sliced.
        texts = list(texts)

    # Nothing to translate: skip tokenization/generation on an empty batch.
    if not texts:
        return []

    step = len(texts) if batch_size is None else batch_size

    translations = []
    for start in range(0, len(texts), step):
        # The task prefix is prepended to every sentence before tokenization.
        prompts = [
            "translate Nepali to English: " + t
            for t in texts[start:start + step]
        ]
        encoding = tokenizer(
            prompts,
            return_tensors="pt",
            padding=True,
            truncation=True,
            max_length=max_length
        ).to(device)

        # Inference only: no gradients are needed for generation.
        with torch.no_grad():
            outputs = model.generate(
                input_ids=encoding["input_ids"],
                attention_mask=encoding["attention_mask"],
                max_length=max_length,
                num_beams=num_beams
            )

        translations.extend(
            tokenizer.batch_decode(outputs, skip_special_tokens=True)
        )

    return translations

# Example usage: a small set of short, everyday Nepali sentences (statements
# and questions) that is passed to translate_nepali_to_english below.
# NOTE(review): the recorded output appears to mistranslate some entries
# (e.g. the Kathmandu sentence comes back as "Mumbai") — treat this list as a
# smoke test, not as an accuracy benchmark.
nepali_sentences = [
    "तपाईंको नाम के हो?",
    "म विद्यालय जान्छु।",
    "ऊ पुस्तक पढ्दैछ।",
    "मौसम आज राम्रै छ।",
    "हामी काठमाण्डौ जाँदैछौं।",
    "तपाईंलाई कफी मनपर्छ?",
    "आज शुक्रबार हो।",
    "म नेपाली भाषा सिक्दैछु।",
    "तिमीलाई भेटेर खुशी लाग्यो।",
    "मलाई भोक लागेको छ।",
    "कृपया ढोका बन्द गर्नुहोस्।",
    "यो खाना स्वादिलो छ।",
    "हामीले धेरै मजा गर्यौं।",
    "म फुटबल खेल्न मन पराउँछु।",
    "परीक्षा कहिले सुरु हुन्छ?",
    "तिमी कति वर्षको हौ?",
    "यहाँ इन्टरनेट छ?",
    "म भोली भेट्न सक्छु।",
    "कृपया मलाई मद्दत गर्नुहोस्।",
    "तपाईं कहाँ बस्नुहुन्छ?"
]

# Translate the whole sample list with a single call.
translations = translate_nepali_to_english(nepali_sentences)

# Print each source sentence followed by the English text produced for it.
for src, tgt in zip(nepali_sentences, translations):
    print(f"📝 Nepali   : {src}", f"🌍 English  : {tgt}", sep="\n")


  from .autonotebook import tqdm as notebook_tqdm
The tokenizer class you load from this checkpoint is not the same type as the class this function is called from. It may result in unexpected tokenization. 
The tokenizer class you load from this checkpoint is 'T5Tokenizer'. 
The class this function is called from is 'MT5Tokenizer'.


📝 Nepali   : तपाईंको नाम के हो?
🌍 English  : What is your name?
📝 Nepali   : म विद्यालय जान्छु।
🌍 English  : I go to school.
📝 Nepali   : ऊ पुस्तक पढ्दैछ।
🌍 English  : He reads the book.
📝 Nepali   : मौसम आज राम्रै छ।
🌍 English  : The weather is good today.
📝 Nepali   : हामी काठमाण्डौ जाँदैछौं।
🌍 English  : We are going to Mumbai.
📝 Nepali   : तपाईंलाई कफी मनपर्छ?
🌍 English  : Do you want to drink coffee?
📝 Nepali   : आज शुक्रबार हो।
🌍 English  : Today is Friday.
📝 Nepali   : म नेपाली भाषा सिक्दैछु।
🌍 English  : I learn Nepali language.
📝 Nepali   : तिमीलाई भेटेर खुशी लाग्यो।
🌍 English  : You were happy with you.
📝 Nepali   : मलाई भोक लागेको छ।
🌍 English  : I have been sick.
📝 Nepali   : कृपया ढोका बन्द गर्नुहोस्।
🌍 English  : Please open the window.
📝 Nepali   : यो खाना स्वादिलो छ।
🌍 English  : This food is very good.
📝 Nepali   : हामीले धेरै मजा गर्यौं।
🌍 English  : We have killed a lot.
📝 Nepali   : म फुटबल खेल्न मन पराउँछु।
🌍 English  : I want to play football.
📝 Nepali   : परीक्षा