In [None]:
from transformers import TrOCRProcessor, VisionEncoderDecoderModel
from PIL import Image
import torch

# Choose the compute device up front: CUDA when one is available, CPU otherwise
device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")

# Fetch the pretrained TrOCR checkpoint. The processor is used below for image
# preprocessing and for decoding generated ids; the model produces those ids.
processor = TrOCRProcessor.from_pretrained("microsoft/trocr-large-printed")
model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-large-printed")

# Move the weights onto the chosen device (.to returns the same module)
model = model.to(device)

# Function to predict text from an image
def predict_text_from_image(image_path) -> str:
    """Run TrOCR on a single image file and return the recognized text.

    Relies on the module-level ``processor``, ``model`` and ``device``.

    Args:
        image_path: Location of the image; passed straight to
            ``PIL.Image.open``.

    Returns:
        The decoded text of the first sequence generated for the image,
        with special tokens stripped.
    """
    # Image.open is lazy and keeps the underlying file open; the context
    # manager closes it deterministically. convert() returns a separate
    # image, so the RGB copy stays usable after the file is closed.
    with Image.open(image_path) as source_image:
        image = source_image.convert("RGB")

    # Preprocess into pixel tensors and move them to the same device as the model
    pixel_values = processor(images=image, return_tensors="pt").pixel_values
    pixel_values = pixel_values.to(device)

    # Generate token ids, then decode; one input image -> take the first result
    generated_ids = model.generate(pixel_values)
    predicted_text = processor.batch_decode(generated_ids, skip_special_tokens=True)[0]

    return predicted_text

# Example usage: run OCR on one sample image and print the result
image_path = "/content/number-441.png"  # Replace with your image path
# Delegates to predict_text_from_image, which returns the decoded text
predicted_text = predict_text_from_image(image_path)
print("Predicted Text:", predicted_text)
