<a href="https://colab.research.google.com/github/farmountain/SmartGlass-AI-Agent/blob/main/colab_notebooks/Session7_Visual_OCR_and_Translation.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# 📘 Session 07: Visual OCR and Translation
In this session, we'll simulate a smart glasses view to:
- Extract text from images using Tesseract OCR
- Translate it into another language using Hugging Face MarianMT (the demo assumes French source text and translates it into English)

In [None]:
# ✅ Install Required Packages
!apt install tesseract-ocr -y
!pip install -q pytesseract transformers Pillow

In [None]:
# ✅ Load Image and Perform OCR
import pytesseract
from PIL import Image
from google.colab import files

# Open Colab's upload dialog. The result is keyed by uploaded filename;
# Image.open below relies on Colab having saved the file under that name
# in the current working directory.
uploaded = files.upload()
if not uploaded:
    # A cancelled dialog leaves nothing to iterate over; fail with a clear
    # message instead of the bare StopIteration next(iter(...)) would raise.
    raise ValueError('No image was uploaded. Re-run this cell and choose an image file.')
image_path = next(iter(uploaded))  # only the first uploaded file is processed
image = Image.open(image_path)

# OCR
# Without an explicit `lang`, Tesseract uses its default (English) model,
# which tends to drop or mangle accented characters. The demo assumes French
# text, so use French + English when both language packs are installed and
# otherwise keep Tesseract's default.
installed_langs = set(pytesseract.get_languages(config=''))
ocr_lang = 'fra+eng' if {'fra', 'eng'} <= installed_langs else None
# strip() removes the trailing newline / form-feed Tesseract may append so
# it does not leak into the translation input.
extracted_text = pytesseract.image_to_string(image, lang=ocr_lang).strip()
if not extracted_text:
    print('⚠️ No text was detected in the image.')
print('🧾 OCR Extracted Text:\n', extracted_text)

In [None]:
# ✅ Translate Using MarianMT
import re

from transformers import MarianMTModel, MarianTokenizer

src_lang = 'fr'  # Assume the text is in French for demo
trg_lang = 'en'
model_name = f'Helsinki-NLP/opus-mt-{src_lang}-{trg_lang}'

# Load model and tokenizer
model = MarianMTModel.from_pretrained(model_name)
tokenizer = MarianTokenizer.from_pretrained(model_name)

# Prepare the OCR output: blank lines separate paragraphs, while single line
# breaks inside a paragraph are layout artefacts of the image, so they are
# collapsed into spaces. Empty paragraphs are dropped.
paragraphs = [
    ' '.join(chunk.split())
    for chunk in re.split(r'\n\s*\n', extracted_text)
]
paragraphs = [paragraph for paragraph in paragraphs if paragraph]

# Tokenize and translate
if paragraphs:
    # truncation=True clips any paragraph that exceeds the tokenizer's
    # maximum length rather than passing an over-long sequence to the model.
    batch = tokenizer(paragraphs, return_tensors="pt", padding=True, truncation=True)
    translated = model.generate(**batch)
    # One decoded string per input paragraph, re-joined with blank lines.
    translated_text = "\n\n".join(
        tokenizer.batch_decode(translated, skip_special_tokens=True)
    )
else:
    # Nothing to translate; skip the model call, which would otherwise
    # generate output for an empty input.
    translated_text = ""
print("🌐 Translated Text:\n", translated_text)

In [None]:
# ✅ Summary
# Closing banner for the notebook. It is printed unconditionally and does not
# itself verify that the OCR or translation cells succeeded.
print(
    "👓 Smart Glasses OCR-to-Translation complete!",
    end="\n",
)