In [1]:
from pathlib import Path

from ollama_ocr import OCRProcessor

# Sample image used by every single-image cell in this notebook
# (point this at your own file).
image_path = Path("input/img.png")

# Build the OCR processor backed by the 'llama3.2-vision:11b' model.
ocr = OCRProcessor(model_name='llama3.2-vision:11b')

# OCR the sample image, requesting the "markdown" output format, and show it.
# NOTE(review): confirm that the installed ollama_ocr version names this
# keyword `image` (some releases document it as `image_path`) -- TODO verify.
result = ocr.process_image(image=image_path, format_type="markdown")
print(result)

In [2]:
# Batch mode: hand the 'input' path to the processor and keep the returned
# dict for the cells below. The run recorded in this notebook took roughly
# 57 minutes for 2 images, so expect this cell to be slow.
input_dir = 'input'
batch_results = ocr.process_batch(input_dir)
print(batch_results['statistics'])

Processing images:   0%|          | 0/2 [00:00<?, ?it/s]

Processing images: 100%|██████████| 2/2 [56:54<00:00, 1707.14s/it]


{'total': 2, 'successful': 2, 'failed': 0}


In [3]:
# Human-readable summary of the batch run's 'statistics' entry.
stats = batch_results['statistics']
print("\nProcessing Statistics:")
for label, key in (
    ("Total images", 'total'),
    ("Successfully processed", 'successful'),
    ("Failed", 'failed'),
):
    print(f"{label}: {stats[key]}")


Processing Statistics:
Total images: 2
Successfully processed: 2
Failed: 0


In [6]:
# Show the OCR text for every entry in batch_results['results'],
# each under a "File:" header followed by a 50-dash rule.
rule = "-" * 50
for image_file, extracted in batch_results['results'].items():
    print(f"\nFile: {image_file}", rule, f"Extracted Text: {extracted}", sep="\n")




File: input\img.png
--------------------------------------------------
Extracted Text: **Invoice #1024**

**Billed To:**
Really Great Company

**Pay To:**
Avery Davis
123 Anywhere St., Any City
123-456-7890

**Bank Information:**
Really Great Bank
Account Name: John Smith
BSB: 000-000
Account Number: 0000 0000

**Description of Services:**

*   **Content Plan:** $200.00
*   **Copy Writing:** $100.00
*   **Website Design:** $250.00
*   **Website Development:** $500.00
*   **SEO:** $200.00

**Sub-Total:** $1,250.00 (30% discount applied)

**Total:** $875.00

**Payment Terms:**

*   Payment is required within 14 business days of invoice date.
*   Please send remittance to hello@reallygreatsite.com.

**Thank You for Your Business**

This invoice outlines the services provided by Really Great Company to Avery Davis, including content planning, copywriting, website design, website development, and SEO. The total amount due is $875.00, with a 30% discount applied to the sub-total of $1,250.0

In [7]:
# List per-file failures from the batch run; prints nothing when the
# 'errors' entry is empty.
errors = batch_results['errors']
if errors:
    print("\nErrors:")
    for failed_file, message in errors.items():
        print(f"Error in {failed_file}: {message}")

In [None]:
# NOTE: this cell repeats the import and the OCRProcessor construction already
# done in the first cell, with the same model name. When the notebook is run
# top to bottom it simply rebinds `ocr` to a new instance.
from ollama_ocr import OCRProcessor

# Create an instance (same 'llama3.2-vision:11b' model as the first cell)
ocr = OCRProcessor(model_name='llama3.2-vision:11b')



In [None]:
# Same sample image (image_path comes from the first cell), this time
# requesting the "key_value" output format.
result = ocr.process_image(image=image_path, format_type="key_value")
print(result)

In [None]:
# Same sample image (image_path comes from the first cell), requesting
# the "text" output format.
result = ocr.process_image(image=image_path, format_type="text")
print(result)

In [None]:
# Same sample image (image_path comes from the first cell), requesting
# the "json" output format.
result = ocr.process_image(image=image_path, format_type="json")
print(result)

In [None]:
# Same sample image (image_path comes from the first cell), requesting
# the "structured" output format.
result = ocr.process_image(image=image_path, format_type="structured")
print(result)