### Aparavi Pipeline Demo Notebook

This notebook demonstrates how to use the Aparavi Data Toolchain SDK for document processing and PII anonymization.

![Aparavi pipeline](../images/pipeline.png)

In [None]:
# Install/upgrade the packages listed in ../requirements.txt (-q: quiet, -U: upgrade).
%pip install -q -U -r ../requirements.txt

In [None]:
# Load environment variables and read the Aparavi connection settings
from dotenv import load_dotenv
import os
from aparavi_dtc_sdk import AparaviClient

ENV_PATH = "../env"
DEFAULT_BASE_URL = "https://eaas.aparavi.com/"

# load_dotenv returns False when it did not set any variable (e.g. the file is
# missing or empty), so report that instead of always claiming success.
env_loaded = load_dotenv(dotenv_path=ENV_PATH, override=True)

api_key = os.getenv("APARAVI_API_KEY")
# `or` instead of getenv's default argument: a variable that is defined but
# empty (e.g. `APARAVI_BASE_URL=` in the env file) also falls back to the default.
base_url = os.getenv("APARAVI_BASE_URL") or DEFAULT_BASE_URL

if env_loaded:
    print("✓ Environment loaded")
else:
    print(f"✗ No variables loaded from {ENV_PATH}; using the existing process environment")
print("APARAVI_BASE_URL:", repr(base_url))
# Only report whether the key is present; never echo the secret itself.
print("APARAVI_API_KEY set:", bool(api_key))


In [None]:
# Create the SDK client when an API key is available; otherwise `client`
# stays None and the user is told which setting is missing.
client = None
if api_key:
    client = AparaviClient(api_key=api_key, base_url=base_url)
    print("✓ Client initialized")
    print("  Endpoint:", base_url)
else:
    print("Please set APARAVI_API_KEY in ../env")


In [None]:
# Run the anonymization pipeline over the sample PDFs.
# `result` is bound before the call so that a failed run leaves it as None
# rather than undefined (or stale from an earlier execution of this cell).
result = None
try:
    if client is None:
        # Give an actionable message instead of an AttributeError on None.
        raise RuntimeError(
            "Aparavi client is not initialized; set APARAVI_API_KEY in ../env "
            "and re-run the cells above"
        )

    result = client.execute_pipeline_workflow(
        pipeline="../pipelines/anonymize_pipeline.json",
        file_glob="../tests/sampleData/*.pdf",
    )

    if result:
        print("✓ Document processed successfully!")
        # Status fields are only printed when the SDK hands back a dict.
        if isinstance(result, dict):
            print(f"  Status: {result.get('status', 'Unknown')}")
            print(f"  Completed: {result.get('completed', False)}")
    else:
        # Make an empty/None response visible instead of printing nothing.
        print("✗ Pipeline returned no result")
except Exception as e:
    # Demo notebook: report the failure and keep the notebook runnable.
    print(f"✗ Error: {e}")


In [None]:
import sys

# Make the repository root importable so `tools.render` resolves; the check
# keeps re-running this cell from stacking duplicate entries on sys.path.
if ".." not in sys.path:
    sys.path.insert(0, "..")
from tools.render import render_aparavi_result

# Render the result, if the processing cell produced one. Looking the name up
# via globals() avoids a NameError when that cell failed before binding it.
pipeline_result = globals().get("result")
if pipeline_result is None:
    print("Nothing to render: run the processing cell successfully first.")
else:
    render_aparavi_result(pipeline_result)