# Step 1: Install Required Libraries
Make sure the necessary libraries are installed.

In [1]:
!pip install requests

# Step 2: Set Up REST API Interaction
In this step, we will define a function that interacts with the Flask API to process documents.

In [2]:
import requests
import os

def process_document_via_api(
    file_path,
    api_url="http://localhost:5000/process_document",
    timeout=(10, 300),
):
    """
    Ask the document processor API to process the document at ``file_path``.

    Only the path is sent, as the JSON payload ``{"file_path": file_path}``;
    the file contents are not uploaded.

    Args:
        file_path: Path to the document. It must exist on the machine running
            this code, otherwise no request is made.
        api_url: Endpoint that receives the POST request. Override it when the
            API is running on a different host or port.
        timeout: Forwarded to ``requests.post``. Either a single number of
            seconds, a ``(connect, read)`` tuple, or ``None`` to wait
            indefinitely. A finite default keeps the notebook cell from
            hanging forever when the server stops responding.

    Returns:
        The JSON-decoded response body when the API answers with status 200.

    Raises:
        ValueError: If ``file_path`` does not exist locally.
        requests.HTTPError: If the API answers with any status other than 200.

    Connection failures and timeouts raised by ``requests.post`` are not
    caught here and propagate to the caller.
    """
    # Fail fast before touching the network if the path is wrong.
    if not os.path.exists(file_path):
        raise ValueError(f"The file at {file_path} does not exist.")

    payload = {"file_path": file_path}
    response = requests.post(api_url, json=payload, timeout=timeout)

    if response.status_code == 200:
        print("Document processed successfully.")
        return response.json()

    # Anything else is reported and turned into an exception.
    print(f"Error: {response.status_code}")
    print(response.text)

    # raise_for_status() only raises for 4xx/5xx responses ...
    response.raise_for_status()
    # ... so raise explicitly for other unexpected statuses (e.g. 204) instead
    # of silently falling through and returning None.
    raise requests.HTTPError(
        f"Unexpected status code {response.status_code} from {api_url}",
        response=response,
    )

# Step 3: Process a Document via the REST API
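Provide the file path to the document you want to process. Only the path is sent to the API, not the file contents, so the API server presumably needs to be able to read the file at that same path.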

In [3]:
# Example file path (adjust this to point to your document).
# The path is checked for existence locally before any request is sent.
file_path = "/home/jovyan/work/sample_document.pdf"

# Call the REST API to process the document. Despite its name, `response`
# holds the value returned by process_document_via_api (the API's decoded
# JSON on success), not a requests.Response object.
response = process_document_via_api(file_path)

# Output the API response: as the cell's last expression it is rendered
# by the notebook.
response

# Step 4: Perform Semantic Search Query (Optional)
Once the document is processed, you can extend this step to query the embeddings in the database.
For example, you could add code here that runs queries directly against the database using `psycopg2` (it is not installed in Step 1, so install it first).