In [None]:
import json
import requests

# URL of the local Ollama chat endpoint that deepseek_query() POSTs to.
# Change the host/port here if your Ollama server listens somewhere else.
OLLAMA_API_URL = "http://localhost:11434/api/chat"

def deepseek_query(model_name: str, prompt: str, stream: bool = False) -> str:
    """
    Send a prompt to a DeepSeek model via the Ollama chat API and return the reply text.

    Parameters:
      model_name (str): Name of the DeepSeek model to run (e.g., "deepseek-r1:1.5b").
      prompt (str): The prompt to send to the model, as a single user message.
      stream (bool): Whether to ask Ollama for a streamed reply. The streamed
        fragments are consumed here and joined, so the return value is the
        complete reply text in both modes.

    Returns:
      str: The AI-generated response, or "No content returned." when the
        response carries no message content.

    Raises:
      Exception: If the server answers with a non-200 status, or reports an
        error part-way through a streamed reply.
    """
    payload = {
        "model": model_name,
        "messages": [{"role": "user", "content": prompt}],
        "stream": stream
    }
    headers = {"Content-Type": "application/json"}

    # stream=stream lets requests hand over the body incrementally when
    # streaming is requested; the with-block releases the connection even if
    # we stop reading early or raise.
    with requests.post(
        OLLAMA_API_URL,
        data=json.dumps(payload),
        headers=headers,
        stream=stream,
    ) as response:
        if response.status_code != 200:
            raise Exception(f"Error {response.status_code}: {response.text}")

        if not stream:
            result = response.json()
            # Extract and return the text from the model's message response.
            return result.get("message", {}).get("content", "No content returned.")

        # A streamed reply is newline-delimited JSON: one object per line, each
        # holding a fragment of the message. response.json() cannot parse that,
        # so decode line by line and stitch the fragments together.
        fragments = []
        for raw_line in response.iter_lines():
            if not raw_line:
                continue  # skip keep-alive / blank lines
            chunk = json.loads(raw_line)
            if "error" in chunk:
                # The status line was already sent as 200, so a failure during
                # generation can only be reported inside the stream itself.
                raise Exception(f"Error while streaming: {chunk['error']}")
            message = chunk.get("message") or {}
            if "content" in message:
                fragments.append(message["content"])
            if chunk.get("done"):
                break
        return "".join(fragments) if fragments else "No content returned."

if __name__ == "__main__":
    # Demo run: send one question to the model and print whatever comes back.
    user_prompt = "Explain the advantages of using H800 GPUs for AI model training over H100 GPUs."
    model = "deepseek-r1:1.5b"  # Swap in whichever model tag you prefer.

    try:
        answer = deepseek_query(model_name=model, prompt=user_prompt)
        print("DeepSeek Response:\n", answer)
    except Exception as err:
        # Top-level boundary of the demo: report the failure instead of a traceback.
        print("An error occurred:", err)