# Using the requests library

In [25]:
import requests
import json

# Completions endpoint of the custom API server
url = "http://localhost:5000/v1/completions"

# Request body sent to the custom API
payload = {
    "prompt": "Write a short story about a brave knight.",
    "max_tokens": 2,
    "temperature": 0.7,
    "top_p": 1.0
}

# Set the headers (optional, depending on your API setup)
headers = {
    "Content-Type": "application/json"
}

# requests applies no timeout by default, so without an explicit limit this
# cell would block forever if the server accepts the connection but never
# answers. Raise the value if the model needs longer to generate.
timeout_seconds = 30

# POST the payload; `json=` makes requests serialize the dict into the JSON body
response = requests.post(url, headers=headers, json=payload, timeout=timeout_seconds)

# Pretty-print the JSON body on success, otherwise show the status and raw body
if response.status_code == 200:
    print("Response from API:")
    print(json.dumps(response.json(), indent=4))
else:
    print(f"Error: {response.status_code}")
    print(response.text)


Response from API:
{
    "choices": [
        {
            "text": " Sir Edward"
        }
    ]
}


# Using the openai library

In [48]:
from openai import OpenAI

# Build an OpenAI client whose base URL is the custom LLM server
client = OpenAI(base_url="http://localhost:5000/v1", api_key="test_api_key")

# Ask the custom server for a plain text completion
response = client.completions.create(
    prompt="Can you write a short poem about the ocean?",
    model="llama",
    temperature=0.7,
    max_tokens=5,
)

# Show the raw object returned by the client
print("Response from custom API:")
print(response)


Response from custom API:
Completion(id=None, choices=[CompletionChoice(finish_reason=None, index=None, logprobs=None, text=' The ocean is a vast')], created=None, model=None, object=None, system_fingerprint=None, usage=None)


In [49]:
from openai import OpenAI

# Build an OpenAI client whose base URL is the custom LLM server
client = OpenAI(base_url="http://localhost:5000/v1", api_key="test_api_key")

# Ask the custom server for a chat completion: a system message followed by
# the user's request
response = client.chat.completions.create(
    messages=[
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Can you write a short poem about the ocean?"},
    ],
    model="llama",
    temperature=0.7,
    max_tokens=5,
)

# Show the raw object returned by the client
print("Response from custom API:")
print(response)


Response from custom API:
ChatCompletion(id=None, choices=[Choice(finish_reason=None, index=None, logprobs=None, message=ChatCompletionMessage(content="The ocean's waves crash", refusal=None, role='assistant', audio=None, function_call=None, tool_calls=None))], created=None, model=None, object=None, service_tier=None, system_fingerprint=None, usage=None)


In [50]:
# Pull the message out of the first choice and print its role, then its text,
# each on its own line
first_message = response.choices[0].message
print(first_message.role, first_message.content, sep="\n")

assistant
The ocean's waves crash
