## Test Connection to LLM NIM

In [None]:
import os

from google.colab import userdata

# Copy NVIDIA_API_KEY out of the Colab user-data store into this process's
# environment, then read it back into `apikey` for the request cells below.
os.environ['NVIDIA_API_KEY'] = userdata.get('NVIDIA_API_KEY')
apikey = os.environ.get('NVIDIA_API_KEY')

In [None]:
import requests
import json

# Chat-completions endpoint; authenticated with the bearer token held in
# `apikey`, which the first cell loads.
url = "https://integrate.api.nvidia.com/v1/chat/completions"
headers = {
    "Content-Type": "application/json",
    "Authorization": f"Bearer {apikey}",
}

data = {
    "model": "meta/llama-3.2-3b-instruct",
    "messages": [
        {"role": "user", "content": "Explain RAG in one sentence."},
    ],
    "max_tokens": 100,
}

try:
    # requests applies no timeout by default; bound the wait so a stalled
    # connection cannot hang the notebook cell indefinitely.
    response = requests.post(url, json=data, headers=headers, timeout=60)
except requests.exceptions.RequestException as exc:
    # DNS failure, refused connection, timeout, etc. -- report it rather than
    # ending the connectivity test with a raw traceback.
    response = None
    print(f"API request failed: {exc}")

if response is not None:
    # Print the response text and status code for debugging
    print(f"Status Code: {response.status_code}")
    print(f"Response Text: {response.text}")

    # Try to parse JSON only if the status code is 200
    if response.status_code == 200:
        try:
            print(response.json()["choices"][0]["message"]["content"])
        except ValueError:
            # Both json.JSONDecodeError and the simplejson variant that
            # requests may raise are ValueError subclasses.
            print("Error decoding JSON response.")
        except (KeyError, IndexError, TypeError) as exc:
            # Valid JSON, but not the choices[0].message.content layout.
            print(f"Unexpected response structure: {exc!r}")
    else:
        print("API request failed.")

## Test Connection to Embedding Model

In [None]:
import requests
import json

# Embeddings endpoint; authenticated with the bearer token held in `apikey`,
# which the first cell loads.
url = "https://integrate.api.nvidia.com/v1/embeddings"
headers = {
    "Content-Type": "application/json",
    "Authorization": f"Bearer {apikey}",
}

data = {
    "input": "What is NVIDIA NIM?",
    "model": "nvidia/llama-3.2-nv-embedqa-1b-v2",
    "input_type": "passage",
}

try:
    # requests applies no timeout by default; bound the wait so a stalled
    # connection cannot hang the notebook cell indefinitely.
    response = requests.post(url, json=data, headers=headers, timeout=60)
except requests.exceptions.RequestException as exc:
    # DNS failure, refused connection, timeout, etc. -- report it rather than
    # ending the connectivity test with a raw traceback.
    response = None
    print(f"API request failed: {exc}")

if response is not None:
    # Print the full response for debugging
    print(f"Status Code: {response.status_code}")
    print(f"Response Text: {response.text}")

    # Try to parse JSON only if the status code is 200
    if response.status_code == 200:
        try:
            response_json = response.json()
            # Look the vector up once instead of re-indexing for every print.
            embedding = response_json["data"][0]["embedding"]
        except ValueError:
            # Both json.JSONDecodeError and the simplejson variant that
            # requests may raise are ValueError subclasses.
            print("Error decoding JSON response.")
        except (KeyError, IndexError, TypeError) as exc:
            # Valid JSON, but not the data[0].embedding layout.
            print(f"Unexpected response structure: {exc!r}")
        else:
            print(embedding)
            print(f"Size of Embedding: {len(embedding)}")
            print(embedding[:5])
    else:
        print("API request failed.")

In [None]:
len