### OICM Inference for models deployed with: text-embeddings-inference
##### ref: https://github.com/huggingface/text-embeddings-inference

In [9]:
import requests
import json
from openai import OpenAI
import os

In [31]:
# Connection settings for the deployed model. Everything is read from the
# environment so that no credential is stored in the notebook itself.
# NOTE: os.getenv returns None for an unset variable; in that case the URL and
# the Authorization header below will literally contain "None".
api_key = os.getenv('OI_API_KEY')  # your valid API key
model_version_id = os.getenv('OI_MODEL_VERSION_ID')  # model version id

# Platform host, e.g. develop.openinnovation.ai. Set the OICM_HOST environment
# variable to target a different deployment; the default keeps the previous URL.
oicm_host = os.getenv('OICM_HOST', 'develop.openinnovation.ai')

# URL pattern: https://inference.{oicm_host}/models/{model_version_id}/proxy
# The route used by each request (/embed, /rerank, /predict) is appended to it.
base_url = f"https://inference.{oicm_host}/models/{model_version_id}/proxy"

# Bearer-token header sent with every request.
headers = {
    "Authorization": f"Bearer {api_key}"
}

#### Embedding Model

In [17]:
# Request body for the /embed route: the text to embed is passed under "inputs".
payload = {
    "inputs": "this is an example of a text to embed"
}

# The timeout (seconds) keeps the cell from hanging forever if the endpoint is unreachable.
response = requests.post(f"{base_url}/embed", json=payload, headers=headers, timeout=30)
# Raise on 4xx/5xx (e.g. invalid API key or model id) instead of displaying an error body as a result.
response.raise_for_status()

response.json()

[[-0.015143932,
  -0.0026477021,
  0.026366921,
  -0.010427436,
  -0.0058458988,
  -0.034748647,
  -0.0028270567,
  -0.00983077,
  0.065917306,
  0.010747078,
  0.013460483,
  0.019746779,
  0.045630686,
  0.014788775,
  -0.00985208,
  -0.008133115,
  0.016635595,
  -0.054523837,
  -0.028853027,
  -0.019107495,
  -0.06449667,
  0.036879595,
  -0.10381975,
  -0.021309473,
  -0.00836752,
  0.05031877,
  0.019789398,
  0.0075009344,
  0.056114946,
  0.04761957,
  -0.021749869,
  0.039038956,
  0.0052740946,
  -0.056342248,
  -0.021607805,
  0.006460322,
  0.02775914,
  -0.042164344,
  -0.016706627,
  -0.033441667,
  0.017502181,
  -0.017303292,
  0.038953718,
  -0.04179498,
  -0.05864367,
  -0.017473768,
  0.031935796,
  -0.00078489893,
  0.0041802083,
  -0.0053877453,
  0.014227625,
  -0.008658749,
  0.01923535,
  0.0066485554,
  0.00024350513,
  -0.0028465905,
  -0.0355442,
  -0.053330507,
  -0.018922811,
  0.042164344,
  0.033214364,
  0.022232885,
  0.03142437,
  -0.053529397,
  -0.00

#### Reranking Model

In [28]:
# Request body for the /rerank route: one query plus the candidate texts to score against it.
payload = {
  "query": "What is the capital of the United States?",
  "texts": [
    "Carson City is the capital city of the American state of Nevada.",
    "The Commonwealth of the Northern Mariana Islands is a group of islands in the Pacific Ocean. Its capital is Saipan.",
    "Washington, D.C. (also known as simply Washington or D.C., and officially as the District of Columbia) is the capital of the United States. It is a federal district.",
    "Capital punishment (the death penalty) has existed in the United States since before the United States was a country. As of 2017, capital punishment is legal in 30 of the 50 states."
  ]
}

# The timeout (seconds) keeps the cell from hanging forever if the endpoint is unreachable.
response = requests.post(f"{base_url}/rerank", json=payload, headers=headers, timeout=30)
# Raise on 4xx/5xx (e.g. invalid API key or model id) instead of displaying an error body as a result.
response.raise_for_status()

response.json()

[{'index': 2, 'score': 0.9986646},
 {'index': 0, 'score': 0.0012893283},
 {'index': 1, 'score': 7.662102e-05},
 {'index': 3, 'score': 7.602479e-05}]

#### Classification Model

In [33]:
# Request body for the /predict route: the text to classify is passed under "inputs".
payload = {"inputs": "Abu Dhabi is great!"}

# The timeout (seconds) keeps the cell from hanging forever if the endpoint is unreachable.
response = requests.post(f"{base_url}/predict", json=payload, headers=headers, timeout=30)
# Raise on 4xx/5xx (e.g. invalid API key or model id) instead of displaying an error body as a result.
response.raise_for_status()

response.json()

[{'score': 0.99332774, 'label': 'admiration'},
 {'score': 0.0022727316, 'label': 'approval'},
 {'score': 0.0012649657, 'label': 'neutral'},
 {'score': 0.00031487487, 'label': 'gratitude'},
 {'score': 0.00031242447, 'label': 'excitement'},
 {'score': 0.00028446573, 'label': 'joy'},
 {'score': 0.00025006142, 'label': 'realization'},
 {'score': 0.00022240923, 'label': 'optimism'},
 {'score': 0.00020975187, 'label': 'disapproval'},
 {'score': 0.0001732125, 'label': 'annoyance'},
 {'score': 0.00017186452, 'label': 'curiosity'},
 {'score': 0.00016528051, 'label': 'love'},
 {'score': 0.00013074763, 'label': 'pride'},
 {'score': 0.00012672496, 'label': 'disappointment'},
 {'score': 0.00011139838, 'label': 'confusion'},
 {'score': 0.00010629708, 'label': 'surprise'},
 {'score': 0.000102624996, 'label': 'amusement'},
 {'score': 8.57464e-05, 'label': 'caring'},
 {'score': 8.441703e-05, 'label': 'sadness'},
 {'score': 7.776861e-05, 'label': 'anger'},
 {'score': 5.7342975e-05, 'label': 'desire'},
 