In [1]:
# OpenAIChatCompletion: chat with an Azure OpenAI deployment through Semantic Kernel's OpenAI connector
import os
from openai import AsyncOpenAI
from semantic_kernel import Kernel
from semantic_kernel.connectors.ai.open_ai import OpenAIChatCompletion, OpenAIPromptExecutionSettings
from semantic_kernel.kernel import ChatHistory

# Connection settings for the Azure OpenAI resource, read from the environment.
# The four os.environ[...] lookups raise KeyError when the variable is missing.
api_key  = os.environ["AZURE_OPENAI_API_KEY"]  # Azure OpenAI key (not an openai.com key)
endpoint = os.environ["AZURE_OPENAI_ENDPOINT"]
deploy   = os.environ["AZURE_OPENAI_DEPLOYMENT_NAME"]
# NOTE(review): `model` is not referenced anywhere in this cell; it is kept
# because later cells may rely on it — confirm before removing.
model    = os.environ["AZURE_OPENAI_MODEL"]
api_ver  = os.environ.get("AZURE_OPENAI_API_VERSION", "2025-01-01-preview")

# Point the plain OpenAI async client at the Azure deployment route.
# Trailing slashes are stripped from the endpoint so that a value such as
# "https://<resource>.openai.azure.com/" does not yield "...com//openai/...".
client = AsyncOpenAI(
    api_key=api_key,
    base_url=f"{endpoint.rstrip('/')}/openai/deployments/{deploy}",
    # The key is additionally sent as an "api-key" header and the API version
    # as an "api-version" query parameter on every request.
    default_headers={"api-key": api_key},
    default_query={"api-version": api_ver},
)

chat_service = OpenAIChatCompletion(
    ai_model_id=deploy,
    async_client=client,
)

kernel = Kernel()
kernel.add_service(chat_service)

history = ChatHistory()
history.add_system_message("You are a helpful assistant.")
history.add_user_message("What is capital of France ?")

prompt_execution_settings = OpenAIPromptExecutionSettings(temperature=0.2, top_p=1.0, max_tokens=400)

response = await chat_service.get_chat_message_content(
    chat_history=history,
    kernel=kernel,
    settings=prompt_execution_settings
)
print(response.content)

The capital of France is Paris.
