In [2]:
! pip install -r requirements.txt --quiet

# Creating and Deploying an Azure AI Agent Using the SDK

This notebook demonstrates how to create and deploy an Azure AI Agent using the Azure SDK.



In [5]:

from os import environ
from dotenv import load_dotenv
from azure.ai.projects import AIProjectClient
from azure.identity import DefaultAzureCredential


# Load variables from a .env file into the process environment so that settings
# such as PROJECT_ENDPOINT (read from `environ` further down) can be supplied there.
# override=True asks python-dotenv to let .env values replace variables that are
# already set. As the last expression in the cell, the call's return value is displayed.
load_dotenv(override=True)




True

## Create a project client

In [6]:

# Connect to the Azure AI project. The endpoint comes from the PROJECT_ENDPOINT
# environment variable; indexing `environ` raises KeyError when it is not set.
project_endpoint = environ["PROJECT_ENDPOINT"]

# Authenticate with Azure's default credential.
credential = DefaultAzureCredential()

project_client = AIProjectClient(endpoint=project_endpoint, credential=credential)

## Create an agent and a thread

In [None]:
# System prompt for the first-stage agent: it analyzes one batch of failed
# evaluation records and produces a structured summary for the final summarizer.
instructions = """You are an Evaluation Batch Analyzer. 
Your role is to process a batch of failed agent evaluation records. Each record includes:
- user query
- system response
- failed evaluation metrics (groundedness, coherence, relevance)

For each record:
1. Summarize the main issue with the response.
2. List the metrics that failed and the reasons.
3. Capture any notable context (e.g., repeated mistakes, misunderstandings).

At the batch level:
- Identify recurring failure patterns across multiple records.
- Highlight potential root causes (e.g., knowledge gaps, unclear policy wording).

Return results in a structured, concise format that can be consumed by a final summarizer agent.
"""

# The model value must match a deployment available to the project, so allow it
# to be configured through MODEL_DEPLOYMENT_NAME instead of hard-coding it.
# Falls back to "gpt-4o" (the previous fixed value) when the variable is unset or empty.
model_deployment = environ.get("MODEL_DEPLOYMENT_NAME") or "gpt-4o"

# Register the batch-analyzer agent with the project.
agent = project_client.agents.create_agent(
    model=model_deployment,
    name="evaluation-batch-analyzer",
    instructions=instructions,
)

# Show the service-assigned ID of the new agent.
print(f"Created agent, ID: {agent.id}")




Created agent, ID: asst_ZTfa5QERUSpZijn55JOKI1Ia


In [None]:
# System prompt for the second-stage agent: it merges the per-batch summaries
# produced by the Evaluation Batch Analyzer into a single global summary.
final_instructions = """You are a Final Evaluation Summarizer. 
Your role is to take multiple batch summaries from the Evaluation Batch Analyzer agent 
and consolidate them into one global summary.

Your output should:
1. Highlight the most common failure patterns across all batches.
2. Provide overall statistics (e.g., frequency of each failed metric).
3. Identify systemic issues or recurring themes that impact response quality.
4. Suggest high-level areas for improvement (e.g., knowledge coverage, response clarity).

Keep the summary structured, concise, and ready for stakeholders to review.
"""

# The model value must match a deployment available to the project, so allow it
# to be configured through MODEL_DEPLOYMENT_NAME instead of hard-coding it.
# Falls back to "gpt-4o" (the previous fixed value) when the variable is unset or empty.
model_deployment = environ.get("MODEL_DEPLOYMENT_NAME") or "gpt-4o"

# Register the final-summarizer agent with the project.
final_agent = project_client.agents.create_agent(
    model=model_deployment,
    name="final-evaluation-summarizer",
    instructions=final_instructions,
)

# Show the service-assigned ID of the new agent.
print(f"Created final summarizer agent, ID: {final_agent.id}")

Created final summarizer agent, ID: asst_mCYcJ6BvIeUdMd4bfBDSiUY0
