Commit 3871804

Aprilk/agent target insights samples (#43792)

* Added samples
* Ran black

1 parent 19ef60c commit 3871804

33 files changed (+2190 −2511 lines)
sdk/ai/azure-ai-projects/azure/ai/projects/models/_models.py

Lines changed: 3 additions & 1 deletion
@@ -5671,7 +5671,9 @@ class FileSearchTool(Tool, discriminator="file_search"):
         visibility=["read", "create", "update", "delete", "query"]
     )
     """Ranking options for search."""
-    filters: Optional[Union["_models.ComparisonFilter", "_models.CompoundFilter"]] = rest_field(visibility=["read", "create", "update", "delete", "query"])
+    filters: Optional[Union["_models.ComparisonFilter", "_models.CompoundFilter"]] = rest_field(
+        visibility=["read", "create", "update", "delete", "query"]
+    )
     """A filter to apply. Is either a ComparisonFilter type or a CompoundFilter type."""
 
     @overload
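
The reflowed `filters` field is the metadata filter a file-search tool applies to its results, taking either a ComparisonFilter or a CompoundFilter. A minimal sketch of supplying one (hedged: the `vector_store_ids` argument and the `key`/`type`/`value` fields are assumptions based on the OpenAI file-search filter schema this model mirrors; check the generated classes in `_models.py` for the exact constructors):

# Sketch only - the argument names below are assumptions, verify against the generated models.
from azure.ai.projects.models import ComparisonFilter, FileSearchTool

file_search = FileSearchTool(
    vector_store_ids=["<vector-store-id>"],  # placeholder id; assumed parameter name
    filters=ComparisonFilter(key="region", type="eq", value="emea"),  # assumed field names
)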
sample_agent_evaluation.py (new file)

Lines changed: 127 additions & 0 deletions

@@ -0,0 +1,127 @@
# ------------------------------------
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.
# ------------------------------------
"""
DESCRIPTION:
    This sample demonstrates how to create and run an evaluation for an Azure AI agent
    using the synchronous AIProjectClient.

    The OpenAI compatible Evals calls in this sample are made using
    the OpenAI client from the `openai` package. See https://platform.openai.com/docs/api-reference
    for more information.

USAGE:
    python sample_agent_evaluation.py

    Before running the sample:

    pip install "azure-ai-projects>=2.0.0b1" azure-identity python-dotenv

    Set these environment variables with your own values:
    1) AZURE_AI_PROJECT_ENDPOINT - The Azure AI Project endpoint, as found in the Overview
       page of your Azure AI Foundry portal.
    2) AZURE_AI_MODEL_DEPLOYMENT_NAME - The deployment name of the AI model, as found under the "Name" column in
       the "Models + endpoints" tab in your Azure AI Foundry project.
    3) AZURE_AI_AGENT_NAME - The name to use for the agent created by this sample.
"""

import os
import time
from pprint import pprint
from dotenv import load_dotenv
from azure.identity import DefaultAzureCredential
from azure.ai.projects import AIProjectClient
from azure.ai.projects.models import PromptAgentDefinition
from openai.types.eval_create_params import DataSourceConfigCustom

load_dotenv()

project_client = AIProjectClient(
    endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
    credential=DefaultAzureCredential(),
)

with project_client:

    openai_client = project_client.get_openai_client()

    agent = project_client.agents.create_version(
        agent_name=os.environ["AZURE_AI_AGENT_NAME"],
        definition=PromptAgentDefinition(
            model=os.environ["AZURE_AI_MODEL_DEPLOYMENT_NAME"],
            instructions="You are a helpful assistant that answers general questions",
        ),
    )
    print(f"Agent created (id: {agent.id}, name: {agent.name}, version: {agent.version})")

    data_source_config = DataSourceConfigCustom(
        type="custom",
        item_schema={"type": "object", "properties": {"query": {"type": "string"}}, "required": ["query"]},
        include_sample_schema=True,
    )
    testing_criteria = [
        {
            "type": "azure_ai_evaluator",
            "name": "violence_detection",
            "evaluator_name": "builtin.violence",
            "data_mapping": {"query": "{{item.query}}", "response": "{{item.response}}"},
        }
    ]
    eval_object = openai_client.evals.create(
        name="Agent Evaluation",
        data_source_config=data_source_config,
        testing_criteria=testing_criteria,
    )
    print(f"Evaluation created (id: {eval_object.id}, name: {eval_object.name})")

    data_source = {
        "type": "azure_ai_target_completions",
        "source": {
            "type": "file_content",
            "content": [
                {"item": {"query": "What is the capital of France?"}},
                {"item": {"query": "How do I reverse a string in Python?"}},
            ],
        },
        "input_messages": {
            "type": "template",
            "template": [
                {"type": "message", "role": "user", "content": {"type": "input_text", "text": "{{item.query}}"}}
            ],
        },
        "target": {
            "type": "azure_ai_agent",
            "name": agent.name,
            "version": agent.version,  # Version is optional. Defaults to latest version if not specified
        },
    }

    agent_eval_run = openai_client.evals.runs.create(
        eval_id=eval_object.id, name=f"Evaluation Run for Agent {agent.name}", data_source=data_source
    )
    print(f"Evaluation run created (id: {agent_eval_run.id})")

    while agent_eval_run.status not in ["completed", "failed"]:
        agent_eval_run = openai_client.evals.runs.retrieve(run_id=agent_eval_run.id, eval_id=eval_object.id)
        print(f"Waiting for eval run to complete... current status: {agent_eval_run.status}")
        time.sleep(5)

    if agent_eval_run.status == "completed":
        print("\n✓ Evaluation run completed successfully!")
        print(f"Result Counts: {agent_eval_run.result_counts}")

        output_items = list(
            openai_client.evals.runs.output_items.list(run_id=agent_eval_run.id, eval_id=eval_object.id)
        )
        print(f"\nOUTPUT ITEMS (Total: {len(output_items)})")
        print(f"{'-'*60}")
        pprint(output_items)
        print(f"{'-'*60}")
    else:
        print("\n✗ Evaluation run failed.")

    openai_client.evals.delete(eval_id=eval_object.id)
    print("Evaluation deleted")

    project_client.agents.delete(agent_name=agent.name)
    print("Agent deleted")
sample_agent_response_evaluation.py (new file)

Lines changed: 116 additions & 0 deletions

@@ -0,0 +1,116 @@
# ------------------------------------
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.
# ------------------------------------
"""
DESCRIPTION:
    This sample demonstrates how to create and run an evaluation for an Azure AI agent response
    using the synchronous AIProjectClient.

    The OpenAI compatible Evals calls in this sample are made using
    the OpenAI client from the `openai` package. See https://platform.openai.com/docs/api-reference
    for more information.

USAGE:
    python sample_agent_response_evaluation.py

    Before running the sample:

    pip install "azure-ai-projects>=2.0.0b1" azure-identity python-dotenv

    Set these environment variables with your own values:
    1) AZURE_AI_PROJECT_ENDPOINT - The Azure AI Project endpoint, as found in the Overview
       page of your Azure AI Foundry portal.
    2) AZURE_AI_MODEL_DEPLOYMENT_NAME - The deployment name of the AI model, as found under the "Name" column in
       the "Models + endpoints" tab in your Azure AI Foundry project.
    3) AZURE_AI_AGENT_NAME - The name to use for the agent created by this sample.
"""

import os
import time
from pprint import pprint
from dotenv import load_dotenv
from azure.identity import DefaultAzureCredential
from azure.ai.projects import AIProjectClient
from azure.ai.projects.models import PromptAgentDefinition

load_dotenv()

project_client = AIProjectClient(
    endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"],
    credential=DefaultAzureCredential(),
)

with project_client:

    openai_client = project_client.get_openai_client()

    agent = project_client.agents.create_version(
        agent_name=os.environ["AZURE_AI_AGENT_NAME"],
        definition=PromptAgentDefinition(
            model=os.environ["AZURE_AI_MODEL_DEPLOYMENT_NAME"],
            instructions="You are a helpful assistant that answers general questions",
        ),
    )
    print(f"Agent created (id: {agent.id}, name: {agent.name}, version: {agent.version})")

    conversation = openai_client.conversations.create(
        items=[{"type": "message", "role": "user", "content": "What is the size of France in square miles?"}],
    )
    print(f"Created conversation with initial user message (id: {conversation.id})")

    response = openai_client.responses.create(
        conversation=conversation.id,
        extra_body={"agent": {"name": agent.name, "type": "agent_reference"}},
        input="",  # TODO: Remove 'input' once service is fixed
    )
    print(f"Response output: {response.output_text} (id: {response.id})")

    data_source_config = {"type": "azure_ai_source", "scenario": "responses"}
    testing_criteria = [
        {"type": "azure_ai_evaluator", "name": "violence_detection", "evaluator_name": "builtin.violence"}
    ]
    eval_object = openai_client.evals.create(
        name="Agent Response Evaluation",
        data_source_config=data_source_config,
        testing_criteria=testing_criteria,
    )
    print(f"Evaluation created (id: {eval_object.id}, name: {eval_object.name})")

    data_source = {
        "type": "azure_ai_responses",
        "item_generation_params": {
            "type": "response_retrieval",
            "data_mapping": {"response_id": "{{item.resp_id}}"},
            "source": {"type": "file_content", "content": [{"item": {"resp_id": response.id}}]},
        },
    }

    response_eval_run = openai_client.evals.runs.create(
        eval_id=eval_object.id, name=f"Evaluation Run for Agent {agent.name}", data_source=data_source
    )
    print(f"Evaluation run created (id: {response_eval_run.id})")

    while response_eval_run.status not in ["completed", "failed"]:
        response_eval_run = openai_client.evals.runs.retrieve(run_id=response_eval_run.id, eval_id=eval_object.id)
        print(f"Waiting for eval run to complete... current status: {response_eval_run.status}")
        time.sleep(5)

    if response_eval_run.status == "completed":
        print("\n✓ Evaluation run completed successfully!")
        print(f"Result Counts: {response_eval_run.result_counts}")

        output_items = list(
            openai_client.evals.runs.output_items.list(run_id=response_eval_run.id, eval_id=eval_object.id)
        )
        print(f"\nOUTPUT ITEMS (Total: {len(output_items)})")
        print(f"{'-'*60}")
        pprint(output_items)
        print(f"{'-'*60}")
    else:
        print("\n✗ Evaluation run failed.")

    openai_client.evals.delete(eval_id=eval_object.id)
    print("Evaluation deleted")

    project_client.agents.delete(agent_name=agent.name)
    print("Agent deleted")

sdk/ai/azure-ai-projects/samples/evaluation/sample_agentic_evaluators/sample_coherence.py

Lines changed: 28 additions & 52 deletions
@@ -34,7 +34,7 @@
 from openai.types.evals.create_eval_jsonl_run_data_source_param import (
     CreateEvalJSONLRunDataSourceParam,
     SourceFileContent,
-    SourceFileContentContent
+    SourceFileContentContent,
 )
 
 
@@ -46,46 +46,36 @@ def main() -> None:
         "AZURE_AI_PROJECT_ENDPOINT"
     ] # Sample : https://<account_name>.services.ai.azure.com/api/projects/<project_name>
     model_deployment_name = os.environ.get("AZURE_AI_MODEL_DEPLOYMENT_NAME", "") # Sample : gpt-4o-mini
-
+
     with DefaultAzureCredential() as credential:
-        with AIProjectClient(endpoint=endpoint, credential=credential, api_version="2025-11-15-preview") as project_client:
+        with AIProjectClient(
+            endpoint=endpoint, credential=credential, api_version="2025-11-15-preview"
+        ) as project_client:
             print("Creating an OpenAI client from the AI Project client")
-
+
             client = project_client.get_openai_client()
             client._custom_query = {"api-version": "2025-11-15-preview"}
-
+
             data_source_config = {
                 "type": "custom",
                 "item_schema": {
                     "type": "object",
-                    "properties": {
-                        "query": {
-                            "type": "string"
-                        },
-                        "response": {
-                            "type": "string"
-                        }
-                    },
-                    "required": []
+                    "properties": {"query": {"type": "string"}, "response": {"type": "string"}},
+                    "required": [],
                 },
-                "include_sample_schema": True
+                "include_sample_schema": True,
             }
-
+
             testing_criteria = [
                 {
                     "type": "azure_ai_evaluator",
                     "name": "coherence",
                     "evaluator_name": "builtin.coherence",
-                    "initialization_parameters": {
-                        "deployment_name": f"{model_deployment_name}"
-                    },
-                    "data_mapping": {
-                        "query": "{{item.query}}",
-                        "response": "{{item.response}}"
-                    }
+                    "initialization_parameters": {"deployment_name": f"{model_deployment_name}"},
+                    "data_mapping": {"query": "{{item.query}}", "response": "{{item.response}}"},
                 }
             ]
-
+
             print("Creating Eval Group")
             eval_object = client.evals.create(
                 name="Test Coherence Evaluator with inline data",
@@ -111,34 +101,21 @@ def main() -> None:
             eval_run_object = client.evals.runs.create(
                 eval_id=eval_object.id,
                 name="inline_data_run",
-                metadata={
-                    "team": "eval-exp",
-                    "scenario": "inline-data-v1"
-                },
+                metadata={"team": "eval-exp", "scenario": "inline-data-v1"},
                 data_source=CreateEvalJSONLRunDataSourceParam(
-                    type="jsonl",
+                    type="jsonl",
                     source=SourceFileContent(
                         type="file_content",
-                        content= [
+                        content=[
                             # Success example - coherent response
-                            SourceFileContentContent(
-                                item= {
-                                    "query": success_query,
-                                    "response": success_response
-                                }
-                            ),
+                            SourceFileContentContent(item={"query": success_query, "response": success_response}),
                             # Failure example - incoherent response
-                            SourceFileContentContent(
-                                item= {
-                                    "query": failure_query,
-                                    "response": failure_response
-                                }
-                            )
-                        ]
-                    )
-                )
+                            SourceFileContentContent(item={"query": failure_query, "response": failure_response}),
+                        ],
+                    ),
+                ),
             )
-
+
             print(f"Eval Run created")
             pprint(eval_run_object)
 
@@ -151,16 +128,15 @@ def main() -> None:
 
             while True:
                 run = client.evals.runs.retrieve(run_id=eval_run_response.id, eval_id=eval_object.id)
-                if run.status == "completed" or run.status == "failed":
-                    output_items = list(client.evals.runs.output_items.list(
-                        run_id=run.id, eval_id=eval_object.id
-                    ))
+                if run.status == "completed" or run.status == "failed":
+                    output_items = list(client.evals.runs.output_items.list(run_id=run.id, eval_id=eval_object.id))
                     pprint(output_items)
                     print(f"Eval Run Status: {run.status}")
                     print(f"Eval Run Report URL: {run.report_url}")
                     break
                 time.sleep(5)
                 print("Waiting for eval run to complete...")
-
+
+
 if __name__ == "__main__":
-    main()
+    main()
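
Because the openai package's request params here (CreateEvalJSONLRunDataSourceParam, SourceFileContent, SourceFileContentContent) are TypedDicts, the inline data source above can equally be passed as a plain dict, which is the style the two new agent samples in this commit use. A rough dict equivalent of the same payload (a sketch; the shape is copied from the typed version above):

data_source = {
    "type": "jsonl",
    "source": {
        "type": "file_content",
        "content": [
            {"item": {"query": success_query, "response": success_response}},  # coherent example
            {"item": {"query": failure_query, "response": failure_response}},  # incoherent example
        ],
    },
}
# client.evals.runs.create(eval_id=eval_object.id, name="inline_data_run", data_source=data_source)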
