
Commit ba4cb37

Evaluation sample cleanup and update Readme (#44032)
1 parent 1aabd76 commit ba4cb37

33 files changed: +379 -307 lines

sdk/ai/azure-ai-projects/README.md

Lines changed: 70 additions & 3 deletions
@@ -21,11 +21,11 @@ resources in your Microsoft Foundry Project. Use it to:
   * Model Context Protocol (MCP)
   * SharePoint
   * Web Search
-* **Get an OpenAI client** using `.get_openai_client()` method to run "Responses" and "Conversations" operations with your Agent.
+* **Get an OpenAI client** using `.get_openai_client()` method to run "Responses", "Conversations", and "Evals" operations with your Agent.
 * **Manage memory stores** for Agent conversations, using the `.memory_store` operations.
-* **Run Evaluations** to assess the performance of your generative AI application, using the `.evaluation_rules`,
+* **Explore additional evaluation tools** to assess the performance of your generative AI application, using the `.evaluation_rules`,
   `.evaluation_taxonomies`, `.evaluators`, `.insights`, and `.schedules` operations.
-* **Run Red Team operations** to identify risks associated with your generative AI application, using the ".red_teams" operations.
+* **Run Red Team scans** to identify risks associated with your generative AI application, using the ".red_teams" operations.
 * **Enumerate AI Models** deployed to your Foundry Project using the `.deployments` operations.
 * **Enumerate connected Azure resources** in your Foundry project using the `.connections` operations.
 * **Upload documents and create Datasets** to reference them using the `.datasets` operations.
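Editorial aside (not part of this commit): the bullets above also mention the `.deployments` and `.connections` operations, which this diff leaves unchanged. A minimal sketch of how those enumerations are typically used, assuming an `AZURE_AI_PROJECT_ENDPOINT` environment variable (the name is an assumption) and that both `.list()` calls return items with a `.name` attribute:

```python
import os

from azure.identity import DefaultAzureCredential
from azure.ai.projects import AIProjectClient

# Sketch only: the environment variable name AZURE_AI_PROJECT_ENDPOINT is an assumption,
# not taken from this commit.
with (
    DefaultAzureCredential() as credential,
    AIProjectClient(endpoint=os.environ["AZURE_AI_PROJECT_ENDPOINT"], credential=credential) as project_client,
):
    # Enumerate AI models deployed to the Foundry project (.deployments operations)
    for deployment in project_client.deployments.list():
        print(f"Deployment: {deployment.name}")

    # Enumerate Azure resources connected to the project (.connections operations)
    for connection in project_client.connections.list():
        print(f"Connection: {connection.name}")
```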
@@ -561,6 +561,73 @@ Evaluation in Azure AI Project client library provides quantitative, AI-assisted
 
 The code below shows some evaluation operations. Full list of sample can be found under "evaluation" folder in the [package samples][samples]
 
+<!-- SNIPPET:sample_agent_evaluation.agent_evaluation_basic -->
+
+```python
+with (
+    DefaultAzureCredential() as credential,
+    AIProjectClient(endpoint=endpoint, credential=credential) as project_client,
+    project_client.get_openai_client() as openai_client,
+):
+    agent = project_client.agents.create_version(
+        agent_name=os.environ["AZURE_AI_AGENT_NAME"],
+        definition=PromptAgentDefinition(
+            model=os.environ["AZURE_AI_MODEL_DEPLOYMENT_NAME"],
+            instructions="You are a helpful assistant that answers general questions",
+        ),
+    )
+    print(f"Agent created (id: {agent.id}, name: {agent.name}, version: {agent.version})")
+
+    data_source_config = DataSourceConfigCustom(
+        type="custom",
+        item_schema={"type": "object", "properties": {"query": {"type": "string"}}, "required": ["query"]},
+        include_sample_schema=True,
+    )
+    testing_criteria = [
+        {
+            "type": "azure_ai_evaluator",
+            "name": "violence_detection",
+            "evaluator_name": "builtin.violence",
+            "data_mapping": {"query": "{{item.query}}", "response": "{{item.response}}"},
+        }
+    ]
+    eval_object = openai_client.evals.create(
+        name="Agent Evaluation",
+        data_source_config=data_source_config,
+        testing_criteria=testing_criteria,  # type: ignore
+    )
+    print(f"Evaluation created (id: {eval_object.id}, name: {eval_object.name})")
+
+    data_source = {
+        "type": "azure_ai_target_completions",
+        "source": {
+            "type": "file_content",
+            "content": [
+                {"item": {"query": "What is the capital of France?"}},
+                {"item": {"query": "How do I reverse a string in Python?"}},
+            ],
+        },
+        "input_messages": {
+            "type": "template",
+            "template": [
+                {"type": "message", "role": "user", "content": {"type": "input_text", "text": "{{item.query}}"}}
+            ],
+        },
+        "target": {
+            "type": "azure_ai_agent",
+            "name": agent.name,
+            "version": agent.version,  # Version is optional. Defaults to latest version if not specified
+        },
+    }
+
+    agent_eval_run: Union[RunCreateResponse, RunRetrieveResponse] = openai_client.evals.runs.create(
+        eval_id=eval_object.id, name=f"Evaluation Run for Agent {agent.name}", data_source=data_source  # type: ignore
+    )
+    print(f"Evaluation run created (id: {agent_eval_run.id})")
+```
+
+<!-- END SNIPPET -->
+
 ### Deployments operations
 
 The code below shows some Deployments operations, which allow you to enumerate the AI models deployed to your AI Foundry Projects. These models can be seen in the "Models + endpoints" tab in your AI Foundry Project. Full samples can be found under the "deployment" folder in the [package samples][samples].
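Editorial aside (not part of this commit): the new README snippet ends right after the evaluation run is created. A hedged follow-up sketch for waiting on the run and reading per-row results, assuming the OpenAI client's `evals.runs.retrieve` and `evals.runs.output_items.list` methods and the usual `queued`/`in_progress` status values:

```python
import time

# Poll the run created by the snippet above until it leaves the queued/in_progress states.
# The status strings and result shapes follow the OpenAI evals API and are assumptions here.
run = openai_client.evals.runs.retrieve(agent_eval_run.id, eval_id=eval_object.id)
while run.status in ("queued", "in_progress"):
    time.sleep(5)
    run = openai_client.evals.runs.retrieve(agent_eval_run.id, eval_id=eval_object.id)

print(f"Evaluation run finished with status: {run.status}")

# Each output item corresponds to one row of the inline dataset passed in data_source.
for item in openai_client.evals.runs.output_items.list(run_id=run.id, eval_id=eval_object.id):
    print(item.status, item.results)
```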

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_coherence.py

Lines changed: 6 additions & 6 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     using inline dataset content.
 
 USAGE:
@@ -75,15 +75,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name="Test Coherence Evaluator with inline data",
-        data_source_config=data_source_config,
-        testing_criteria=testing_criteria,  # type: ignore
+        data_source_config=data_source_config,
+        testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)
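For context (also not part of the diff): the hunk above shows only the tail of sample_coherence.py, after `testing_criteria` has been built. A hypothetical sketch of what that setup likely resembles, modeled on the `builtin.violence` example in the README snippet; the evaluator name `builtin.coherence` and the query/response mapping are assumptions, not taken from this commit:

```python
# Hypothetical setup for the coherence sample; names are assumptions (see note above).
data_source_config = {
    "type": "custom",
    "item_schema": {
        "type": "object",
        "properties": {"query": {"type": "string"}, "response": {"type": "string"}},
        "required": ["query", "response"],
    },
    "include_sample_schema": True,
}

testing_criteria = [
    {
        "type": "azure_ai_evaluator",
        "name": "coherence_check",
        "evaluator_name": "builtin.coherence",
        "data_mapping": {"query": "{{item.query}}", "response": "{{item.response}}"},
    }
]
```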

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_fluency.py

Lines changed: 4 additions & 4 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     using inline dataset content.
 
 USAGE:
@@ -74,15 +74,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name="Test Fluency Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_generic_agentic_evaluator/agent_utils.py

Lines changed: 3 additions & 3 deletions
@@ -50,15 +50,15 @@ def run_evaluator(
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name=f"Test {evaluator_name} Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_generic_agentic_evaluator/sample_generic_agentic_evaluator.py

Lines changed: 1 addition & 1 deletion
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     for Any agentic evaluator using inline dataset content.
 
 USAGE:

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_groundedness.py

Lines changed: 4 additions & 4 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     for Groundedness evaluator using inline dataset content.
 
 USAGE:
@@ -90,15 +90,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name="Test Groundedness Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_intent_resolution.py

Lines changed: 4 additions & 4 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     for Intent Resolution evaluator using inline dataset content.
 
 USAGE:
@@ -86,15 +86,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name="Test Intent Resolution Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_relevance.py

Lines changed: 4 additions & 4 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     for Relevance evaluator using inline dataset content.
 
 USAGE:
@@ -79,15 +79,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name="Test Relevance Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_response_completeness.py

Lines changed: 4 additions & 4 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     for Response Completeness evaluator using inline dataset content.
 
 USAGE:
@@ -77,15 +77,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
    eval_object = client.evals.create(
         name="Test Response Completeness Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)

sdk/ai/azure-ai-projects/samples/evaluations/agentic_evaluators/sample_task_adherence.py

Lines changed: 4 additions & 4 deletions
@@ -7,7 +7,7 @@
 """
 DESCRIPTION:
     Given an AIProjectClient, this sample demonstrates how to use the synchronous
-    `openai.evals.*` methods to create, get and list eval group and and eval runs
+    `openai.evals.*` methods to create, get and list evaluation and and eval runs
     for Task Adherence evaluator using inline dataset content.
 
 USAGE:
@@ -87,15 +87,15 @@ def main() -> None:
         }
     ]
 
-    print("Creating Eval Group")
+    print("Creating Evaluation")
     eval_object = client.evals.create(
         name="Test Task Adherence Evaluator with inline data",
         data_source_config=data_source_config,
         testing_criteria=testing_criteria,  # type: ignore
     )
-    print(f"Eval Group created")
+    print(f"Evaluation created")
 
-    print("Get Eval Group by Id")
+    print("Get Evaluation by Id")
     eval_object_response = client.evals.retrieve(eval_object.id)
     print("Eval Run Response:")
     pprint(eval_object_response)
