Skip to content

Commit 87916c9

Browse files
authored
Add test cases for eval result converter UT (#43805)
* update * rename * run black * fix result counts * update * Fix bug * run black * fix bug * Add UT
1 parent 2d6516d commit 87916c9

File tree

6 files changed

+504
-2
lines changed

6 files changed

+504
-2
lines changed

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluate/_evaluate.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1823,6 +1823,8 @@ def _convert_results_to_aoai_evaluation_results(
18231823
metrics_mapped = _EvaluatorMetricMapping.EVALUATOR_NAME_METRICS_MAPPINGS.get(evaluator_name, [])
18241824
if metrics_mapped and len(metrics_mapped) > 0:
18251825
metrics.extend(metrics_mapped)
1826+
else:
1827+
metrics.append(criteria_name)
18261828
else:
18271829
metrics.append(criteria_name)
18281830
elif isinstance(evaluator, AzureOpenAIGrader):

sdk/evaluation/azure-ai-evaluation/tests/unittests/data/evaluation_util_convert_error_summary.json

Lines changed: 18 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -7,5 +7,23 @@
77
"log_path": null,
88
"error_message": "(UserError) Missing inputs for line 1: 'data.item.query, data.item.response'",
99
"error_code": "INVALID VALUE"
10+
},
11+
"Fluency": {
12+
"status": "Failed",
13+
"duration": "0:00:00.000869",
14+
"completed_lines": 0,
15+
"failed_lines": 0,
16+
"log_path": null,
17+
"error_message": "(SystemError) 100% of the batch run failed. (UserError) OpenAI API hits BadRequestError: Error code: 400 - {'error': {'message': \"Unsupported parameter: 'max_tokens' is not supported with this model. Use 'max_completion_tokens' instead.\", 'type': 'invalid_request_error', 'param': 'max_tokens', 'code': 'unsupported_parameter'}} [Error reference: https://platform.openai.com/docs/guides/error-codes/api-errors]",
18+
"error_code": "FAILED_EXECUTION"
19+
},
20+
"ViolenceContentCustomEvaluator": {
21+
"status": "Failed",
22+
"duration": "0:00:01.002324",
23+
"completed_lines": 0,
24+
"failed_lines": 1,
25+
"log_path": null,
26+
"error_message": "(SystemError) 100% of the batch run failed. Prompt template is not initialized.",
27+
"error_code": "FAILED_EXECUTION"
1028
}
1129
}

sdk/evaluation/azure-ai-evaluation/tests/unittests/data/evaluation_util_convert_eval_meta_data.json

Lines changed: 17 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -10,6 +10,23 @@
1010
"type": "azure_ai_evaluator",
1111
"name": "violence",
1212
"evaluator_name": "violence"
13+
},
14+
{
15+
"type": "azure_ai_evaluator",
16+
"id": "ViolenceContentCustomEvaluator_35feb949-e01b-4502-8011-d22347d092af",
17+
"name": "ViolenceContentCustomEvaluator",
18+
"evaluator_name": "custom.violence",
19+
"evaluator_version": "1",
20+
"initialization_parameters": {
21+
"threshold": 3
22+
},
23+
"data_mapping": {
24+
"query": "{{item.question}}",
25+
"response": "{{item.answer}}",
26+
"context": "{{item.context}}",
27+
"ground_truth": "{{item.ground_truth}}"
28+
},
29+
"registry_name": ""
1330
}
1431
]
1532
}

0 commit comments

Comments
 (0)