Skip to content

Commit 0e400d0

Browse files
authored
[evaluation] fix: Remove "complex" type hints for AsyncEvaluators (Azure#37964)
* fix: Remove "complex" type hints from AsyncEvaluators

  These type hints introduced a regression where promptflow rejected the evaluators because they were of types promptflow doesn't support.

* style: Run isort
1 parent 3a43719 commit 0e400d0

File tree

17 files changed

+23
-28
lines changed

17 files changed

+23
-28
lines changed

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluate/_evaluate.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,8 @@
1414
from promptflow.entities import Run
1515

1616
from azure.ai.evaluation._common.math import list_sum
17-
from azure.ai.evaluation._exceptions import ErrorBlame, ErrorCategory, ErrorTarget, EvaluationException
1817
from azure.ai.evaluation._common.utils import validate_azure_ai_project
18+
from azure.ai.evaluation._exceptions import ErrorBlame, ErrorCategory, ErrorTarget, EvaluationException
1919

2020
from .._constants import (
2121
CONTENT_SAFETY_DEFECT_RATE_THRESHOLD_DEFAULT,

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_common/_base_rai_svc_eval.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
# ---------------------------------------------------------
22
# Copyright (c) Microsoft Corporation. All rights reserved.
33
# ---------------------------------------------------------
4-
from typing import Dict, Optional, Union, TypeVar
4+
from typing import Dict, Optional, TypeVar, Union
55

66
from typing_extensions import override
77

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_content_safety/_content_safety.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -2,13 +2,13 @@
22
# Copyright (c) Microsoft Corporation. All rights reserved.
33
# ---------------------------------------------------------
44
from concurrent.futures import as_completed
5-
from typing import Callable, Dict, List, Union, Optional
6-
from typing_extensions import override
5+
from typing import Callable, Dict, List, Optional, Union
76

87
from promptflow.tracing import ThreadPoolExecutorWithContext as ThreadPoolExecutor
8+
from typing_extensions import override
99

10-
from azure.ai.evaluation._evaluators._common import EvaluatorBase
1110
from azure.ai.evaluation._common._experimental import experimental
11+
from azure.ai.evaluation._evaluators._common import EvaluatorBase
1212

1313
from ._hate_unfairness import HateUnfairnessEvaluator
1414
from ._self_harm import SelfHarmEvaluator

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_content_safety/_hate_unfairness.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,8 +5,8 @@
55

66
from typing_extensions import override
77

8-
from azure.ai.evaluation._common.constants import EvaluationMetrics
98
from azure.ai.evaluation._common._experimental import experimental
9+
from azure.ai.evaluation._common.constants import EvaluationMetrics
1010
from azure.ai.evaluation._evaluators._common import RaiServiceEvaluatorBase
1111

1212

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_content_safety/_self_harm.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,8 +5,8 @@
55

66
from typing_extensions import override
77

8-
from azure.ai.evaluation._common.constants import EvaluationMetrics
98
from azure.ai.evaluation._common._experimental import experimental
9+
from azure.ai.evaluation._common.constants import EvaluationMetrics
1010
from azure.ai.evaluation._evaluators._common import RaiServiceEvaluatorBase
1111

1212

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_content_safety/_sexual.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,8 +5,8 @@
55

66
from typing_extensions import override
77

8-
from azure.ai.evaluation._common.constants import EvaluationMetrics
98
from azure.ai.evaluation._common._experimental import experimental
9+
from azure.ai.evaluation._common.constants import EvaluationMetrics
1010
from azure.ai.evaluation._evaluators._common import RaiServiceEvaluatorBase
1111

1212

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_content_safety/_violence.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,8 +5,8 @@
55

66
from typing_extensions import override
77

8-
from azure.ai.evaluation._common.constants import EvaluationMetrics
98
from azure.ai.evaluation._common._experimental import experimental
9+
from azure.ai.evaluation._common.constants import EvaluationMetrics
1010
from azure.ai.evaluation._evaluators._common import RaiServiceEvaluatorBase
1111

1212

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_eci/_eci.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,8 +3,8 @@
33
# ---------------------------------------------------------
44
from typing_extensions import override
55

6-
from azure.ai.evaluation._common.constants import _InternalEvaluationMetrics
76
from azure.ai.evaluation._common._experimental import experimental
7+
from azure.ai.evaluation._common.constants import _InternalEvaluationMetrics
88
from azure.ai.evaluation._evaluators._common import RaiServiceEvaluatorBase
99

1010

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_protected_material/_protected_material.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,8 @@
66

77
from typing_extensions import override
88

9-
from azure.ai.evaluation._common.constants import EvaluationMetrics
109
from azure.ai.evaluation._common._experimental import experimental
10+
from azure.ai.evaluation._common.constants import EvaluationMetrics
1111
from azure.ai.evaluation._evaluators._common import RaiServiceEvaluatorBase
1212

1313

sdk/evaluation/azure-ai-evaluation/azure/ai/evaluation/_evaluators/_retrieval/_retrieval.py

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -7,13 +7,10 @@
77
import math
88
import os
99
import re
10-
from typing import Union
1110

1211
from promptflow._utils.async_utils import async_run_allowing_running_loop
1312
from promptflow.core import AsyncPrompty
1413

15-
from azure.ai.evaluation._model_configurations import AzureOpenAIModelConfiguration, OpenAIModelConfiguration
16-
1714
from ..._common.math import list_mean_nan_safe
1815
from ..._common.utils import construct_prompty_model_config, validate_model_config
1916

@@ -31,9 +28,9 @@ class _AsyncRetrievalScoreEvaluator:
3128
_LLM_CALL_TIMEOUT = 600
3229
_DEFAULT_OPEN_API_VERSION = "2024-02-15-preview"
3330

34-
def __init__(self, model_config: Union[AzureOpenAIModelConfiguration, OpenAIModelConfiguration]):
31+
def __init__(self, model_config: dict):
3532
prompty_model_config = construct_prompty_model_config(
36-
model_config,
33+
validate_model_config(model_config),
3734
self._DEFAULT_OPEN_API_VERSION,
3835
USER_AGENT,
3936
)
@@ -138,7 +135,7 @@ class RetrievalEvaluator:
138135
"""
139136

140137
def __init__(self, model_config):
141-
self._async_evaluator = _AsyncRetrievalScoreEvaluator(validate_model_config(model_config))
138+
self._async_evaluator = _AsyncRetrievalScoreEvaluator(model_config)
142139

143140
def __call__(self, *, conversation, **kwargs):
144141
"""Evaluates retrieval score chat scenario.

0 commit comments

Comments
 (0)