Skip to content

Commit 1ae362e

Browse files
committed
fix(cli): fix tool metric model in cli eval
1 parent 993a9f6 commit 1ae362e

File tree

2 files changed: 7 additions (+7) and 4 deletions (-4)

2 files changed: 7 additions (+7) and 4 deletions (-4)

veadk/cli/cli_eval.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -205,7 +205,7 @@ def eval(
205205
],
206206
model=judge_model,
207207
),
208-
ToolCorrectnessMetric(threshold=0.5),
208+
ToolCorrectnessMetric(threshold=0.5, model=judge_model),
209209
]
210210

211211
asyncio.run(

veadk/evaluation/deepeval_evaluator/deepeval_evaluator.py

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -13,6 +13,7 @@
1313
# limitations under the License.
1414

1515
import time
16+
from typing import Optional
1617

1718
from deepeval import evaluate
1819
from deepeval.evaluate import CacheConfig
@@ -21,9 +22,9 @@
2122
from deepeval.models import LocalModel
2223
from deepeval.test_case import LLMTestCase
2324
from deepeval.test_case.llm_test_case import ToolCall
24-
from typing_extensions import override
25-
from typing import Optional
2625
from google.adk.evaluation.eval_set import EvalSet
26+
from typing_extensions import override
27+
2728
from veadk.config import getenv
2829
from veadk.evaluation.base_evaluator import BaseEvaluator, EvalResultData, MetricResult
2930
from veadk.evaluation.types import EvalResultCaseData, EvalResultMetadata
@@ -113,7 +114,9 @@ def __init__(
113114
super().__init__(agent=agent, name=name)
114115

115116
if not judge_model_api_key:
116-
judge_model_api_key = getenv("MODEL_JUDGE_API_KEY")
117+
judge_model_api_key = getenv("MODEL_JUDGE_API_KEY") or getenv(
118+
"MODEL_AGENT_API_KEY"
119+
)
117120
if not judge_model_name:
118121
judge_model_name = getenv(
119122
"MODEL_JUDGE_NAME",

0 commit comments

Comments
 (0)