google
diff --git a/‎src/google/adk/evaluation/app_details.py‎
Lines changed: 1 addition & 1 deletion b/‎src/google/adk/evaluation/app_details.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/google/adk/evaluation/eval_metrics.py‎
Lines changed: 20 additions & 0 deletions b/‎src/google/adk/evaluation/eval_metrics.py‎
Lines changed: 20 additions & 0 deletions
@@ -39,7 +39,7 @@ class AgentDetails(EvalBaseModel):
 class AppDetails(EvalBaseModel):
   """Contains details about the App (the agentic system).
 
-  This structure is only a projection of the acutal app. Only details
+  This structure is only a projection of the actual app. Only details
   that are relevant to the Eval System are captured here.
   """
 
 
@@ -52,6 +52,8 @@ class PrebuiltMetrics(Enum):
       "rubric_based_final_response_quality_v1"
   )
 
+  HALLUCINATIONS_V1 = "hallucinations_v1"
+
   RUBRIC_BASED_TOOL_USE_QUALITY_V1 = "rubric_based_tool_use_quality_v1"
 
 
@@ -130,6 +132,24 @@ class RubricsBasedCriterion(BaseCriterion):
   )
 
 
+class HallucinationsCriterion(BaseCriterion):
+  """Criterion to use when evaluating an agent's response for hallucinations."""
+
+  judge_model_options: JudgeModelOptions = Field(
+      default_factory=JudgeModelOptions,  # built fresh for each instance
+      description="Options for the judge model.",
+  )
+
+  evaluate_intermediate_nl_responses: bool = Field(
+      default=False,
+      description=(
+          "Whether any intermediate NL responses should be evaluated"
+          " for hallucinations or not. By default, the metric only evaluates"
+          " final response from the Agent for hallucinations."
+      ),
+  )
+
+
 class EvalMetric(EvalBaseModel):
   """A metric used to evaluate a particular aspect of an eval case."""