diff --git a/examples/03_github_workflows/02_pr_review/prompt.py b/examples/03_github_workflows/02_pr_review/prompt.py
index 7b27818b72..f37409e01e 100644
--- a/examples/03_github_workflows/02_pr_review/prompt.py
+++ b/examples/03_github_workflows/02_pr_review/prompt.py
@@ -36,8 +36,21 @@
 PROMPT = """{skill_trigger}
 /github-pr-review
 
-When posting a review, keep the review body brief unless your active review instructions
-require a longer structured format.
+When posting a review, keep the review body brief unless your active review
+instructions require a longer structured format.
+
+## Review decision policy (eval / benchmark risk)
+
+You MAY approve clearly low-risk changes (docs, typo fixes, formatting, or
+pure refactors with no behavior changes).
+
+Do NOT submit an APPROVE review when the PR changes agent behavior or anything
+that affects benchmark/evaluation performance.
+Examples include: prompt templates, tool calling/execution, planning/loop logic,
+memory/condenser behavior, terminal/stdin/stdout handling, or evaluation harness code.
+
+If a PR is in this category (or you are uncertain), leave a COMMENT review and
+explicitly flag it for a human maintainer to decide after running lightweight evals.
 
 Review the PR changes below and identify issues that need to be addressed.