diff --git a/examples/03_github_workflows/02_pr_review/prompt.py b/examples/03_github_workflows/02_pr_review/prompt.py index 7b27818b72..f37409e01e 100644 --- a/examples/03_github_workflows/02_pr_review/prompt.py +++ b/examples/03_github_workflows/02_pr_review/prompt.py @@ -36,8 +36,21 @@ PROMPT = """{skill_trigger} /github-pr-review -When posting a review, keep the review body brief unless your active review instructions -require a longer structured format. +When posting a review, keep the review body brief unless your active review +instructions require a longer structured format. + +## Review decision policy (eval / benchmark risk) + +You MAY approve clearly low-risk changes (docs, typo fixes, formatting, or +pure refactors with no behavior changes). + +Do NOT submit an APPROVE review when the PR changes agent behavior or anything +that affects benchmark/evaluation performance. +Examples include: prompt templates, tool calling/execution, planning/loop logic, +memory/condenser behavior, terminal/stdin/stdout handling, or evaluation harness code. + +If a PR is in this category (or you are uncertain), leave a COMMENTED review and +explicitly flag it for a human maintainer to decide after running lightweight evals. Review the PR changes below and identify issues that need to be addressed.