6363 required : false
6464 default : main
6565 type : string
# Optional string input naming the extensions repo branch to use; defaults to main.
# The same value is echoed in the parameter log and forwarded to the evaluation
# workflow as the `extensions_branch` dispatch input further down in this file.
66+ extensions_branch :
67+ description : Extensions repo branch to use (for testing feature branches with skills/plugins)
68+ required : false
69+ default : main
70+ type : string
6671 instance_ids :
6772 description : >-
6873 Comma-separated instance IDs to evaluate.
@@ -157,6 +162,7 @@ jobs:
# Print the effective run parameters; each `||` supplies a fallback label or
# default branch name when the corresponding input is empty.
# NOTE(review): the github.event.inputs expressions are written directly inside
# the echo strings, so they are substituted into the script text before the
# shell runs. The dispatch script later in this file reads its values from
# shell variables instead ($EVAL_BRANCH, $BENCHMARKS_BRANCH, ...); consider the
# same approach here -- confirm against the full step definition.
157162 echo "reason: ${{ github.event.inputs.reason || 'N/A' }}"
158163 echo "eval_branch: ${{ github.event.inputs.eval_branch || 'main' }}"
159164 echo "benchmarks_branch: ${{ github.event.inputs.benchmarks_branch || 'main' }}"
165+ echo "extensions_branch: ${{ github.event.inputs.extensions_branch || 'main' }}"
160166 echo "instance_ids: ${{ github.event.inputs.instance_ids || 'N/A' }}"
161167 echo "num_infer_workers: ${{ github.event.inputs.num_infer_workers || '(default)' }}"
162168 echo "num_eval_workers: ${{ github.event.inputs.num_eval_workers || '(default)' }}"
@@ -341,6 +347,7 @@ jobs:
# Variables consumed by the dispatch script below (presumably this step's env:
# mapping -- the header is outside this view, TODO confirm).
# The three *_BRANCH values fall back to 'main' and BENCHMARK to 'swebench'
# when the matching input is empty; TRIGGER_REASON has no fallback.
341347 EVAL_WORKFLOW : ${{ env.EVAL_WORKFLOW }}
342348 EVAL_BRANCH : ${{ github.event.inputs.eval_branch || 'main' }}
343349 BENCHMARKS_BRANCH : ${{ github.event.inputs.benchmarks_branch || 'main' }}
350+ EXTENSIONS_BRANCH : ${{ github.event.inputs.extensions_branch || 'main' }}
344351 BENCHMARK : ${{ github.event.inputs.benchmark || 'swebench' }}
345352 TRIGGER_REASON : ${{ github.event.inputs.reason }}
346353 PR_NUMBER : ${{ steps.params.outputs.pr_number }}
@@ -357,7 +364,7 @@ jobs:
# `tr -d ' '` deletes only the space character, so "a, b" becomes "a,b";
# tabs and newlines are left untouched. printf '%s' emits the value verbatim,
# without echo's option or escape handling.
357364 # Normalize instance_ids: strip all spaces
358365 INSTANCE_IDS=$(printf '%s' "$INSTANCE_IDS" | tr -d ' ')
359366
# Log a one-line summary of what is about to be dispatched (old and new
# versions of the line are both shown; the new one adds the extensions branch).
360- echo "Dispatching evaluation workflow with SDK commit: $SDK_SHA (benchmark: $BENCHMARK, eval branch: $EVAL_BRANCH, benchmarks branch: $BENCHMARKS_BRANCH, tool preset: $TOOL_PRESET)"
367+ echo "Dispatching evaluation workflow with SDK commit: $SDK_SHA (benchmark: $BENCHMARK, eval branch: $EVAL_BRANCH, benchmarks branch: $BENCHMARKS_BRANCH, extensions branch: $EXTENSIONS_BRANCH, tool preset: $TOOL_PRESET)"
# Build the dispatch JSON with jq. Each value is bound with --arg as a jq
# string variable and referenced by name in the filter, rather than being
# spliced into the JSON text by the shell. Do not insert comment lines between
# the backslash-continued --arg lines: that would end the command early.
361368 PAYLOAD=$(jq -n \
362369 --arg sdk "$SDK_SHA" \
363370 --arg sdk_run_id "${{ github.run_id }}" \
@@ -367,6 +374,7 @@ jobs:
367374 --arg reason "$TRIGGER_REASON" \
368375 --arg pr "$PR_NUMBER" \
369376 --arg benchmarks "$BENCHMARKS_BRANCH" \
377+ --arg extensions "$EXTENSIONS_BRANCH" \
370378 --arg benchmark "$BENCHMARK" \
371379 --arg instance_ids "$INSTANCE_IDS" \
372380 --arg num_infer_workers "$NUM_INFER_WORKERS" \
@@ -377,7 +385,7 @@ jobs:
377385 --arg agent_type "$AGENT_TYPE" \
378386 --arg partial_archive_url "$PARTIAL_ARCHIVE_URL" \
379387 --arg triggered_by "$TRIGGERED_BY" \
380- '{ref: $ref, inputs: {sdk_commit: $sdk, sdk_workflow_run_id: $sdk_run_id, eval_limit: $eval_limit, models_json: ($models | tostring), trigger_reason: $reason, pr_number: $pr, benchmarks_branch: $benchmarks, benchmark: $benchmark, instance_ids: $instance_ids, num_infer_workers: $num_infer_workers, num_eval_workers: $num_eval_workers, enable_conversation_event_logging: $enable_conversation_event_logging, max_retries: $max_retries, tool_preset: $tool_preset, agent_type: $agent_type, partial_archive_url: $partial_archive_url, triggered_by: $triggered_by}}')
388+ '{ref: $ref, inputs: {sdk_commit: $sdk, sdk_workflow_run_id: $sdk_run_id, eval_limit: $eval_limit, models_json: ($models | tostring), trigger_reason: $reason, pr_number: $pr, benchmarks_branch: $benchmarks, extensions_branch: $extensions, benchmark: $benchmark, instance_ids: $instance_ids, num_infer_workers: $num_infer_workers, num_eval_workers: $num_eval_workers, enable_conversation_event_logging: $enable_conversation_event_logging, max_retries: $max_retries, tool_preset: $tool_preset, agent_type: $agent_type, partial_archive_url: $partial_archive_url, triggered_by: $triggered_by}}')
381389 RESPONSE=$(curl -sS -o /tmp/dispatch.out -w "%{http_code}" -X POST \
382390 -H "Authorization: token $PAT_TOKEN" \
383391 -H "Accept: application/vnd.github+json" \
0 commit comments