Skip to content

fix: decrease threshold to get green light #18

fix: decrease threshold to get green light

fix: decrease threshold to get green light #18

Workflow file for this run

# This workflow runs MCP tool calling evaluations on pushes to the branches
# listed under `on.push.branches`.
# It evaluates AI models' ability to correctly identify and call MCP tools.
name: MCP tool calling evaluations

on:
  # Run evaluations on every push to the branches listed below.
  # NOTE(review): only 'feat/evaluations' is listed; add 'master' here if the
  # evaluations should also run on master merges — confirm the intended branch.
  push:
    branches:
      - 'feat/evaluations'
    # Disabled filter: uncomment to skip runs for documentation-only changes.
    # paths-ignore:
    #   - '**.md'
    #   - 'docs/**'
    #   - '.gitignore'
    #   - '.dockerignore'
    #   - 'LICENSE'
jobs:
  # Single job: check out the repo, set up Node.js 22, install, build, then
  # run the evaluation script.
  evaluations:
    name: MCP tool calling evaluations
    runs-on: ubuntu-latest
    # Least privilege for GITHUB_TOKEN: checkout only needs read access.
    # NOTE(review): assumes the npm scripts below do not write to the repository
    # through GITHUB_TOKEN — confirm before merging.
    permissions:
      contents: read
    steps:
      - name: Checkout code
        uses: actions/checkout@v4

      - name: Use Node.js 22
        uses: actions/setup-node@v4
        with:
          node-version: 22
          # Enable setup-node's built-in npm caching, keyed on the lockfile.
          cache: 'npm'
          cache-dependency-path: 'package-lock.json'

      # `npm ci` installs from package-lock.json; dev dependencies are
      # requested explicitly via --include=dev.
      - name: Install Node dependencies
        run: npm ci --include=dev

      - name: Build project
        run: npm run build

      # The secrets below are exposed as environment variables to this step only.
      - name: Run evaluations
        run: npm run evals:run
        env:
          PHOENIX_API_KEY: ${{ secrets.PHOENIX_API_KEY }}
          PHOENIX_BASE_URL: ${{ secrets.PHOENIX_BASE_URL }}
          OPENROUTER_BASE_URL: ${{ secrets.OPENROUTER_BASE_URL }}
          OPENROUTER_API_KEY: ${{ secrets.OPENROUTER_API_KEY }}