# agent-evals.yaml
# Agent Evals workflow: installs dependencies and runs `npm run test` inside
# scripts/agent-evals, either on demand or on a fixed schedule.
name: Agent Evals

on:
  # Allows the workflow to be started manually.
  workflow_dispatch:
  schedule:
    # Run every 6 hours
    - cron: "0 */6 * * *"

# The workflow token only gets read access to repository contents.
permissions:
  contents: read

# Runs are grouped per ref; a newly started run cancels the one in progress
# for the same ref.
concurrency:
  group: agent-evals-${{ github.ref }}
  cancel-in-progress: true

env:
  # Quoted so the value is unambiguously the string "true".
  CI: "true"

jobs:
  test:
    runs-on: ubuntu-latest
    strategy:
      matrix:
        # Quoted so the version is a string, not a number.
        node-version:
          - "20"
    env:
      # Taken from repository secrets and exposed to every step of this job.
      GEMINI_API_KEY: ${{ secrets.GEMINI_API_KEY }}
    steps:
      - uses: actions/checkout@v4
      - uses: actions/setup-node@v4
        with:
          node-version: ${{ matrix.node-version }}
          # Cache npm downloads, keyed on the root shrinkwrap file.
          cache: npm
          cache-dependency-path: npm-shrinkwrap.json
      # Pin the npm CLI version used for the installs below.
      - run: npm i -g npm@9.5
      - run: npm install -g @google/gemini-cli
      # Install root dependencies, then the eval package's own dependencies.
      - run: npm ci
      - run: npm install
        working-directory: scripts/agent-evals
      - name: "Run agent-evals tests"
        run: npm run test
        working-directory: scripts/agent-evals