Skip to content

Commit f6dd98b

Browse files
committed
Fix uv
1 parent f28283c commit f6dd98b

File tree

5 files changed

+69
-64
lines changed

5 files changed

+69
-64
lines changed

.github/workflows/evaluate.yaml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -128,6 +128,7 @@ jobs:
128128
enable-cache: true
129129
version: "0.4.20"
130130
cache-dependency-glob: "requirements**.txt"
131+
python-version: "3.12"
131132

132133
- name: Setup node
133134
uses: actions/setup-node@v4

evals/results/baseline/config.json

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,7 @@
11
{
22
"testdata_path": "ground_truth.jsonl",
3-
"results_dir": "results/experiment<TIMESTAMP>",
4-
"requested_metrics": ["gpt_groundedness", "gpt_relevance", "answer_length", "latency", "citations_matched"],
3+
"results_dir": "results/gpt-4o-mini",
4+
"requested_metrics": ["gpt_groundedness", "gpt_relevance", "answer_length", "latency", "citations_matched", "any_citation"],
55
"target_url": "http://localhost:50505/chat",
66
"target_parameters": {
77
"overrides": {

0 commit comments

Comments
 (0)