We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 55ef435 commit 7b4b030 (Copy full SHA for 7b4b030)
evals/tasks/agent/kith.ts
@@ -17,7 +17,7 @@ export const kith: EvalFunction = async ({
17
await agent.execute({
18
instruction:
19
"add the shoes to cart, go to checkout, and fill the shipping information",
20
- maxSteps: 30,
+ maxSteps: 15,
21
});
22
23
const { evaluation, reasoning } = await evaluator.evaluate({
@@ -29,7 +29,7 @@ export const kith: EvalFunction = async ({
29
if (success) {
30
31
instruction: "fill the payment information",
32
+ maxSteps: 10,
33
34
35
const { evaluation: evaluation2, reasoning: reasoning2 } =
0 commit comments