Skip to content

Commit a462877

Browse files
authored
[evals] adding grok 4 with ai sdk (#890)
# why
Benchmarking SOTA models on Stagehand.

# what changed
Added xAI to the evals list.

# test plan
1 parent e43c9fe commit a462877

File tree

1 file changed

+5
-0
lines changed

1 file changed

+5
-0
lines changed

evals/index.eval.ts

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -39,6 +39,7 @@ import { groq } from "@ai-sdk/groq";
3939
import { cerebras } from "@ai-sdk/cerebras";
4040
import { openai } from "@ai-sdk/openai";
4141
import { AISdkClient } from "@/examples/external_clients/aisdk";
42+
import { xai } from "@ai-sdk/xai";
4243
dotenv.config();
4344

4445
/**
@@ -350,6 +351,10 @@ const generateFilteredTestcases = (): Testcase[] => {
350351
),
351352
),
352353
});
354+
} else if (input.modelName.startsWith("grok")) {
355+
llmClient = new AISdkClient({
356+
model: wrapAISDKModel(xai(input.modelName)),
357+
});
353358
} else if (input.modelName.includes("/")) {
354359
llmClient = new CustomOpenAIClient({
355360
modelName: input.modelName as AvailableModel,

0 commit comments

Comments
 (0)