
Commit c80d906

Backport: fix(provider/xai): handle inconsistent cached token reporting (#12518)
## background

backport of #12485 to `release-v5.0`.

xAI's token reporting is inconsistent across models. most models report `prompt_tokens`/`input_tokens` inclusive of cached tokens (like OpenAI), but some models (e.g. `grok-4-1-fast-non-reasoning`) report them exclusive of cached tokens, so `cached_tokens > prompt_tokens`.

## summary

- add `convertXaiChatUsage` and `convertXaiResponsesUsage` converter functions
- detect which reporting style xAI is using based on whether `cached_tokens <= prompt_tokens` (see the sketch below)
  - when inclusive (normal): use prompt tokens as-is
  - when exclusive (anomalous): add cached tokens to prompt tokens to get total input tokens
- applies to both the chat completions and responses APIs
- adapted for the v5 `LanguageModelV2Usage` flat format (vs the v6 structured format)

## verification

<details>
<summary>tests</summary>

```
✓ src/convert-xai-chat-usage.test.ts (6 tests) 6ms
✓ src/responses/convert-xai-responses-usage.test.ts (6 tests) 6ms

Test Files  2 passed (2)
     Tests  12 passed (12)
```

</details>

## checklist

- [x] tests have been added / updated (for bug fixes / features)
- [ ] documentation has been added / updated (for bug fixes / features)
- [x] a _patch_ changeset for relevant packages has been added (run `pnpm changeset` in root)
- [x] i have reviewed this pull request (self-review)

## related issues

backport of #12485

---------

Co-authored-by: josh <josh@afterima.ge>
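A minimal sketch of the detection heuristic described above (the helper name is illustrative only; the actual logic lives in `convertXaiChatUsage` / `convertXaiResponsesUsage` in the diff below):

```ts
// Illustrative sketch, not part of the change itself.
//
// inclusive reporting (most models, OpenAI-style): prompt_tokens already
// contains cached tokens, e.g. prompt_tokens=200, cached_tokens=150 -> 200.
// exclusive reporting (e.g. grok-4-1-fast-non-reasoning): cached tokens are
// on top, e.g. prompt_tokens=4142, cached_tokens=4328 -> 4142 + 4328 = 8470.
function normalizeInputTokens(promptTokens: number, cachedTokens: number): number {
  const promptIncludesCached = cachedTokens <= promptTokens;
  return promptIncludesCached ? promptTokens : promptTokens + cachedTokens;
}
```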
1 parent ca7f69e commit c80d906

11 files changed: +440 −44 lines changed

.changeset/stupid-bags-crash.md

Lines changed: 5 additions & 0 deletions
@@ -0,0 +1,5 @@
---
'@ai-sdk/xai': patch
---

fix(provider/xai): handle inconsistent cached token reporting
Lines changed: 44 additions & 0 deletions
@@ -0,0 +1,44 @@
import { xai } from '@ai-sdk/xai';
import { generateText } from 'ai';
import { run } from '../lib/run';

const models = [
  'grok-4',
  'grok-4-1-fast-reasoning',
  'grok-4-1-fast-non-reasoning',
  'grok-4-fast-reasoning',
  'grok-4-fast-non-reasoning',
  'grok-code-fast-1',
  'grok-3',
  'grok-3-fast',
  'grok-3-mini',
  'grok-3-mini-fast',
];

run(async () => {
  for (const modelId of models) {
    try {
      const result = await generateText({
        model: xai.responses(modelId),
        prompt: 'Say a single word.',
      });

      const body = result.response.body as Record<string, any>;
      const raw = body.usage;
      const sdk = result.usage;

      console.log(`--- ${modelId} ---`);
      console.log(
        `raw: output_tokens=${raw.output_tokens}, reasoning_tokens=${raw.output_tokens_details?.reasoning_tokens ?? 0}, total_tokens=${raw.total_tokens}`,
      );
      console.log(
        `sdk: outputTokens=${sdk.outputTokens}, reasoningTokens=${sdk.reasoningTokens}, cachedInputTokens=${sdk.cachedInputTokens}, totalTokens=${sdk.totalTokens}`,
      );
      console.log();
    } catch (e: any) {
      console.log(`--- ${modelId} ---`);
      console.log(`error: ${e.message?.slice(0, 80)}`);
      console.log();
    }
  }
});
Lines changed: 16 additions & 0 deletions
@@ -0,0 +1,16 @@
import { xai } from '@ai-sdk/xai';
import { generateText } from 'ai';
import { run } from '../lib/run';

run(async () => {
  const result = await generateText({
    model: xai.responses('grok-4-1-fast-non-reasoning'),
    prompt: 'Say a single word.',
  });

  console.log('text:', result.text);
  console.log();
  console.log('raw usage:', JSON.stringify(result.response.body, null, 2));
  console.log();
  console.log('sdk usage:', JSON.stringify(result.usage, null, 2));
});
Lines changed: 43 additions & 0 deletions
@@ -0,0 +1,43 @@
import { xai } from '@ai-sdk/xai';
import { streamText } from 'ai';
import { run } from '../lib/run';

const models = [
  'grok-4',
  'grok-4-1-fast-reasoning',
  'grok-4-1-fast-non-reasoning',
  'grok-4-fast-reasoning',
  'grok-4-fast-non-reasoning',
  'grok-code-fast-1',
  'grok-3',
  'grok-3-fast',
  'grok-3-mini',
  'grok-3-mini-fast',
];

run(async () => {
  for (const modelId of models) {
    try {
      const result = streamText({
        model: xai.responses(modelId),
        prompt: 'Say a single word.',
      });

      for await (const textPart of result.textStream) {
        void textPart;
      }

      const sdk = await result.usage;

      console.log(`--- ${modelId} ---`);
      console.log(
        `sdk: outputTokens=${sdk.outputTokens}, reasoningTokens=${sdk.reasoningTokens}, cachedInputTokens=${sdk.cachedInputTokens}, totalTokens=${sdk.totalTokens}`,
      );
      console.log();
    } catch (e: any) {
      console.log(`--- ${modelId} ---`);
      console.log(`error: ${e.message?.slice(0, 80)}`);
      console.log();
    }
  }
});
Lines changed: 18 additions & 0 deletions
@@ -0,0 +1,18 @@
import { xai } from '@ai-sdk/xai';
import { streamText } from 'ai';
import { run } from '../lib/run';

run(async () => {
  const result = streamText({
    model: xai.responses('grok-3-mini'),
    prompt: 'Say a single word.',
  });

  for await (const textPart of result.textStream) {
    process.stdout.write(textPart);
  }

  console.log();
  console.log();
  console.log('sdk usage:', JSON.stringify(await result.usage, null, 2));
});
Lines changed: 119 additions & 0 deletions
@@ -0,0 +1,119 @@
import { convertXaiChatUsage } from './convert-xai-chat-usage';
import { describe, it, expect } from 'vitest';

describe('convertXaiChatUsage', () => {
  it('should convert basic usage without caching or reasoning', () => {
    const result = convertXaiChatUsage({
      prompt_tokens: 100,
      completion_tokens: 50,
      total_tokens: 150,
    });

    expect(result).toMatchInlineSnapshot(`
      {
        "cachedInputTokens": undefined,
        "inputTokens": 100,
        "outputTokens": 50,
        "reasoningTokens": undefined,
        "totalTokens": 150,
      }
    `);
  });

  it('should convert usage with cached tokens (inclusive reporting)', () => {
    const result = convertXaiChatUsage({
      prompt_tokens: 200,
      completion_tokens: 50,
      total_tokens: 250,
      prompt_tokens_details: {
        cached_tokens: 150,
      },
    });

    expect(result).toMatchInlineSnapshot(`
      {
        "cachedInputTokens": 150,
        "inputTokens": 200,
        "outputTokens": 50,
        "reasoningTokens": undefined,
        "totalTokens": 250,
      }
    `);
  });

  it('should convert usage with reasoning tokens', () => {
    const result = convertXaiChatUsage({
      prompt_tokens: 100,
      completion_tokens: 254,
      total_tokens: 734,
      completion_tokens_details: {
        reasoning_tokens: 380,
      },
    });

    expect(result).toMatchInlineSnapshot(`
      {
        "cachedInputTokens": undefined,
        "inputTokens": 100,
        "outputTokens": 634,
        "reasoningTokens": 380,
        "totalTokens": 734,
      }
    `);
  });

  it('should handle cached_tokens exceeding prompt_tokens (non-inclusive reporting)', () => {
    const result = convertXaiChatUsage({
      prompt_tokens: 4142,
      completion_tokens: 254,
      total_tokens: 8724,
      prompt_tokens_details: {
        cached_tokens: 4328,
      },
    });

    expect(result).toMatchInlineSnapshot(`
      {
        "cachedInputTokens": 4328,
        "inputTokens": 8470,
        "outputTokens": 254,
        "reasoningTokens": undefined,
        "totalTokens": 8724,
      }
    `);
  });

  it('should handle undefined usage', () => {
    const result = convertXaiChatUsage(undefined);

    expect(result).toMatchInlineSnapshot(`
      {
        "cachedInputTokens": undefined,
        "inputTokens": undefined,
        "outputTokens": undefined,
        "reasoningTokens": undefined,
        "totalTokens": undefined,
      }
    `);
  });

  it('should handle null token details', () => {
    const result = convertXaiChatUsage({
      prompt_tokens: 100,
      completion_tokens: 50,
      total_tokens: 150,
      prompt_tokens_details: null,
      completion_tokens_details: null,
    });

    expect(result).toMatchInlineSnapshot(`
      {
        "cachedInputTokens": undefined,
        "inputTokens": 100,
        "outputTokens": 50,
        "reasoningTokens": undefined,
        "totalTokens": 150,
      }
    `);
  });
});
Lines changed: 43 additions & 0 deletions
@@ -0,0 +1,43 @@
import { LanguageModelV2Usage } from '@ai-sdk/provider';

export type XaiChatUsage = {
  prompt_tokens: number;
  completion_tokens: number;
  total_tokens: number;
  prompt_tokens_details?: {
    cached_tokens?: number | null;
  } | null;
  completion_tokens_details?: {
    reasoning_tokens?: number | null;
  } | null;
};

export function convertXaiChatUsage(
  usage: XaiChatUsage | undefined | null,
): LanguageModelV2Usage {
  if (usage == null) {
    return {
      inputTokens: undefined,
      outputTokens: undefined,
      totalTokens: undefined,
      reasoningTokens: undefined,
      cachedInputTokens: undefined,
    };
  }

  const cacheReadTokens = usage.prompt_tokens_details?.cached_tokens ?? 0;
  const reasoningTokens =
    usage.completion_tokens_details?.reasoning_tokens ?? 0;

  const promptTokensIncludesCached = cacheReadTokens <= usage.prompt_tokens;

  return {
    inputTokens: promptTokensIncludesCached
      ? usage.prompt_tokens
      : usage.prompt_tokens + cacheReadTokens,
    outputTokens: usage.completion_tokens + reasoningTokens,
    totalTokens: usage.total_tokens,
    reasoningTokens: reasoningTokens || undefined,
    cachedInputTokens: cacheReadTokens || undefined,
  };
}
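For reference, a worked example of how the converter above normalizes the anomalous exclusive-reporting case (the numbers are taken from the "cached_tokens exceeding prompt_tokens" test in this commit):

```ts
import { convertXaiChatUsage } from './convert-xai-chat-usage';

// Exclusive reporting: cached_tokens (4328) > prompt_tokens (4142),
// so the converter adds them to get the total input tokens.
const usage = convertXaiChatUsage({
  prompt_tokens: 4142,
  completion_tokens: 254,
  total_tokens: 8724,
  prompt_tokens_details: { cached_tokens: 4328 },
});
// => {
//   inputTokens: 8470,        // 4142 + 4328
//   outputTokens: 254,
//   totalTokens: 8724,
//   reasoningTokens: undefined,
//   cachedInputTokens: 4328,
// }
```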
