Skip to content

Commit b129d36

Browse files
feat: add includeRawChunks support for streaming (#360)
* feat: add includeRawChunks support for streaming When includeRawChunks: true is passed to streaming calls, the provider now emits { type: 'raw', rawValue: <parsed chunk> } stream parts for each SSE event, giving consumers access to the raw provider chunks alongside the processed AI SDK stream parts. This feature is available for both chat and completion models. Closes #340 Co-Authored-By: Robert Yeakel <robert.yeakel@openrouter.ai> * test: add test for raw chunk emission on failed parse Documents the intentional behavior that raw chunks are emitted before validation, which is useful for debugging malformed responses. This matches the Vercel AI SDK reference implementation pattern. Co-Authored-By: Robert Yeakel <robert.yeakel@openrouter.ai> --------- Co-authored-by: Devin AI <158243242+devin-ai-integration[bot]@users.noreply.github.com>
1 parent f2d5034 commit b129d36

File tree

5 files changed

+266
-0
lines changed

5 files changed

+266
-0
lines changed

.changeset/include-raw-chunks.md

Lines changed: 9 additions & 0 deletions
Original file line number · Diff line number · Diff line change
@@ -0,0 +1,9 @@
1+
---
2+
"@openrouter/ai-sdk-provider": minor
3+
---
4+
5+
Add includeRawChunks support for streaming
6+
7+
When `includeRawChunks: true` is passed to streaming calls, the provider now emits `{ type: 'raw', rawValue: <parsed chunk> }` stream parts for each SSE event, giving consumers access to the raw provider chunks alongside the processed AI SDK stream parts.
8+
9+
This feature is available for both chat and completion models.

src/chat/index.test.ts

Lines changed: 124 additions & 0 deletions
Original file line number · Diff line number · Diff line change
@@ -2340,3 +2340,127 @@ describe('debug settings', () => {
23402340
expect(requestBody).not.toHaveProperty('debug');
23412341
});
23422342
});
2343+
2344+
describe('includeRawChunks', () => {
2345+
const server = createTestServer({
2346+
'https://openrouter.ai/api/v1/chat/completions': {
2347+
response: { type: 'json-value', body: {} },
2348+
},
2349+
});
2350+
2351+
beforeAll(() => server.server.start());
2352+
afterEach(() => server.server.reset());
2353+
afterAll(() => server.server.stop());
2354+
2355+
function prepareStreamResponse({ content }: { content: string[] }) {
2356+
server.urls['https://openrouter.ai/api/v1/chat/completions']!.response = {
2357+
type: 'stream-chunks',
2358+
chunks: [
2359+
`data: {"id":"chatcmpl-test","object":"chat.completion.chunk","created":1702657020,"model":"gpt-3.5-turbo-0613","choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null}]}\n\n`,
2360+
...content.map(
2361+
(text) =>
2362+
`data: {"id":"chatcmpl-test","object":"chat.completion.chunk","created":1702657020,"model":"gpt-3.5-turbo-0613","choices":[{"index":0,"delta":{"content":"${text}"},"finish_reason":null}]}\n\n`,
2363+
),
2364+
`data: {"id":"chatcmpl-test","object":"chat.completion.chunk","created":1702657020,"model":"gpt-3.5-turbo-0613","choices":[{"index":0,"delta":{},"finish_reason":"stop"}]}\n\n`,
2365+
`data: {"id":"chatcmpl-test","object":"chat.completion.chunk","created":1702657020,"model":"gpt-3.5-turbo-0613","choices":[],"usage":{"prompt_tokens":10,"completion_tokens":5,"total_tokens":15}}\n\n`,
2366+
'data: [DONE]\n\n',
2367+
],
2368+
};
2369+
}
2370+
2371+
it('should emit raw chunks when includeRawChunks is true', async () => {
2372+
prepareStreamResponse({ content: ['Hello'] });
2373+
2374+
const { stream } = await model.doStream({
2375+
prompt: TEST_PROMPT,
2376+
includeRawChunks: true,
2377+
});
2378+
2379+
const elements = await convertReadableStreamToArray(stream);
2380+
const rawChunks = elements.filter(
2381+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
2382+
chunk.type === 'raw',
2383+
);
2384+
2385+
expect(rawChunks.length).toBeGreaterThan(0);
2386+
expect(rawChunks[0]).toHaveProperty('rawValue');
2387+
expect(rawChunks[0]!.rawValue).toHaveProperty('id', 'chatcmpl-test');
2388+
});
2389+
2390+
it('should not emit raw chunks when includeRawChunks is false', async () => {
2391+
prepareStreamResponse({ content: ['Hello'] });
2392+
2393+
const { stream } = await model.doStream({
2394+
prompt: TEST_PROMPT,
2395+
includeRawChunks: false,
2396+
});
2397+
2398+
const elements = await convertReadableStreamToArray(stream);
2399+
const rawChunks = elements.filter(
2400+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
2401+
chunk.type === 'raw',
2402+
);
2403+
2404+
expect(rawChunks.length).toBe(0);
2405+
});
2406+
2407+
it('should not emit raw chunks when includeRawChunks is not specified', async () => {
2408+
prepareStreamResponse({ content: ['Hello'] });
2409+
2410+
const { stream } = await model.doStream({
2411+
prompt: TEST_PROMPT,
2412+
});
2413+
2414+
const elements = await convertReadableStreamToArray(stream);
2415+
const rawChunks = elements.filter(
2416+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
2417+
chunk.type === 'raw',
2418+
);
2419+
2420+
expect(rawChunks.length).toBe(0);
2421+
});
2422+
2423+
it('should emit raw chunks for each SSE event including usage chunk', async () => {
2424+
prepareStreamResponse({ content: ['Hello', ' World'] });
2425+
2426+
const { stream } = await model.doStream({
2427+
prompt: TEST_PROMPT,
2428+
includeRawChunks: true,
2429+
});
2430+
2431+
const elements = await convertReadableStreamToArray(stream);
2432+
const rawChunks = elements.filter(
2433+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
2434+
chunk.type === 'raw',
2435+
);
2436+
2437+
// Should have raw chunks for: initial, Hello, World, finish_reason, usage
2438+
expect(rawChunks.length).toBe(5);
2439+
});
2440+
2441+
it('should emit raw chunk even when parsing fails (for debugging malformed responses)', async () => {
2442+
server.urls['https://openrouter.ai/api/v1/chat/completions']!.response = {
2443+
type: 'stream-chunks',
2444+
chunks: ['data: {unparsable}\n\n', 'data: [DONE]\n\n'],
2445+
};
2446+
2447+
const { stream } = await model.doStream({
2448+
prompt: TEST_PROMPT,
2449+
includeRawChunks: true,
2450+
});
2451+
2452+
const elements = await convertReadableStreamToArray(stream);
2453+
const rawChunks = elements.filter(
2454+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
2455+
chunk.type === 'raw',
2456+
);
2457+
const errorChunks = elements.filter(
2458+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'error' }> =>
2459+
chunk.type === 'error',
2460+
);
2461+
2462+
// Raw chunk is emitted before error handling, useful for debugging
2463+
expect(rawChunks.length).toBe(1);
2464+
expect(errorChunks.length).toBe(1);
2465+
});
2466+
});

src/chat/index.ts

Lines changed: 5 additions & 0 deletions
Original file line number · Diff line number · Diff line change
@@ -628,6 +628,11 @@ export class OpenRouterChatLanguageModel implements LanguageModelV3 {
628628
LanguageModelV3StreamPart
629629
>({
630630
transform(chunk, controller) {
631+
// Emit raw chunk if requested (before anything else)
632+
if (options.includeRawChunks) {
633+
controller.enqueue({ type: 'raw', rawValue: chunk.rawValue });
634+
}
635+
631636
// handle failed chunk parsing / validation:
632637
if (!chunk.success) {
633638
finishReason = createFinishReason('error');

src/completion/index.test.ts

Lines changed: 123 additions & 0 deletions
Original file line number · Diff line number · Diff line change
@@ -610,3 +610,126 @@ describe('doStream', () => {
610610
);
611611
});
612612
});
613+
614+
describe('includeRawChunks', () => {
615+
const server = createTestServer({
616+
'https://openrouter.ai/api/v1/completions': {
617+
response: { type: 'stream-chunks', chunks: [] },
618+
},
619+
});
620+
621+
beforeAll(() => server.server.start());
622+
afterEach(() => server.server.reset());
623+
afterAll(() => server.server.stop());
624+
625+
function prepareStreamResponse({ content }: { content: string[] }) {
626+
server.urls['https://openrouter.ai/api/v1/completions']!.response = {
627+
type: 'stream-chunks',
628+
chunks: [
629+
...content.map(
630+
(text) =>
631+
`data: {"id":"cmpl-test","object":"text_completion","created":1711363440,"choices":[{"text":"${text}","index":0,"logprobs":null,"finish_reason":null}],"model":"openai/gpt-3.5-turbo-instruct"}\n\n`,
632+
),
633+
`data: {"id":"cmpl-test","object":"text_completion","created":1711363310,"choices":[{"text":"","index":0,"logprobs":null,"finish_reason":"stop"}],"model":"openai/gpt-3.5-turbo-instruct"}\n\n`,
634+
`data: {"id":"cmpl-test","object":"text_completion","created":1711363310,"model":"openai/gpt-3.5-turbo-instruct","usage":{"prompt_tokens":10,"completion_tokens":5,"total_tokens":15},"choices":[]}\n\n`,
635+
'data: [DONE]\n\n',
636+
],
637+
};
638+
}
639+
640+
it('should emit raw chunks when includeRawChunks is true', async () => {
641+
prepareStreamResponse({ content: ['Hello'] });
642+
643+
const { stream } = await model.doStream({
644+
prompt: TEST_PROMPT,
645+
includeRawChunks: true,
646+
});
647+
648+
const elements = await convertReadableStreamToArray(stream);
649+
const rawChunks = elements.filter(
650+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
651+
chunk.type === 'raw',
652+
);
653+
654+
expect(rawChunks.length).toBeGreaterThan(0);
655+
expect(rawChunks[0]).toHaveProperty('rawValue');
656+
expect(rawChunks[0]!.rawValue).toHaveProperty('id', 'cmpl-test');
657+
});
658+
659+
it('should not emit raw chunks when includeRawChunks is false', async () => {
660+
prepareStreamResponse({ content: ['Hello'] });
661+
662+
const { stream } = await model.doStream({
663+
prompt: TEST_PROMPT,
664+
includeRawChunks: false,
665+
});
666+
667+
const elements = await convertReadableStreamToArray(stream);
668+
const rawChunks = elements.filter(
669+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
670+
chunk.type === 'raw',
671+
);
672+
673+
expect(rawChunks.length).toBe(0);
674+
});
675+
676+
it('should not emit raw chunks when includeRawChunks is not specified', async () => {
677+
prepareStreamResponse({ content: ['Hello'] });
678+
679+
const { stream } = await model.doStream({
680+
prompt: TEST_PROMPT,
681+
});
682+
683+
const elements = await convertReadableStreamToArray(stream);
684+
const rawChunks = elements.filter(
685+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
686+
chunk.type === 'raw',
687+
);
688+
689+
expect(rawChunks.length).toBe(0);
690+
});
691+
692+
it('should emit raw chunks for each SSE event including usage chunk', async () => {
693+
prepareStreamResponse({ content: ['Hello', ' World'] });
694+
695+
const { stream } = await model.doStream({
696+
prompt: TEST_PROMPT,
697+
includeRawChunks: true,
698+
});
699+
700+
const elements = await convertReadableStreamToArray(stream);
701+
const rawChunks = elements.filter(
702+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
703+
chunk.type === 'raw',
704+
);
705+
706+
// Should have raw chunks for: Hello, World, finish_reason, usage
707+
expect(rawChunks.length).toBe(4);
708+
});
709+
710+
it('should emit raw chunk even when parsing fails (for debugging malformed responses)', async () => {
711+
server.urls['https://openrouter.ai/api/v1/completions']!.response = {
712+
type: 'stream-chunks',
713+
chunks: ['data: {unparsable}\n\n', 'data: [DONE]\n\n'],
714+
};
715+
716+
const { stream } = await model.doStream({
717+
prompt: TEST_PROMPT,
718+
includeRawChunks: true,
719+
});
720+
721+
const elements = await convertReadableStreamToArray(stream);
722+
const rawChunks = elements.filter(
723+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'raw' }> =>
724+
chunk.type === 'raw',
725+
);
726+
const errorChunks = elements.filter(
727+
(chunk): chunk is Extract<LanguageModelV3StreamPart, { type: 'error' }> =>
728+
chunk.type === 'error',
729+
);
730+
731+
// Raw chunk is emitted before error handling, useful for debugging
732+
expect(rawChunks.length).toBe(1);
733+
expect(errorChunks.length).toBe(1);
734+
});
735+
});

src/completion/index.ts

Lines changed: 5 additions & 0 deletions
Original file line number · Diff line number · Diff line change
@@ -288,6 +288,11 @@ export class OpenRouterCompletionLanguageModel implements LanguageModelV3 {
288288
LanguageModelV3StreamPart
289289
>({
290290
transform(chunk, controller) {
291+
// Emit raw chunk if requested (before anything else)
292+
if (options.includeRawChunks) {
293+
controller.enqueue({ type: 'raw', rawValue: chunk.rawValue });
294+
}
295+
291296
// handle failed chunk parsing / validation:
292297
if (!chunk.success) {
293298
finishReason = createFinishReason('error');

0 commit comments

Comments (0)