
Commit 6d53a85

Add prompt-caching examples for AI SDK v5

- Add typescript/ai-sdk-v5/src/prompt-caching/user-message-cache.ts - demonstrates cache_control using providerOptions.openrouter.cacheControl
- Shows critical configuration: extraBody.stream_options.include_usage
- Evidence-based verification via providerMetadata.openrouter.usage

1 parent 314435b · commit 6d53a85

9 files changed (+602, -1 lines)

docs/prompt-caching.md

Lines changed: 5 additions & 0 deletions
```diff
@@ -191,3 +191,8 @@ See ecosystem-specific examples:
   - [user-message-cache.ts](../typescript/fetch/src/prompt-caching/user-message-cache.ts)
   - [multi-message-cache.ts](../typescript/fetch/src/prompt-caching/multi-message-cache.ts)
   - [no-cache-control.ts](../typescript/fetch/src/prompt-caching/no-cache-control.ts) (control)
+
+- **AI SDK v5** (Vercel): [typescript/ai-sdk-v5/src/prompt-caching/](../typescript/ai-sdk-v5/src/prompt-caching/)
+  - [user-message-cache.ts](../typescript/ai-sdk-v5/src/prompt-caching/user-message-cache.ts)
+  - [multi-message-cache.ts](../typescript/ai-sdk-v5/src/prompt-caching/multi-message-cache.ts)
+  - [no-cache-control.ts](../typescript/ai-sdk-v5/src/prompt-caching/no-cache-control.ts) (control)
```

typescript/ai-sdk-v5/README.md

Lines changed: 40 additions & 0 deletions
# AI SDK v5 Examples

Examples using Vercel AI SDK v5 with `@openrouter/ai-sdk-provider`.

## Prerequisites

- Bun runtime: `curl -fsSL https://bun.sh/install | bash`
- `OPENROUTER_API_KEY` environment variable

## Running Examples

```bash
# From the monorepo root (typescript/)
bun examples

# Or from this workspace
cd ai-sdk-v5
bun examples
```

## Features

- [prompt-caching](./src/prompt-caching/) - Anthropic prompt caching with AI SDK v5

### Key Configuration

**CRITICAL**: The AI SDK examples require:

```typescript
extraBody: {
  stream_options: { include_usage: true }
}
```

Without this, usage details (including `cached_tokens`) are not populated in the response.
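
A minimal end-to-end sketch of that setting (the prompt string is illustrative; the model slug and the `providerMetadata` field path follow the examples in this commit):

```typescript
import { createOpenRouter } from '@openrouter/ai-sdk-provider';
import { generateText } from 'ai';

// Provider-level setting: without stream_options.include_usage,
// providerMetadata.openrouter.usage is not populated.
const openrouter = createOpenRouter({
  apiKey: process.env.OPENROUTER_API_KEY,
  extraBody: {
    stream_options: { include_usage: true },
  },
});

const result = await generateText({
  model: openrouter('anthropic/claude-3.5-sonnet'),
  prompt: 'Say hello in one sentence.', // illustrative prompt
});

// Cache reads, if any, are reported under promptTokensDetails.cachedTokens.
const cachedTokens =
  result.providerMetadata?.openrouter?.usage?.promptTokensDetails?.cachedTokens ?? 0;
console.log(`cached_tokens=${cachedTokens}`);
```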
## Dependencies

- `@openrouter-examples/shared` - shared constants (`LARGE_SYSTEM_PROMPT`) and types
- `@openrouter/ai-sdk-provider` - OpenRouter provider for the AI SDK
- `ai` v5.x - Vercel AI SDK

typescript/ai-sdk-v5/package.json

Lines changed: 18 additions & 0 deletions
```json
{
  "name": "@openrouter-examples/ai-sdk-v5",
  "version": "1.0.0",
  "private": true,
  "type": "module",
  "scripts": {
    "examples": "bun run src/prompt-caching/user-message-cache.ts && bun run src/prompt-caching/multi-message-cache.ts && bun run src/prompt-caching/no-cache-control.ts",
    "typecheck": "tsc --noEmit"
  },
  "dependencies": {
    "@openrouter-examples/shared": "workspace:*",
    "@openrouter/ai-sdk-provider": "^1.2.1",
    "ai": "^5.0.92"
  },
  "devDependencies": {
    "@types/bun": "latest"
  }
}
```
Lines changed: 100 additions & 0 deletions
# Anthropic Prompt Caching Examples (AI SDK v5)

This directory contains examples demonstrating Anthropic's prompt caching feature via OpenRouter using Vercel AI SDK v5.

## What is Prompt Caching?

Anthropic's prompt caching allows you to cache large portions of your prompts to:

- **Reduce costs** - cached tokens cost significantly less
- **Improve latency** - cached content is processed faster
- **Enable larger contexts** - use more context without a proportional cost increase

Cache TTL: 5 minutes for ephemeral caches.

## Examples

### User Message Cache (`user-message-cache.ts`)

Cache large context in user messages using the AI SDK:

```bash
bun run typescript/ai-sdk-v5/src/prompt-caching/user-message-cache.ts
```

**Pattern**: user message with `providerOptions.openrouter.cacheControl`

## How to Use with AI SDK

```typescript
import { createOpenRouter } from '@openrouter/ai-sdk-provider';
import { generateText } from 'ai';

// CRITICAL: must include stream_options for usage details
const openrouter = createOpenRouter({
  apiKey: process.env.OPENROUTER_API_KEY,
  extraBody: {
    stream_options: { include_usage: true }, // Required!
  },
});

const result = await generateText({
  model: openrouter('anthropic/claude-3.5-sonnet'),
  messages: [
    {
      role: 'user',
      content: [
        {
          type: 'text',
          text: 'Large context here...',
          providerOptions: {
            openrouter: {
              cacheControl: { type: 'ephemeral' }, // Cache this block
            },
          },
        },
        {
          type: 'text',
          text: 'Your question here',
        },
      ],
    },
  ],
});

// Check cache metrics
const cachedTokens =
  result.providerMetadata?.openrouter?.usage?.promptTokensDetails?.cachedTokens ?? 0;
```

## Important Notes

### Critical Configuration

**MUST include `extraBody: { stream_options: { include_usage: true } }`**

- Without this, usage details (including `cached_tokens`) are not populated
- This is a provider-level configuration, not per-request

### Cache Metrics Location

Cache metrics are in `providerMetadata.openrouter.usage`:

```typescript
{
  promptTokens: number,
  completionTokens: number,
  promptTokensDetails: {
    cachedTokens: number // Number of tokens read from cache
  }
}
```

### Requirements

1. **stream_options.include_usage = true** - CRITICAL for usage details
2. **Minimum 2048+ tokens** - smaller content may not be cached
3. **providerOptions.openrouter.cacheControl** - on content items, not messages (see the sketch after this list)
4. **Exact match** - the cache only hits on identical content
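
A minimal, non-authoritative sketch of point 3: the `cacheControl` option belongs on the individual content part rather than on the message object (variable names here are illustrative):

```typescript
// Correct: providerOptions sits on the text part that should be cached.
const userMessage = {
  role: 'user' as const,
  content: [
    {
      type: 'text' as const,
      text: 'Large reference document goes here...',
      providerOptions: {
        openrouter: {
          cacheControl: { type: 'ephemeral' as const },
        },
      },
    },
    { type: 'text' as const, text: 'Question about the document above.' },
  ],
};

// Incorrect (for contrast): attaching providerOptions to the message object
// itself, instead of the large text part, does not mark that part for caching.
```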
### Expected Behavior

- **First call**: `cachedTokens = 0` (cache miss, creates the cache)
- **Second call**: `cachedTokens > 0` (cache hit, reads from the cache)

## Scientific Method

All examples follow evidence-based verification:

- **Hypothesis**: `providerOptions.openrouter.cacheControl` triggers caching
- **Experiment**: make identical calls twice
- **Evidence**: measure via `providerMetadata.openrouter.usage`
- **Analysis**: compare cache miss vs. cache hit
Lines changed: 137 additions & 0 deletions
```typescript
/**
 * Example: Anthropic Prompt Caching - Multi-Message Conversation (AI SDK v5)
 *
 * This example demonstrates Anthropic prompt caching in a multi-message conversation
 * via OpenRouter using Vercel AI SDK v5.
 *
 * Pattern: user message cache in a multi-turn conversation
 * - Cache large context in the first user message
 * - The cache persists through conversation history
 *
 * To run: bun run typescript/ai-sdk-v5/src/prompt-caching/multi-message-cache.ts
 */

import { LARGE_SYSTEM_PROMPT } from '@openrouter-examples/shared/constants';
import { createOpenRouter } from '@openrouter/ai-sdk-provider';
import { generateText } from 'ai';

const openrouter = createOpenRouter({
  apiKey: process.env.OPENROUTER_API_KEY,
  extraBody: {
    stream_options: { include_usage: true },
  },
});

async function main() {
  console.log('╔════════════════════════════════════════════════════════════════════════════╗');
  console.log('║           Anthropic Prompt Caching - Multi-Message (AI SDK v5)              ║');
  console.log('╚════════════════════════════════════════════════════════════════════════════╝');
  console.log();
  console.log('Testing cache_control in a multi-turn conversation');
  console.log();

  try {
    const testId = Date.now();
    const model = openrouter('anthropic/claude-3.5-sonnet');
    const largeContext = `Test ${testId}: Context:\n\n${LARGE_SYSTEM_PROMPT}`;

    // First call with conversation history
    console.log('First Call (Cache Miss Expected)');
    const result1 = await generateText({
      model,
      messages: [
        {
          role: 'user',
          content: [
            {
              type: 'text',
              text: largeContext,
              providerOptions: {
                openrouter: {
                  cacheControl: { type: 'ephemeral' },
                },
              },
            },
            {
              type: 'text',
              text: "Hello, what's your purpose?",
            },
          ],
        },
        {
          role: 'assistant',
          content: "I'm an AI assistant designed to help with various tasks.",
        },
        {
          role: 'user',
          content: 'What programming languages do you know?',
        },
      ],
    });

    const cached1 = result1.providerMetadata?.openrouter?.usage?.promptTokensDetails?.cachedTokens ?? 0;
    console.log(`  Response: ${result1.text.substring(0, 80)}...`);
    console.log(`  cached_tokens=${cached1}`);

    await new Promise((resolve) => setTimeout(resolve, 1000));

    // Second identical call - should hit the cache
    console.log('\nSecond Call (Cache Hit Expected)');
    const result2 = await generateText({
      model,
      messages: [
        {
          role: 'user',
          content: [
            {
              type: 'text',
              text: largeContext,
              providerOptions: {
                openrouter: {
                  cacheControl: { type: 'ephemeral' },
                },
              },
            },
            {
              type: 'text',
              text: "Hello, what's your purpose?",
            },
          ],
        },
        {
          role: 'assistant',
          content: "I'm an AI assistant designed to help with various tasks.",
        },
        {
          role: 'user',
          content: 'What programming languages do you know?',
        },
      ],
    });

    const cached2 = result2.providerMetadata?.openrouter?.usage?.promptTokensDetails?.cachedTokens ?? 0;
    console.log(`  Response: ${result2.text.substring(0, 80)}...`);
    console.log(`  cached_tokens=${cached2}`);

    // Analysis
    console.log('\n' + '='.repeat(80));
    console.log('ANALYSIS');
    console.log('='.repeat(80));
    console.log(`First call:  cached_tokens=${cached1} (expected: 0)`);
    console.log(`Second call: cached_tokens=${cached2} (expected: >0)`);

    const success = cached1 === 0 && cached2 > 0;
    console.log(`\nResult: ${success ? '✓ CACHE WORKING' : '✗ CACHE NOT WORKING'}`);

    if (success) {
      console.log('\n✓ SUCCESS - Multi-message caching is working correctly');
    } else {
      console.log('\n✗ FAILURE - Multi-message caching is not working as expected');
    }
  } catch (error) {
    console.error('\n❌ ERROR:', error);
    process.exit(1);
  }
}

main();
```
