Commit bc13428
Add prompt-caching examples for Effect AI
- Add typescript/effect-ai/src/prompt-caching/user-message-cache.ts
- Demonstrates cache_control using options.openrouter.cacheControl in Prompt
- Shows Effect.gen pattern with Layer-based dependency injection
- Critical configuration: stream_options.include_usage in model config layer
- Evidence-based verification via response.usage.cachedInputTokens
1 parent 6d53a85 commit bc13428

9 files changed: +559, -1 lines changed

docs/prompt-caching.md (5 additions, 0 deletions)

```diff
@@ -196,3 +196,8 @@ See ecosystem-specific examples:
   - [user-message-cache.ts](../typescript/ai-sdk-v5/src/prompt-caching/user-message-cache.ts)
   - [multi-message-cache.ts](../typescript/ai-sdk-v5/src/prompt-caching/multi-message-cache.ts)
   - [no-cache-control.ts](../typescript/ai-sdk-v5/src/prompt-caching/no-cache-control.ts) (control)
+
+- **Effect AI** (@effect/ai): [typescript/effect-ai/src/prompt-caching/](../typescript/effect-ai/src/prompt-caching/)
+  - [user-message-cache.ts](../typescript/effect-ai/src/prompt-caching/user-message-cache.ts)
+  - [multi-message-cache.ts](../typescript/effect-ai/src/prompt-caching/multi-message-cache.ts)
+  - [no-cache-control.ts](../typescript/effect-ai/src/prompt-caching/no-cache-control.ts) (control)
```

typescript/effect-ai/README.md (new file, 48 additions)
# Effect-TS AI Examples

Examples using Effect-TS with @effect/ai and @effect/ai-openrouter for type-safe, composable AI operations.

## Prerequisites

- Bun runtime: `curl -fsSL https://bun.sh/install | bash`
- `OPENROUTER_API_KEY` environment variable

## Running Examples

```bash
# From monorepo root (typescript/)
bun examples

# Or from this workspace
cd effect-ai
bun examples
```

## Features

- [prompt-caching/](./src/prompt-caching/) - Anthropic caching with Effect patterns

### Key Configuration

**CRITICAL**: The Effect AI examples require:

```typescript
config: {
  stream_options: { include_usage: true }
}
```

Without this, `usage.cachedInputTokens` will be undefined in the response.
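
As context, here is a minimal sketch of where that config lives, mirroring the layer setup used by the examples in `src/prompt-caching/` (model name and env-var handling as in those files):

```typescript
import * as OpenRouterClient from '@effect/ai-openrouter/OpenRouterClient';
import * as OpenRouterLanguageModel from '@effect/ai-openrouter/OpenRouterLanguageModel';
import { FetchHttpClient } from '@effect/platform';
import { Layer, Redacted } from 'effect';

// Client layer: API key plus an HTTP client implementation.
const OpenRouterClientLayer = OpenRouterClient.layer({
  apiKey: Redacted.make(process.env.OPENROUTER_API_KEY!),
}).pipe(Layer.provide(FetchHttpClient.layer));

// Model layer: stream_options.include_usage is the critical flag;
// without it, response.usage.cachedInputTokens comes back undefined.
const OpenRouterModelLayer = OpenRouterLanguageModel.layer({
  model: 'anthropic/claude-3.5-sonnet',
  config: {
    stream_options: { include_usage: true },
  },
}).pipe(Layer.provide(OpenRouterClientLayer));
```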

### Effect Patterns Demonstrated

- `Effect.gen` for generator-based composition
- Layer-based dependency injection
- Type-safe error handling
- Evidence-based validation
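
A minimal sketch tying these patterns together, continuing from the layer setup above (passing a plain string as the prompt is an assumption here; the example files build structured prompts with `Prompt.make`):

```typescript
import * as LanguageModel from '@effect/ai/LanguageModel';
import { Console, Effect } from 'effect';

// Effect.gen sequences effects with yield*; failures stay typed
// inside the Effect until explicitly handled.
const program = Effect.gen(function* () {
  const response = yield* LanguageModel.generateText({ prompt: 'Say hello' });
  yield* Console.log(response.text);
});

// Layers supply the LanguageModel dependency; catchAll handles errors
// without throwing. OpenRouterModelLayer is the layer defined above.
await program.pipe(
  Effect.catchAll((error) => Console.error(`Request failed: ${String(error)}`)),
  Effect.provide(OpenRouterModelLayer),
  Effect.runPromise,
);
```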

## Dependencies

- `@openrouter-examples/shared` - Shared constants (LARGE_SYSTEM_PROMPT) and types
- `@effect/ai` - Effect AI abstractions
- `@effect/ai-openrouter` - OpenRouter provider for Effect AI
- `effect` - Effect-TS core library

typescript/effect-ai/package.json (new file, 21 additions)
```json
{
  "name": "@openrouter-examples/effect-ai",
  "version": "1.0.0",
  "private": true,
  "type": "module",
  "scripts": {
    "examples": "bun run src/prompt-caching/user-message-cache.ts && bun run src/prompt-caching/multi-message-cache.ts && bun run src/prompt-caching/no-cache-control.ts",
    "typecheck": "tsc --noEmit"
  },
  "dependencies": {
    "@openrouter-examples/shared": "workspace:*",
    "@effect/ai": "^0.32.1",
    "@effect/ai-openrouter": "^0.6.0",
    "@effect/platform": "^0.93.0",
    "@effect/platform-bun": "^0.83.0",
    "effect": "^3.19.3"
  },
  "devDependencies": {
    "@types/bun": "latest"
  }
}
```
typescript/effect-ai/src/prompt-caching/README.md (new file, 121 additions)
# Anthropic Prompt Caching Examples (Effect AI)

This directory contains examples demonstrating Anthropic's prompt caching feature via OpenRouter, using @effect/ai and @effect/ai-openrouter.

## What is Prompt Caching?

Anthropic's prompt caching allows you to cache large portions of your prompts to:

- **Reduce costs** - Cached tokens cost significantly less
- **Improve latency** - Cached content is processed faster
- **Enable larger contexts** - Use more context without proportional cost increases

Cache TTL: 5 minutes for ephemeral caches.

## Examples

### User Message Cache (`user-message-cache.ts`)

Cache large context in user messages using Effect AI:

```bash
bun run typescript/effect-ai/src/prompt-caching/user-message-cache.ts
```

**Pattern**: User message with `options.openrouter.cacheControl` using Effect.gen

## How to Use with Effect AI

```typescript
import * as OpenRouterClient from '@effect/ai-openrouter/OpenRouterClient';
import * as OpenRouterLanguageModel from '@effect/ai-openrouter/OpenRouterLanguageModel';
import * as LanguageModel from '@effect/ai/LanguageModel';
import * as Prompt from '@effect/ai/Prompt';
import { FetchHttpClient } from '@effect/platform';
import { Effect, Layer, Redacted } from 'effect';

// Create OpenRouter client layer
const OpenRouterClientLayer = OpenRouterClient.layer({
  apiKey: Redacted.make(process.env.OPENROUTER_API_KEY!),
}).pipe(Layer.provide(FetchHttpClient.layer));

// Create language model layer with CRITICAL stream_options config
const OpenRouterModelLayer = OpenRouterLanguageModel.layer({
  model: 'anthropic/claude-3.5-sonnet',
  config: {
    stream_options: { include_usage: true }, // CRITICAL: Required!
  },
}).pipe(Layer.provide(OpenRouterClientLayer));

// Use in Effect.gen program
const program = Effect.gen(function* () {
  const response = yield* LanguageModel.generateText({
    prompt: Prompt.make([
      {
        role: 'user',
        content: [
          {
            type: 'text',
            text: 'Large context here...',
            options: {
              openrouter: {
                cacheControl: { type: 'ephemeral' }, // Cache this block
              },
            },
          },
          {
            type: 'text',
            text: 'Your question here',
          },
        ],
      },
    ]),
  });

  // Check cache metrics (0 on a miss, >0 on a cache hit)
  const cachedTokens = response.usage.cachedInputTokens ?? 0;
});

// Run with dependencies
await program.pipe(
  Effect.provide(OpenRouterModelLayer),
  Effect.runPromise,
);
```

## Important Notes

### Critical Configuration

**MUST include `stream_options: { include_usage: true }` in the model config.**

- Without this, `usage.cachedInputTokens` will be undefined
- OpenRouterClient only sets this automatically for streaming by default
- It must be set explicitly in the layer configuration

### Cache Metrics Location

Cache metrics are in `response.usage`:

```typescript
{
  inputTokens: number,
  outputTokens: number,
  cachedInputTokens: number // Number of tokens read from cache
}
```

### Requirements

1. **stream_options.include_usage = true** - Set in the model config layer
2. **Minimum 2048+ tokens** - Smaller content may not be cached (see the sketch after this list)
3. **options.openrouter.cacheControl** - Set on content items in the Prompt
4. **Exact match** - The cache only hits on identical content
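
A hedged pre-flight check for the token minimum; the `estimateTokens` helper and its 4-characters-per-token heuristic are illustrative assumptions, not part of the examples:

```typescript
// Rough heuristic (~4 characters per token for English prose); a real
// tokenizer would be more accurate. Blocks below the minimum cacheable
// size are silently not cached.
const estimateTokens = (text: string): number => Math.ceil(text.length / 4);

const largeContext = 'the content you intend to cache...';
if (estimateTokens(largeContext) < 2048) {
  console.warn('Context likely below the 2048-token minimum; cache_control may be ignored.');
}
```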

### Expected Behavior

- **First call**: `cachedInputTokens = 0` (cache miss, creates the cache entry)
- **Second call**: `cachedInputTokens > 0` (cache hit, reads from the cache)
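
Condensed into code, the verification looks like this sketch (`makePrompt` is assumed to build the identical cached prompt on both calls, as in the example files; layers are provided as shown above):

```typescript
import * as LanguageModel from '@effect/ai/LanguageModel';
import { Console, Effect } from 'effect';

const verifyCaching = Effect.gen(function* () {
  // First call writes the cache entry (miss); the second reads it (hit).
  const first = yield* LanguageModel.generateText({ prompt: makePrompt() });
  yield* Effect.sleep('1 second'); // brief pause between calls, as in the examples
  const second = yield* LanguageModel.generateText({ prompt: makePrompt() });

  const miss = first.usage.cachedInputTokens ?? 0;  // expected: 0
  const hit = second.usage.cachedInputTokens ?? 0;  // expected: > 0
  yield* Console.log(`miss=${miss} hit=${hit} ok=${miss === 0 && hit > 0}`);
});
```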

### Effect-Specific Patterns

- Use `Effect.gen` for composable effect workflows
- Layer-based dependency injection for the client and model
- Type-safe error handling via the Effect type
- Structured concurrency with `Effect.sleep` for delays

## Scientific Method

All examples follow evidence-based verification:

- **Hypothesis**: `options.openrouter.cacheControl` triggers caching
- **Experiment**: Make identical calls twice
- **Evidence**: Measure via `response.usage.cachedInputTokens`
- **Analysis**: Compare cache miss vs cache hit
typescript/effect-ai/src/prompt-caching/multi-message-cache.ts (new file, 115 additions)
```typescript
/**
 * Example: Anthropic Prompt Caching - Multi-Message Conversation (Effect AI)
 *
 * This example demonstrates Anthropic prompt caching in a multi-message conversation
 * via OpenRouter using Effect AI.
 *
 * Pattern: User message cache in multi-turn conversation using Effect patterns
 *
 * To run: bun run typescript/effect-ai/src/prompt-caching/multi-message-cache.ts
 */

import * as OpenRouterClient from '@effect/ai-openrouter/OpenRouterClient';
import * as OpenRouterLanguageModel from '@effect/ai-openrouter/OpenRouterLanguageModel';
import * as LanguageModel from '@effect/ai/LanguageModel';
import * as Prompt from '@effect/ai/Prompt';
import { FetchHttpClient } from '@effect/platform';
import * as BunContext from '@effect/platform-bun/BunContext';
import { LARGE_SYSTEM_PROMPT } from '@openrouter-examples/shared/constants';
import { Console, Effect, Layer, Redacted } from 'effect';

const program = Effect.gen(function* () {
  // A unique test ID ensures this run cannot hit a cache entry left by a previous run.
  const testId = Date.now();
  const largeContext = `Test ${testId}: Context:\n\n${LARGE_SYSTEM_PROMPT}`;

  yield* Console.log('╔════════════════════════════════════════════════════════════════════════════╗');
  yield* Console.log('║            Anthropic Prompt Caching - Multi-Message (Effect AI)             ║');
  yield* Console.log('╚════════════════════════════════════════════════════════════════════════════╝');
  yield* Console.log('');
  yield* Console.log('Testing cache_control in multi-turn conversation');
  yield* Console.log('');

  // Both calls must send byte-identical prompts: the cache only hits on exact matches.
  const makePrompt = () =>
    Prompt.make([
      {
        role: 'user' as const,
        content: [
          {
            type: 'text' as const,
            text: largeContext,
            options: {
              openrouter: {
                cacheControl: { type: 'ephemeral' as const }, // cache this block
              },
            },
          },
          {
            type: 'text' as const,
            text: "Hello, what's your purpose?",
          },
        ],
      },
      {
        role: 'assistant' as const,
        content: "I'm an AI assistant designed to help with various tasks.",
      },
      {
        role: 'user' as const,
        content: 'What programming languages do you know?',
      },
    ]);

  yield* Console.log('First Call (Cache Miss Expected)');
  const response1 = yield* LanguageModel.generateText({
    prompt: makePrompt(),
  });
  const cached1 = response1.usage.cachedInputTokens ?? 0;
  yield* Console.log(`  Response: ${response1.text.substring(0, 80)}...`);
  yield* Console.log(`  cached_tokens=${cached1}`);

  yield* Effect.sleep('1 second');

  yield* Console.log('\nSecond Call (Cache Hit Expected)');
  const response2 = yield* LanguageModel.generateText({
    prompt: makePrompt(),
  });
  const cached2 = response2.usage.cachedInputTokens ?? 0;
  yield* Console.log(`  Response: ${response2.text.substring(0, 80)}...`);
  yield* Console.log(`  cached_tokens=${cached2}`);

  // Analysis
  yield* Console.log('\n' + '='.repeat(80));
  yield* Console.log('ANALYSIS');
  yield* Console.log('='.repeat(80));
  yield* Console.log(`First call:  cached_tokens=${cached1} (expected: 0)`);
  yield* Console.log(`Second call: cached_tokens=${cached2} (expected: >0)`);

  const success = cached1 === 0 && cached2 > 0;

  if (success) {
    yield* Console.log('\n✓ SUCCESS - Multi-message caching is working correctly');
  } else {
    yield* Console.log('\n✗ FAILURE - Multi-message caching is not working as expected');
  }

  yield* Console.log('='.repeat(80));
});

const OpenRouterClientLayer = OpenRouterClient.layer({
  apiKey: Redacted.make(process.env.OPENROUTER_API_KEY!),
}).pipe(Layer.provide(FetchHttpClient.layer));

const OpenRouterModelLayer = OpenRouterLanguageModel.layer({
  model: 'anthropic/claude-3.5-sonnet',
  config: {
    stream_options: { include_usage: true }, // CRITICAL: exposes cachedInputTokens
  },
}).pipe(Layer.provide(OpenRouterClientLayer));

await program.pipe(
  Effect.provide(OpenRouterModelLayer),
  Effect.provide(BunContext.layer),
  Effect.runPromise,
);

console.log('\n✓ Program completed successfully');
```
