fix: address PR review comments

hannesrudolph · daniel-lxs · commit 24eca3fe89a7 · 2025-06-25T19:31:59.000-05:00
- Extract IMAGE_TOKEN_ESTIMATE as a named constant for clarity
- Update token counting tests to use exact counts instead of ranges for deterministic testing
- Fix test expectations to match actual tokenizer output
diff --git a/src/api/providers/__tests__/claude-code-token-counting.spec.ts b/src/api/providers/__tests__/claude-code-token-counting.spec.ts
@@ -27,11 +27,9 @@ describe("ClaudeCodeHandler Token Counting", () => {
 
 			const tokenCount = await handler.countTokens(content)
 
-			// The text has approximately 13-15 tokens
-			// With no fudge factor, we expect the exact token count
-			// With the old 1.5x fudge factor, it would have been around 20-23 tokens
-			expect(tokenCount).toBeLessThan(16)
-			expect(tokenCount).toBeGreaterThan(12)
+			// The exact token count for this text using o200k_base tokenizer is 13
+			// With the old 1.5x fudge factor, it would have been 20 tokens
+			expect(tokenCount).toBe(13)
 		})
 
 		it("should handle empty content", async () => {
@@ -49,10 +47,9 @@ describe("ClaudeCodeHandler Token Counting", () => {
 
 			const tokenCount = await handler.countTokens(content)
 
-			// Each block is approximately 2-3 tokens, so 6-9 tokens total
-			// With no fudge factor, expect exact count
-			expect(tokenCount).toBeLessThan(10) // Would be ~15 with old 1.5x factor
-			expect(tokenCount).toBeGreaterThan(5)
+			// "First block" = 2 tokens, "Second block" = 2 tokens, "Third block" = 2 tokens
+			// Total: 6 tokens (would have been 9 with old 1.5x factor)
+			expect(tokenCount).toBe(6)
 		})
 
 		it("should handle image blocks with conservative estimate", async () => {
@@ -74,44 +71,52 @@ describe("ClaudeCodeHandler Token Counting", () => {
 		})
 
 		it("should provide accurate token counts for typical messages", async () => {
-			// Simulate a typical user message with environment details
+			// Use a simpler, predictable message for exact token counting
 			const content: Anthropic.Messages.ContentBlockParam[] = [
 				{
 					type: "text",
-					text: `Hi
+					text: "This is a simple test message with exactly predictable token count.",
+				},
+			]
 
-<environment_details>
-# VSCode Visible Files
-src/app.ts
-src/utils.ts
+			const tokenCount = await handler.countTokens(content)
 
-# VSCode Open Tabs
-src/app.ts
+			// This specific text has exactly 12 tokens with o200k_base tokenizer
+			// With old 1.5x factor, it would have been 18 tokens
+			expect(tokenCount).toBe(12)
+		})
 
-# Current Time
-2024-01-01 12:00:00 PM
+		it("should handle mixed content types", async () => {
+			const content: Anthropic.Messages.ContentBlockParam[] = [
+				{ type: "text", text: "Hello world" }, // 2 tokens
+				{
+					type: "image",
+					source: {
+						type: "base64",
+						media_type: "image/jpeg",
+						data: "base64data",
+					},
+				}, // 300 tokens (IMAGE_TOKEN_ESTIMATE)
+				{ type: "text", text: "Goodbye" }, // 2 tokens
+			]
 
-# Current Context Size (Tokens)
-1000 (5%)
+			const tokenCount = await handler.countTokens(content)
 
-# Current Cost
-$0.05
+			// Total: 2 + 300 + 2 = 304 tokens ("Goodbye" is actually 2 tokens)
+			expect(tokenCount).toBe(304)
+		})
 
-# Current Mode
-<slug>code</slug>
-<name>Code</name>
-<model>claude-3-5-sonnet-20241022</model>
-</environment_details>`,
-				},
+		it("should handle empty text blocks", async () => {
+			const content: Anthropic.Messages.ContentBlockParam[] = [
+				{ type: "text", text: "" },
+				{ type: "text", text: "Hello" }, // 1 token
+				{ type: "text", text: "" },
 			]
 
 			const tokenCount = await handler.countTokens(content)
 
-			// This content is approximately 100-120 tokens
-			// With no fudge factor, expect exact count
-			// With old 1.5x factor, it would have been 150-180 tokens
-			expect(tokenCount).toBeLessThan(125)
-			expect(tokenCount).toBeGreaterThan(95)
+			// Only "Hello" contributes tokens
+			expect(tokenCount).toBe(1)
 		})
 	})
 })
diff --git a/src/api/providers/claude-code.ts b/src/api/providers/claude-code.ts
@@ -10,6 +10,10 @@ import { ApiHandlerOptions } from "../../shared/api"
 import { Tiktoken } from "tiktoken/lite"
 import o200kBase from "tiktoken/encoders/o200k_base"
 
+// Conservative token estimate for images (even though Claude Code doesn't support them)
+// This matches the estimate used in src/utils/tiktoken.ts for consistency
+const IMAGE_TOKEN_ESTIMATE = 300
+
 export class ClaudeCodeHandler extends BaseProvider implements ApiHandler {
 	private options: ApiHandlerOptions
 	private encoder: Tiktoken | null = null
@@ -176,8 +180,7 @@ export class ClaudeCodeHandler extends BaseProvider implements ApiHandler {
 				}
 			} else if (block.type === "image") {
 				// Claude Code doesn't support images, but we handle them just in case
-				// Use a conservative estimate
-				totalTokens += 300
+				totalTokens += IMAGE_TOKEN_ESTIMATE
 			}
 		}
 

Original file line number	Diff line number	Diff line change
`@@ -10,6 +10,10 @@ import { ApiHandlerOptions } from "../../shared/api"`
`10`	`10`	`import { Tiktoken } from "tiktoken/lite"`
`11`	`11`	`import o200kBase from "tiktoken/encoders/o200k_base"`
`12`	`12`
	`13`	`+// Conservative token estimate for images (even though Claude Code doesn't support them)`
	`14`	`+// This matches the estimate used in src/utils/tiktoken.ts for consistency`
	`15`	`+const IMAGE_TOKEN_ESTIMATE = 300`
	`16`	`+`
`13`	`17`	`export class ClaudeCodeHandler extends BaseProvider implements ApiHandler {`
`14`	`18`	`private options: ApiHandlerOptions`
`15`	`19`	`private encoder: Tiktoken \| null = null`
`@@ -176,8 +180,7 @@ export class ClaudeCodeHandler extends BaseProvider implements ApiHandler {`
`176`	`180`	`}`
`177`	`181`	`} else if (block.type === "image") {`
`178`	`182`	`// Claude Code doesn't support images, but we handle them just in case`
`179`		`- // Use a conservative estimate`
`180`		`- totalTokens += 300`
	`183`	`+ totalTokens += IMAGE_TOKEN_ESTIMATE`
`181`	`184`	`}`
`182`	`185`	`}`
`183`	`186`