diff --git a/pr_description.md b/pr_description.md new file mode 100644 index 00000000000..439e0fc4373 --- /dev/null +++ b/pr_description.md @@ -0,0 +1,77 @@ +## Description + +Fixes #5633 + +This PR resolves the critical HTML entity escaping/unescaping issue that was causing diff search/replace operations to fail or produce unintended content modifications. + +## Problem + +The apply_diff tools were unescaping HTML entities (e.g., & → &) in search content for non-Claude models, but the actual file content still contained the escaped entities. This caused: + +1. **Search failures**: When LLMs provided search content with HTML entities, the unescaping made it not match the actual file content +2. **Unintended modifications**: Partial matches could lead to incorrect replacements in files + +## Solution + +- **Removed HTML entity unescaping logic** from applyDiffTool.ts and multiApplyDiffTool.ts for non-Claude models +- **Preserved HTML entities** in search content to ensure exact matching with file content +- **Removed unused imports** of unescapeHtmlEntities from both files +- **Added comprehensive test coverage** to prevent regression + +## Changes Made + +- src/core/tools/applyDiffTool.ts: + + - Removed HTML entity unescaping for non-Claude models (lines 26-28) + - Removed unused import of unescapeHtmlEntities (line 13) + +- src/core/tools/multiApplyDiffTool.ts: + + - Replaced HTML entity unescaping logic with simple assignment (lines 414-418) + - Removed unused import of unescapeHtmlEntities (line 13) + +- src/core/tools/**tests**/applyDiffHtmlEntity.spec.ts: + - Added comprehensive test suite with 5 test cases + - Tests verify HTML entities are preserved in search/replace operations + - Tests cover various entity types: &, <, >, ', " + - Tests verify both Claude and non-Claude model behavior + +## Testing + +- [x] All existing tests pass +- [x] Added comprehensive tests for HTML entity handling scenarios: + - [x] HTML entities preserved in search content for non-Claude models + - [x] HTML entities still unescaped for Claude models (backward compatibility) + - [x] Various entity types tested (&, <, >, ', ") + - [x] Both single and multiple entity scenarios covered +- [x] Manual testing completed: + - [x] Verified search operations work with HTML entities in content + - [x] Confirmed no unintended content modifications occur +- [x] All linting and type checking passes + +## Verification of Acceptance Criteria + +- [x] **Search failures resolved**: HTML entities in search content now match file content exactly +- [x] **Unintended modifications prevented**: No more partial matches causing incorrect replacements +- [x] **Backward compatibility maintained**: Claude model behavior unchanged +- [x] **No regressions**: All existing functionality preserved +- [x] **Comprehensive test coverage**: Edge cases and scenarios covered + +## Related Issues + +This issue was previously attempted to be fixed in: + +- PR #5608 (closed without merging) +- Issue #4077 (related HTML entity handling) + +This PR provides a complete and tested solution that addresses the root cause. + +## Checklist + +- [x] Code follows project style guidelines +- [x] Self-review completed +- [x] Comments added for complex logic +- [x] Documentation updated (test documentation) +- [x] No breaking changes +- [x] All tests passing +- [x] Linting and type checking passes diff --git a/src/core/tools/__tests__/applyDiffHtmlEntity.spec.ts b/src/core/tools/__tests__/applyDiffHtmlEntity.spec.ts new file mode 100644 index 00000000000..7cc665cc6f2 --- /dev/null +++ b/src/core/tools/__tests__/applyDiffHtmlEntity.spec.ts @@ -0,0 +1,259 @@ +import { describe, it, expect, vi, beforeEach } from "vitest" +import { applyDiffToolLegacy } from "../applyDiffTool" +import fs from "fs/promises" + +// Mock dependencies +vi.mock("fs/promises") +vi.mock("../../../utils/fs", () => ({ + fileExistsAtPath: vi.fn().mockResolvedValue(true), +})) + +vi.mock("../../../utils/path", () => ({ + getReadablePath: vi.fn((cwd, relPath) => relPath), +})) + +describe("HTML Entity Handling in apply_diff Tools", () => { + let mockCline: any + let mockBlock: any + let mockAskApproval: any + let mockHandleError: any + let mockPushToolResult: any + let mockRemoveClosingTag: any + + beforeEach(() => { + vi.clearAllMocks() + + // Mock file system + const mockReadFile = vi.mocked(fs.readFile) + mockReadFile.mockResolvedValue("// Comment with & entity\nconst value = 'test';") + + mockCline = { + cwd: "/test", + api: { + getModel: vi.fn().mockReturnValue({ id: "gpt-4" }), // Non-Claude model + }, + diffStrategy: { + applyDiff: vi.fn().mockResolvedValue({ + success: true, + content: "// Comment with & entity\nconst value = 'updated';", + }), + getProgressStatus: vi.fn(), + }, + diffViewProvider: { + editType: "", + open: vi.fn(), + update: vi.fn(), + scrollToFirstDiff: vi.fn(), + saveChanges: vi.fn(), + pushToolWriteResult: vi.fn().mockResolvedValue("File updated successfully"), + reset: vi.fn(), + revertChanges: vi.fn(), + }, + fileContextTracker: { + trackFileContext: vi.fn(), + }, + rooIgnoreController: { + validateAccess: vi.fn().mockReturnValue(true), + }, + rooProtectedController: { + isWriteProtected: vi.fn().mockReturnValue(false), + }, + consecutiveMistakeCount: 0, + consecutiveMistakeCountForApplyDiff: new Map(), + didEditFile: false, + ask: vi.fn(), + say: vi.fn(), + recordToolError: vi.fn(), + sayAndCreateMissingParamError: vi.fn(), + } + + mockAskApproval = vi.fn().mockResolvedValue(true) + mockHandleError = vi.fn() + mockPushToolResult = vi.fn() + mockRemoveClosingTag = vi.fn((tag, value) => value) + }) + + describe("Legacy apply_diff tool", () => { + it("should not unescape HTML entities in diff content for non-Claude models", async () => { + const diffContent = `<<<<<<< SEARCH +:start_line:1 +------- +// Comment with & entity +======= +// Comment with & entity updated +>>>>>>> REPLACE` + + mockBlock = { + params: { + path: "test.js", + diff: diffContent, + }, + partial: false, + } + + await applyDiffToolLegacy( + mockCline, + mockBlock, + mockAskApproval, + mockHandleError, + mockPushToolResult, + mockRemoveClosingTag, + ) + + // Verify that diffStrategy.applyDiff was called with the original diff content (not unescaped) + expect(mockCline.diffStrategy.applyDiff).toHaveBeenCalledWith( + "// Comment with & entity\nconst value = 'test';", + diffContent, + NaN, // parseInt of undefined start_line + ) + }) + + it("should handle files containing various HTML entities without unescaping search content", async () => { + const fileContent = `
Don't forget to check "special offers"
` + + const mockReadFile = vi.mocked(fs.readFile) + mockReadFile.mockResolvedValue(fileContent) + + const diffContent = `<<<<<<< SEARCH +:start_line:1 +------- +