[Condense] Add button for basic condensing of task message history

canrobins13 · canrobins13 · commit c2d7d416171e · 2025-05-12T16:31:59.000-07:00
diff --git a/src/core/task/Task.ts b/src/core/task/Task.ts
@@ -355,6 +355,13 @@ export class Task extends EventEmitter<ClineEvents> {
 		}
 	}
 
+	/** Condenses this task's message history to use fewer tokens; for now it only runs the regular truncation check. */
+	async condenseHistory() {
+		// TODO(canyon): Replace with LLM summarization a la https://github.com/cline/cline/pull/3086
+		const lastApiReqIdx = findLastIndex(this.clineMessages, (msg) => msg.say === "api_req_started")
+		await this.maybeTruncateConversationHistory(lastApiReqIdx)
+	}
+
 	// Note that `partial` has three valid states true (partial message),
 	// false (completion of partial message), undefined (individual complete
 	// message).
@@ -1419,49 +1426,7 @@ export class Task extends EventEmitter<ClineEvents> {
 			)
 		})()
 
-		// If the previous API request's total token usage is close to the
-		// context window, truncate the conversation history to free up space
-		// for the new request.
-		if (previousApiReqIndex >= 0) {
-			const previousRequest = this.clineMessages[previousApiReqIndex]?.text
-
-			if (!previousRequest) {
-				return
-			}
-
-			const {
-				tokensIn = 0,
-				tokensOut = 0,
-				cacheWrites = 0,
-				cacheReads = 0,
-			}: ClineApiReqInfo = JSON.parse(previousRequest)
-
-			const totalTokens = tokensIn + tokensOut + cacheWrites + cacheReads
-
-			// Default max tokens value for thinking models when no specific
-			// value is set.
-			const DEFAULT_THINKING_MODEL_MAX_TOKENS = 16_384
-
-			const modelInfo = this.api.getModel().info
-
-			const maxTokens = modelInfo.thinking
-				? this.apiConfiguration.modelMaxTokens || DEFAULT_THINKING_MODEL_MAX_TOKENS
-				: modelInfo.maxTokens
-
-			const contextWindow = modelInfo.contextWindow
-
-			const trimmedMessages = await truncateConversationIfNeeded({
-				messages: this.apiConversationHistory,
-				totalTokens,
-				maxTokens,
-				contextWindow,
-				apiHandler: this.api,
-			})
-
-			if (trimmedMessages !== this.apiConversationHistory) {
-				await this.overwriteApiConversationHistory(trimmedMessages)
-			}
-		}
+		await this.maybeTruncateConversationHistory(previousApiReqIndex)
 
 		// Clean conversation history by:
 		// 1. Converting to Anthropic.MessageParam by spreading only the API-required properties.
@@ -1585,6 +1550,52 @@ export class Task extends EventEmitter<ClineEvents> {
 		yield* iterator
 	}
 
+	private async maybeTruncateConversationHistory(previousApiReqIndex: number) {
+		// Without an earlier API request there is no token usage to evaluate.
+		if (previousApiReqIndex < 0) {
+			return
+		}
+
+		const usageJson = this.clineMessages[previousApiReqIndex]?.text
+
+		if (!usageJson) {
+			return
+		}
+
+		// Any counter missing from the stored request info counts as zero.
+		const usage: ClineApiReqInfo = JSON.parse(usageJson)
+		const { tokensIn = 0, tokensOut = 0, cacheWrites = 0, cacheReads = 0 } = usage
+		const totalTokens = tokensIn + tokensOut + cacheWrites + cacheReads
+
+		// Default max tokens value for thinking models when no specific
+		// value is set.
+		const DEFAULT_THINKING_MODEL_MAX_TOKENS = 16_384
+
+		const { info } = this.api.getModel()
+
+		let maxTokens = info.maxTokens
+
+		if (info.thinking) {
+			maxTokens = this.apiConfiguration.modelMaxTokens || DEFAULT_THINKING_MODEL_MAX_TOKENS
+		}
+
+		// Hand the previous request's usage and the model limits to the
+		// truncation helper, which returns the history to keep.
+		const contextWindow = info.contextWindow
+		const trimmedMessages = await truncateConversationIfNeeded({
+			messages: this.apiConversationHistory,
+			totalTokens,
+			maxTokens,
+			contextWindow,
+			apiHandler: this.api,
+		})
+
+		// Persist only when the helper handed back something other than the current history array.
+		if (trimmedMessages !== this.apiConversationHistory) {
+			await this.overwriteApiConversationHistory(trimmedMessages)
+		}
+	}
+
 	// Checkpoints
 
 	public async checkpointSave() {
diff --git a/src/core/webview/ClineProvider.ts b/src/core/webview/ClineProvider.ts
@@ -1181,6 +1181,22 @@ export class ClineProvider extends EventEmitter<ClineProviderEvents> implements
 		}
 	}
 
+	/** Condenses the message history of the task with the given id so it uses fewer tokens. */
+	async condenseTaskHistory(id: string) {
+		// Walk a reversed copy of clineStack so the last matching entry wins.
+		let task = this.clineStack
+			.slice()
+			.reverse()
+			.find((candidate) => candidate.taskId === id)
+
+		// Not on the stack: look the task up by id and initialize it from its history item.
+		if (!task) {
+			const { historyItem } = await this.getTaskWithId(id)
+			task = await this.initClineWithHistoryItem(historyItem)
+		}
+		await task.condenseHistory()
+	}
+
 	async deleteTaskFromState(id: string) {
 		const taskHistory = this.getGlobalState("taskHistory") ?? []
 		const updatedTaskHistory = taskHistory.filter((task) => task.id !== id)
diff --git a/src/core/webview/webviewMessageHandler.ts b/src/core/webview/webviewMessageHandler.ts
@@ -198,6 +198,9 @@ export const webviewMessageHandler = async (provider: ClineProvider, message: We
 		case "deleteTaskWithId":
 			provider.deleteTaskWithId(message.text!)
 			break
+		case "condenseTaskHistory":
+			provider.condenseTaskHistory(message.text!)
+			break
 		case "deleteMultipleTasksWithIds": {
 			const ids = message.ids
 
diff --git a/src/shared/WebviewMessage.ts b/src/shared/WebviewMessage.ts
@@ -38,6 +38,7 @@ export interface WebviewMessage {
 		| "showTaskWithId"
 		| "deleteTaskWithId"
 		| "exportTaskWithId"
+		| "condenseTaskHistory"
 		| "importSettings"
 		| "exportSettings"
 		| "resetState"
diff --git a/webview-ui/src/components/chat/TaskActions.tsx b/webview-ui/src/components/chat/TaskActions.tsx
@@ -24,6 +24,13 @@ export const TaskActions = ({ item }: { item: HistoryItem | undefined }) => {
 			</Button>
 			{!!item?.size && item.size > 0 && (
 				<>
+					<Button
+						variant="ghost"
+						size="sm"
+						title={t("chat:task.condenseTaskHistory")}
+						onClick={() => vscode.postMessage({ type: "condenseTaskHistory", text: item?.id })}>
+						<span className="codicon codicon-file-zip" />
+					</Button>
 					<Button
 						variant="ghost"
 						size="sm"
diff --git a/webview-ui/src/i18n/locales/en/chat.json b/webview-ui/src/i18n/locales/en/chat.json
@@ -10,6 +10,7 @@
 		"contextWindow": "Context Length:",
 		"closeAndStart": "Close task and start a new one",
 		"export": "Export task history",
+		"condenseTaskHistory": "Condense task message history",
 		"delete": "Delete Task (Shift + Click to skip confirmation)"
 	},
 	"unpin": "Unpin",