fix: optimize memory bank token usage and add new tab support (#2366)

tsmithsz · web-flow · commit 3057d56e4a30 · 2025-10-01T12:52:58.000-07:00
diff --git a/chat-client/src/client/features/rules.test.ts b/chat-client/src/client/features/rules.test.ts
@@ -16,13 +16,17 @@ describe('rules', () => {
         mynahUi = {
             openTopBarButtonOverlay: sinon.stub(),
             showCustomForm: sinon.stub(),
+            getAllTabs: sinon.stub().returns({}),
+            updateStore: sinon.stub().returns('new-tab-id'),
+            notify: sinon.stub(),
         } as unknown as MynahUI
         openTopBarButtonOverlayStub = mynahUi.openTopBarButtonOverlay as sinon.SinonStub
         showCustomFormStub = mynahUi.showCustomForm as sinon.SinonStub
 
         messager = {
             onRuleClick: sinon.stub(),
             onChatPrompt: sinon.stub(),
+            onTabAdd: sinon.stub(),
         } as unknown as Messager
 
         rulesList = new RulesList(mynahUi, messager)
@@ -151,12 +155,17 @@ describe('rules', () => {
 
             onItemClick(createMemoryBankItem)
 
-            // Should send a chat prompt
+            // Should create new tab and send chat prompt
+            sinon.assert.calledOnce(messager.onTabAdd as sinon.SinonStub)
             sinon.assert.calledOnce(messager.onChatPrompt as sinon.SinonStub)
 
+            const tabAddArgs = (messager.onTabAdd as sinon.SinonStub).getCall(0).args[0]
+            assert.equal(tabAddArgs, 'new-tab-id')
+
             const chatPromptArgs = (messager.onChatPrompt as sinon.SinonStub).getCall(0).args[0]
             assert.equal(chatPromptArgs.prompt.prompt, 'Generate a Memory Bank for this project')
             assert.equal(chatPromptArgs.prompt.escapedPrompt, 'Generate a Memory Bank for this project')
+            assert.equal(chatPromptArgs.tabId, 'new-tab-id')
         })
 
         it('calls messager when regular rule is clicked', () => {
diff --git a/chat-client/src/client/features/rules.ts b/chat-client/src/client/features/rules.ts
@@ -1,4 +1,11 @@
-import { MynahIconsType, MynahUI, DetailedListItem, DetailedListItemGroup, MynahIcons } from '@aws/mynah-ui'
+import {
+    MynahIconsType,
+    MynahUI,
+    DetailedListItem,
+    DetailedListItemGroup,
+    MynahIcons,
+    NotificationType,
+} from '@aws/mynah-ui'
 import { Messager } from '../messager'
 import { ListRulesResult } from '@aws/language-server-runtimes-types'
 import { RulesFolder } from '@aws/language-server-runtimes-types'
@@ -82,14 +89,38 @@ export class RulesList {
         // Close the rules list first
         this.rulesList?.close()
 
-        // Use the current tab, the tabId should be the same as the one used for the rules list
-        this.messager.onChatPrompt({
-            prompt: {
-                prompt: 'Generate a Memory Bank for this project',
-                escapedPrompt: 'Generate a Memory Bank for this project',
-            },
-            tabId: this.tabId,
-        })
+        // Check if we're at the tab limit (10 tabs max)
+        const currentTabCount = Object.keys(this.mynahUi.getAllTabs()).length
+        if (currentTabCount >= 10) {
+            // Show notification that max tabs reached
+            this.mynahUi.notify({
+                content: 'You can only open ten conversation tabs at a time.',
+                type: NotificationType.WARNING,
+            })
+            return
+        }
+
+        // Create a new tab for the memory bank generation
+        const newTabId = this.mynahUi.updateStore('', { tabTitle: 'Memory Bank' })
+        if (newTabId) {
+            // Tell the messager about the tab that updateStore just created
+            this.messager.onTabAdd(newTabId)
+
+            // Send the chat prompt to the new tab
+            this.messager.onChatPrompt({
+                prompt: {
+                    prompt: 'Generate a Memory Bank for this project',
+                    escapedPrompt: 'Generate a Memory Bank for this project',
+                },
+                tabId: newTabId,
+            })
+        } else {
+            // Show error notification if tab creation failed
+            this.mynahUi.notify({
+                content: 'Failed to create new tab for Memory Bank generation.',
+                type: NotificationType.ERROR,
+            })
+        }
     }
 
     showLoading(tabId: string) {
diff --git a/server/aws-lsp-codewhisperer/src/language-server/agenticChat/agenticChatController.ts b/server/aws-lsp-codewhisperer/src/language-server/agenticChat/agenticChatController.ts
@@ -189,6 +189,8 @@ import {
     DEFAULT_WINDOW_STOP_SHORTCUT,
     COMPACTION_CHARACTER_THRESHOLD,
     MAX_OVERALL_CHARACTERS,
+    FSREAD_MEMORY_BANK_MAX_PER_FILE,
+    FSREAD_MEMORY_BANK_MAX_TOTAL,
 } from './constants/constants'
 import {
     AgenticChatError,
@@ -837,9 +839,17 @@ export class AgenticChatController implements ChatHandlers {
 
         IdleWorkspaceManager.recordActivityTimestamp()
 
+        const sessionResult = this.#chatSessionManagementService.getSession(params.tabId)
+        const { data: session, success } = sessionResult
+
+        if (!success) {
+            return new ResponseError<ChatResult>(ErrorCodes.InternalError, sessionResult.error)
+        }
+
         // Memory Bank Creation Flow - Delegate to MemoryBankController
         if (this.#memoryBankController.isMemoryBankCreationRequest(params.prompt.prompt)) {
             this.#features.logging.info(`Memory Bank creation request detected for tabId: ${params.tabId}`)
+            session.isMemoryBankGeneration = true
 
             // Store original prompt to prevent data loss on failure
             const originalPrompt = params.prompt.prompt
@@ -921,6 +931,8 @@ export class AgenticChatController implements ChatHandlers {
                 this.#features.logging.error(`Memory Bank preparation failed: ${error}`)
                 // Restore original prompt to ensure no data loss
                 params.prompt.prompt = originalPrompt
+                // Reset memory bank flag since preparation failed
+                session.isMemoryBankGeneration = false
             }
         }
 
@@ -929,14 +941,6 @@ export class AgenticChatController implements ChatHandlers {
             return maybeDefaultResponse
         }
 
-        const sessionResult = this.#chatSessionManagementService.getSession(params.tabId)
-
-        const { data: session, success } = sessionResult
-
-        if (!success) {
-            return new ResponseError<ChatResult>(ErrorCodes.InternalError, sessionResult.error)
-        }
-
         const compactIds = session.getAllDeferredCompactMessageIds()
         await this.#invalidateCompactCommand(params.tabId, compactIds)
         session.rejectAllDeferredToolExecutions(new ToolApprovalException('Command ignored: new prompt', false))
@@ -1930,7 +1934,14 @@ export class AgenticChatController implements ChatHandlers {
                         }
 
                         const { Tool } = toolMap[toolUse.name as keyof typeof toolMap]
-                        const tool = new Tool(this.#features)
+                        const tool =
+                            toolUse.name === FS_READ && session.isMemoryBankGeneration
+                                ? new Tool(
+                                      this.#features,
+                                      FSREAD_MEMORY_BANK_MAX_PER_FILE,
+                                      FSREAD_MEMORY_BANK_MAX_TOTAL
+                                  )
+                                : new Tool(this.#features)
 
                         // For MCP tools, get the permission from McpManager
                         // const permission = McpManager.instance.getToolPerm('Built-in', toolUse.name)
@@ -3458,6 +3469,9 @@ export class AgenticChatController implements ChatHandlers {
             },
         })
 
+        // Reset memory bank flag after completion
+        session.isMemoryBankGeneration = false
+
         return chatResultStream.getResult()
     }
 
@@ -3485,6 +3499,12 @@ export class AgenticChatController implements ChatHandlers {
         const errorCode = err.code ?? ''
         await this.#telemetryController.emitAddMessageMetric(tabId, metric.metric, 'Failed', errorMessage, errorCode)
 
+        // Reset memory bank flag on request error
+        const sessionResult = this.#chatSessionManagementService.getSession(tabId)
+        if (sessionResult.success) {
+            sessionResult.data.isMemoryBankGeneration = false
+        }
+
         if (isUsageLimitError(err)) {
             if (this.#paidTierMode !== 'paidtier') {
                 this.setPaidTierMode(tabId, 'freetier-limit')
diff --git a/server/aws-lsp-codewhisperer/src/language-server/agenticChat/constants/constants.ts b/server/aws-lsp-codewhisperer/src/language-server/agenticChat/constants/constants.ts
@@ -81,6 +81,16 @@ The summary should have following main sections:
 </example_output>
 `
 
+// FsRead limits, in characters: per-file truncation cap and total cap across all files in one read
+export const FSREAD_MAX_PER_FILE = 200_000
+export const FSREAD_MAX_TOTAL = 400_000
+export const FSREAD_MEMORY_BANK_MAX_PER_FILE = 20_000
+export const FSREAD_MEMORY_BANK_MAX_TOTAL = 100_000
+
+// Memory Bank constants
+// Temporarily lowered to 5 to reduce token usage (recommended: 20; call sites previously hard-coded 10)
+export const MAX_NUMBER_OF_FILES_FOR_MEMORY_BANK_RANKING = 5
+
 // shortcut constant
 export const DEFAULT_MACOS_RUN_SHORTCUT = '&#8679; &#8984; &#8629;'
 export const DEFAULT_WINDOW_RUN_SHORTCUT = 'Ctrl + &#8679; + &#8629;'
diff --git a/server/aws-lsp-codewhisperer/src/language-server/agenticChat/context/memorybank/memoryBankController.ts b/server/aws-lsp-codewhisperer/src/language-server/agenticChat/context/memorybank/memoryBankController.ts
@@ -6,6 +6,7 @@
 import { Features } from '@aws/language-server-runtimes/server-interface/server'
 import { MemoryBankPrompts } from './memoryBankPrompts'
 import { normalizePathFromUri } from '../../tools/mcp/mcpUtils'
+import { MAX_NUMBER_OF_FILES_FOR_MEMORY_BANK_RANKING } from '../../constants/constants'
 
 const MEMORY_BANK_DIRECTORY = '.amazonq/rules/memory-bank'
 const MEMORY_BANK_FILES = {
@@ -71,7 +72,10 @@ export class MemoryBankController {
             const analysisResults = await this.executeGuidelinesGenerationPipeline(workspaceFolderUri)
 
             // Step 3: Make LLM call for file ranking
-            const rankingPrompt = MemoryBankPrompts.getFileRankingPrompt(analysisResults.formattedFilesString, 10)
+            const rankingPrompt = MemoryBankPrompts.getFileRankingPrompt(
+                analysisResults.formattedFilesString,
+                MAX_NUMBER_OF_FILES_FOR_MEMORY_BANK_RANKING
+            )
             const rankedFilesResponse = await llmCallFunction(rankingPrompt)
 
             // Step 4: Parse ranked files
@@ -111,7 +115,7 @@ export class MemoryBankController {
                 this.features.logging.warn(
                     `Memory Bank: failed to parse LLM ranking response, using TF-IDF fallback: ${error}`
                 )
-                rankedFilesList = analysisResults.rankedFilesList.slice(0, 10)
+                rankedFilesList = analysisResults.rankedFilesList.slice(0, MAX_NUMBER_OF_FILES_FOR_MEMORY_BANK_RANKING)
             }
 
             this.features.logging.info(
@@ -477,7 +481,7 @@ export class MemoryBankController {
             // Step 5: Create fallback ranking (deterministic, for when LLM fails)
             const rankedFilesList = filesWithDissimilarity
                 .sort((a, b) => b.dissimilarity - a.dissimilarity)
-                .slice(0, 10)
+                .slice(0, MAX_NUMBER_OF_FILES_FOR_MEMORY_BANK_RANKING)
                 .map(f => f.path)
 
             return {
diff --git a/server/aws-lsp-codewhisperer/src/language-server/agenticChat/tools/fsRead.ts b/server/aws-lsp-codewhisperer/src/language-server/agenticChat/tools/fsRead.ts
@@ -1,6 +1,7 @@
 import { sanitize } from '@aws/lsp-core/out/util/path'
 import { CommandValidation, InvokeOutput, requiresPathAcceptance, validatePath } from './toolShared'
 import { Features } from '@aws/language-server-runtimes/server-interface/server'
+import { FSREAD_MAX_PER_FILE, FSREAD_MAX_TOTAL } from '../constants/constants'
 
 export interface FsReadParams {
     paths: string[]
@@ -13,16 +14,24 @@ export interface FileReadResult {
 }
 
 export class FsRead {
-    static maxResponseSize = 200_000
-    static maxResponseSizeTotal = 400_000
+    static maxResponseSize = FSREAD_MAX_PER_FILE
+    static maxResponseSizeTotal = FSREAD_MAX_TOTAL
     private readonly logging: Features['logging']
     private readonly workspace: Features['workspace']
     private readonly lsp: Features['lsp']
+    private readonly maxPerFile: number
+    private readonly maxTotal: number
 
-    constructor(features: Pick<Features, 'lsp' | 'workspace' | 'logging'> & Partial<Features>) {
+    constructor(
+        features: Pick<Features, 'lsp' | 'workspace' | 'logging'> & Partial<Features>,
+        maxPerFile?: number,
+        maxTotal?: number
+    ) {
         this.logging = features.logging
         this.workspace = features.workspace
         this.lsp = features.lsp
+        this.maxPerFile = maxPerFile ?? FsRead.maxResponseSize
+        this.maxTotal = maxTotal ?? FsRead.maxResponseSizeTotal
     }
 
     public async validate(params: FsReadParams): Promise<void> {
@@ -62,16 +71,16 @@ export class FsRead {
     private createOutput(fileResult: FileReadResult[]): InvokeOutput {
         let totalSize = 0
         for (const result of fileResult) {
-            const exceedsMaxSize = result.content.length > FsRead.maxResponseSize
+            const exceedsMaxSize = result.content.length > this.maxPerFile
             if (exceedsMaxSize) {
-                this.logging.info(`FsRead: truncating ${result.path} to first ${FsRead.maxResponseSize} characters`)
-                result.content = result.content.substring(0, FsRead.maxResponseSize - 3) + '...'
+                this.logging.info(`FsRead: truncating ${result.path} to first ${this.maxPerFile} characters`)
+                result.content = result.content.substring(0, this.maxPerFile - 3) + '...'
                 result.truncated = true
             }
             totalSize += result.content.length
         }
 
-        if (totalSize > FsRead.maxResponseSizeTotal) {
+        if (totalSize > this.maxTotal) {
             throw Error('Files are too large, please break the file read into smaller chunks')
         }
 
diff --git a/server/aws-lsp-codewhisperer/src/language-server/chat/chatSessionService.ts b/server/aws-lsp-codewhisperer/src/language-server/chat/chatSessionService.ts
@@ -41,6 +41,7 @@ export class ChatSessionService {
     public pairProgrammingMode: boolean = true
     public contextListSent: boolean = false
     public modelId: string | undefined
+    public isMemoryBankGeneration: boolean = false
     #lsp?: Features['lsp']
     #abortController?: AbortController
     #currentPromptId?: string