fix: auto increase context size (#7609)

louis-jan · web-flow · commit e2146cd5f7cf · 2026-03-04T16:31:40.000+07:00
diff --git a/web-app/src/containers/MessageItem.tsx b/web-app/src/containers/MessageItem.tsx
@@ -48,13 +48,17 @@ export type MessageItemProps = {
   onDelete?: (messageId: string) => void
   assistant?: { avatar?: React.ReactNode; name?: string }
   showAssistant?: boolean
+  isAnimating?: boolean
+  hideActions?: boolean
 }
 
 export const MessageItem = memo(
   ({
     message,
     isLastMessage,
     status,
+    isAnimating,
+    hideActions,
     reasoningContainerRef,
     onRegenerate,
     onEdit,
@@ -185,6 +189,7 @@ export const MessageItem = memo(
                 content={part.text}
                 isStreaming={isStreaming && isLastPart}
                 messageId={message.id}
+                isAnimating={isAnimating}
               />
             </>
           )}
@@ -345,7 +350,7 @@ export const MessageItem = memo(
         })}
 
         {/* Message actions for user messages */}
-        {message.role === 'user' && (
+        {message.role === 'user' && !hideActions && (
           <div className="flex items-center justify-end gap-1 text-muted-foreground text-xs mt-4">
             <CopyButton text={getFullTextContent()} />
 
@@ -369,7 +374,7 @@ export const MessageItem = memo(
               <div
                 className={cn(
                   'flex items-center gap-1',
-                  isStreaming && 'hidden'
+                  (isStreaming || hideActions) && 'hidden'
                 )}
               >
                 <CopyButton text={getFullTextContent()} />
@@ -434,7 +439,8 @@ export const MessageItem = memo(
       prevProps.isFirstMessage === nextProps.isFirstMessage &&
       prevProps.isLastMessage === nextProps.isLastMessage &&
       prevProps.status === nextProps.status &&
-      prevProps.showAssistant === nextProps.showAssistant
+      prevProps.showAssistant === nextProps.showAssistant &&
+      prevProps.hideActions === nextProps.hideActions
     )
   }
 )
diff --git a/web-app/src/containers/RenderMarkdown.tsx b/web-app/src/containers/RenderMarkdown.tsx
@@ -21,6 +21,7 @@ interface MarkdownProps {
   isUser?: boolean
   isStreaming?: boolean
   messageId?: string
+  isAnimating?: boolean
 }
 
 // Cache for normalized LaTeX content
@@ -85,6 +86,7 @@ function RenderMarkdownComponent({
   isUser,
   components,
   messageId,
+  isAnimating
 }: MarkdownProps) {
 
   // Memoize the normalized content to avoid reprocessing on every render
@@ -101,7 +103,7 @@ function RenderMarkdownComponent({
       )}
     >
       <Streamdown
-        animate={true}
+        animate={isAnimating ?? true}
         animationDuration={500}
         linkSafety={{
           enabled: false,
diff --git a/web-app/src/hooks/use-chat.ts b/web-app/src/hooks/use-chat.ts
@@ -126,6 +126,10 @@ export function useChat(
     }
   }, [mcpToolNames, ragToolNames])
 
+  const setContinueFromContent = useCallback((content: string) => {
+    transportRef.current?.setContinueFromContent(content)
+  }, [])
+
   // Expose method to update RAG tools availability
   const updateRagToolsAvailability = useCallback(
     async (
@@ -147,5 +151,6 @@ export function useChat(
   return {
     ...chatResult,
     updateRagToolsAvailability,
+    setContinueFromContent,
   }
 }
diff --git a/web-app/src/lib/custom-chat-transport.ts b/web-app/src/lib/custom-chat-transport.ts
@@ -48,6 +48,38 @@ export type ServiceHub = {
   }
 }
 
+/**
+ * Wraps a UIMessageChunk stream so that, right after its first `text-start`
+ * chunk, a `text-delta` carrying `prefixText` is injected into the same text
+ * block; all chunks from the source are forwarded unchanged and in order.
+ * If the source never emits `text-start`, the prefix is never emitted.
+ * Cancelling the returned stream cancels the source with the same reason.
+ */
+function prependTextDeltaToUIStream(
+  stream: ReadableStream<UIMessageChunk>,
+  prefixText: string
+): ReadableStream<UIMessageChunk> {
+  const reader = stream.getReader()
+  let prefixEmitted = false
+  return new ReadableStream<UIMessageChunk>({
+    async pull(controller) {
+      const { done, value } = await reader.read()
+      if (done) {
+        controller.close()
+        return
+      }
+      controller.enqueue(value)
+      if (!prefixEmitted && (value as { type: string }).type === 'text-start') {
+        prefixEmitted = true
+        const id = (value as { type: 'text-start'; id: string }).id
+        controller.enqueue({ type: 'text-delta', id, delta: prefixText } as UIMessageChunk)
+      }
+    },
+    // Propagate the reason and the upstream cancel result to the caller.
+    cancel: (reason?: unknown) => reader.cancel(reason),
+  })
+}
+
 export class CustomChatTransport implements ChatTransport<UIMessage> {
   public model: LanguageModel | null = null
   private tools: Record<string, Tool> = {}
@@ -58,6 +90,7 @@ export class CustomChatTransport implements ChatTransport<UIMessage> {
   private systemMessage?: string
   private serviceHub: ServiceHub | null
   private threadId?: string
+  private continueFromContent: string | null = null
 
   constructor(systemMessage?: string, threadId?: string) {
     this.systemMessage = systemMessage
@@ -213,6 +246,14 @@ export class CustomChatTransport implements ChatTransport<UIMessage> {
     return this.tools
   }
 
+  /**
+   * Stores partial assistant text for `sendMessages` to append as a trailing
+   * assistant prefill on its next call; `sendMessages` clears it once read.
+   */
+  setContinueFromContent(content: string): void {
+    this.continueFromContent = content
+  }
+
   async sendMessages(
     options: {
       chatId: string
@@ -258,10 +299,18 @@ export class CustomChatTransport implements ChatTransport<UIMessage> {
     }
 
     // Convert UI messages to model messages
-    const modelMessages = convertToModelMessages(
+    const baseMessages = convertToModelMessages(
       this.mapUserInlineAttachments(options.messages)
     )
 
+    // If continuing a truncated response, append the partial assistant content as a
+    // prefill so the model resumes from where it left off rather than regenerating.
+    const continueContent = this.continueFromContent
+    this.continueFromContent = null
+    const modelMessages = continueContent
+      ? [...baseMessages, { role: 'assistant' as const, content: continueContent }]
+      : baseMessages
+
     // Include tools only if we have tools loaded AND model supports them
     const hasTools = Object.keys(this.tools).length > 0
     const selectedModel = useModelProvider.getState().selectedModel
@@ -282,7 +331,7 @@ export class CustomChatTransport implements ChatTransport<UIMessage> {
 
     let tokensPerSecond = 0
 
-    return result.toUIMessageStream({
+    const uiStream = result.toUIMessageStream({
       messageMetadata: ({ part }) => {
         // Track stream start time on start
         if (part.type === 'start' && !streamStartTime) {
@@ -320,6 +369,7 @@ export class CustomChatTransport implements ChatTransport<UIMessage> {
           }
 
           return {
+            finishReason: finishPart.finishReason,
             usage: {
               inputTokens: inputTokens,
               outputTokens: outputTokens,
@@ -364,6 +414,13 @@ export class CustomChatTransport implements ChatTransport<UIMessage> {
         }
       },
     })
+
+    // When continuing a truncated response, inject the partial content as the
+    // very first text-delta so the new message immediately shows it and the
+    // user sees a seamless continuation rather than an empty box.
+    return continueContent
+      ? prependTextDeltaToUIStream(uiStream, continueContent)
+      : uiStream
   }
 
   async reconnectToStream(
diff --git a/web-app/src/routes/threads/$threadId.tsx b/web-app/src/routes/threads/$threadId.tsx

Original file line number	Diff line number	Diff line change
`@@ -126,6 +126,10 @@ export function useChat(`
`126`	`126`	`}`
`127`	`127`	`}, [mcpToolNames, ragToolNames])`
`128`	`128`
	`129`	`+ const setContinueFromContent = useCallback((content: string) => {`
	`130`	`+ transportRef.current?.setContinueFromContent(content)`
	`131`	`+ }, [])`
	`132`	`+`
`129`	`133`	`// Expose method to update RAG tools availability`
`130`	`134`	`const updateRagToolsAvailability = useCallback(`
`131`	`135`	`async (`
`@@ -147,5 +151,6 @@ export function useChat(`
`147`	`151`	`return {`
`148`	`152`	`...chatResult,`
`149`	`153`	`updateRagToolsAvailability,`
	`154`	`+ setContinueFromContent,`
`150`	`155`	`}`
`151`	`156`	`}`