-
Notifications
You must be signed in to change notification settings - Fork 838
Preserve function content in SummarizingChatReducer
#6908
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -2,6 +2,7 @@ | |
// The .NET Foundation licenses this file to you under the MIT license. | ||
|
||
using System.Collections.Generic; | ||
using System.Diagnostics; | ||
using System.Diagnostics.CodeAnalysis; | ||
using System.Linq; | ||
using System.Threading; | ||
|
@@ -73,18 +74,24 @@ public async Task<IEnumerable<ChatMessage>> ReduceAsync(IEnumerable<ChatMessage> | |
{ | ||
_ = Throw.IfNull(messages); | ||
|
||
var summarizedConversion = SummarizedConversation.FromChatMessages(messages); | ||
if (summarizedConversion.ShouldResummarize(_targetCount, _thresholdCount)) | ||
var summarizedConversation = SummarizedConversation.FromChatMessages(messages); | ||
var indexOfFirstMessageToKeep = summarizedConversation.FindIndexOfFirstMessageToKeep(_targetCount, _thresholdCount); | ||
if (indexOfFirstMessageToKeep > 0) | ||
{ | ||
summarizedConversion = await summarizedConversion.ResummarizeAsync( | ||
_chatClient, _targetCount, SummarizationPrompt, cancellationToken); | ||
summarizedConversation = await summarizedConversation.ResummarizeAsync( | ||
_chatClient, | ||
indexOfFirstMessageToKeep, | ||
SummarizationPrompt, | ||
cancellationToken); | ||
} | ||
|
||
return summarizedConversion.ToChatMessages(); | ||
return summarizedConversation.ToChatMessages(); | ||
} | ||
|
||
/// <summary>Represents a conversation with an optional summary.</summary> | ||
private readonly struct SummarizedConversation(string? summary, ChatMessage? systemMessage, IList<ChatMessage> unsummarizedMessages) | ||
{ | ||
/// <summary>Creates a <see cref="SummarizedConversation"/> from a list of chat messages.</summary> | ||
public static SummarizedConversation FromChatMessages(IEnumerable<ChatMessage> messages) | ||
{ | ||
string? summary = null; | ||
|
@@ -102,7 +109,7 @@ public static SummarizedConversation FromChatMessages(IEnumerable<ChatMessage> m | |
unsummarizedMessages.Clear(); | ||
summary = summaryValue; | ||
} | ||
else if (!message.Contents.Any(m => m is FunctionCallContent or FunctionResultContent)) | ||
else | ||
{ | ||
unsummarizedMessages.Add(message); | ||
} | ||
|
@@ -111,31 +118,68 @@ public static SummarizedConversation FromChatMessages(IEnumerable<ChatMessage> m | |
return new(summary, systemMessage, unsummarizedMessages); | ||
} | ||
|
||
public bool ShouldResummarize(int targetCount, int thresholdCount) | ||
=> unsummarizedMessages.Count > targetCount + thresholdCount; | ||
|
||
public async Task<SummarizedConversation> ResummarizeAsync( | ||
IChatClient chatClient, int targetCount, string summarizationPrompt, CancellationToken cancellationToken) | ||
/// <summary>Performs summarization by calling the chat client and updating the conversation state.</summary> | ||
public async ValueTask<SummarizedConversation> ResummarizeAsync( | ||
IChatClient chatClient, int indexOfFirstMessageToKeep, string summarizationPrompt, CancellationToken cancellationToken) | ||
{ | ||
var messagesToResummarize = unsummarizedMessages.Count - targetCount; | ||
if (messagesToResummarize <= 0) | ||
{ | ||
// We're at or below the target count - no need to resummarize. | ||
return this; | ||
} | ||
Debug.Assert(indexOfFirstMessageToKeep > 0, "Expected positive index for first message to keep."); | ||
|
||
var summarizerChatMessages = ToSummarizerChatMessages(messagesToResummarize, summarizationPrompt); | ||
// Generate the summary by sending unsummarized messages to the chat client | ||
var summarizerChatMessages = ToSummarizerChatMessages(indexOfFirstMessageToKeep, summarizationPrompt); | ||
var response = await chatClient.GetResponseAsync(summarizerChatMessages, cancellationToken: cancellationToken); | ||
var newSummary = response.Text; | ||
|
||
var lastSummarizedMessage = unsummarizedMessages[messagesToResummarize - 1]; | ||
// Attach the summary metadata to the last message being summarized | ||
// This is what allows us to build on previously-generated summaries | ||
var lastSummarizedMessage = unsummarizedMessages[indexOfFirstMessageToKeep - 1]; | ||
var additionalProperties = lastSummarizedMessage.AdditionalProperties ??= []; | ||
additionalProperties[SummaryKey] = newSummary; | ||
|
||
var newUnsummarizedMessages = unsummarizedMessages.Skip(messagesToResummarize).ToList(); | ||
// Compute the new list of unsummarized messages | ||
var newUnsummarizedMessages = unsummarizedMessages.Skip(indexOfFirstMessageToKeep).ToList(); | ||
return new SummarizedConversation(newSummary, systemMessage, newUnsummarizedMessages); | ||
} | ||
|
||
/// <summary>Determines the index of the first message to keep (not summarize) based on target and threshold counts.</summary> | ||
public int FindIndexOfFirstMessageToKeep(int targetCount, int thresholdCount) | ||
{ | ||
var earliestAllowedIndex = unsummarizedMessages.Count - thresholdCount - targetCount; | ||
if (earliestAllowedIndex <= 0) | ||
{ | ||
// Not enough messages to warrant summarization | ||
return 0; | ||
} | ||
|
||
// Start at the ideal cut point (keeping exactly targetCount messages) | ||
var indexOfFirstMessageToKeep = unsummarizedMessages.Count - targetCount; | ||
|
||
// Move backward to skip over function call/result content at the boundary | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. So is this never getting rid of any FunctionCallContent/FunctionResultContent? Does that mean that in a really long conversation we could end up with lots and lots of these and eventually still overflow the context window? |
||
// We want to keep complete function call sequences together with their responses | ||
while (indexOfFirstMessageToKeep > 0) | ||
{ | ||
if (!unsummarizedMessages[indexOfFirstMessageToKeep - 1].Contents.Any(c => c is FunctionCallContent or FunctionResultContent)) | ||
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. There are also UserInputRequestContent / UserInputResponseContent. Does this need to pay attention to those as well? |
||
{ | ||
break; | ||
} | ||
|
||
indexOfFirstMessageToKeep--; | ||
} | ||
|
||
// Search backward within the threshold window to find a User message | ||
// If found, cut right before it to avoid orphaning user questions from responses | ||
for (var i = indexOfFirstMessageToKeep; i >= earliestAllowedIndex; i--) | ||
{ | ||
if (unsummarizedMessages[i].Role == ChatRole.User) | ||
{ | ||
return i; | ||
} | ||
} | ||
|
||
// No User message found within threshold - use the adjusted cut point | ||
return indexOfFirstMessageToKeep; | ||
} | ||
|
||
/// <summary>Converts the summarized conversation back into a collection of chat messages.</summary> | ||
public IEnumerable<ChatMessage> ToChatMessages() | ||
{ | ||
if (systemMessage is not null) | ||
|
@@ -154,16 +198,21 @@ public IEnumerable<ChatMessage> ToChatMessages() | |
} | ||
} | ||
|
||
private IEnumerable<ChatMessage> ToSummarizerChatMessages(int messagesToResummarize, string summarizationPrompt) | ||
/// <summary>Builds the list of messages to send to the chat client for summarization.</summary> | ||
private IEnumerable<ChatMessage> ToSummarizerChatMessages(int indexOfFirstMessageToKeep, string summarizationPrompt) | ||
{ | ||
if (summary is not null) | ||
{ | ||
yield return new ChatMessage(ChatRole.Assistant, summary); | ||
} | ||
|
||
for (var i = 0; i < messagesToResummarize; i++) | ||
for (var i = 0; i < indexOfFirstMessageToKeep; i++) | ||
{ | ||
yield return unsummarizedMessages[i]; | ||
var message = unsummarizedMessages[i]; | ||
if (!message.Contents.Any(c => c is FunctionCallContent or FunctionResultContent)) | ||
{ | ||
yield return message; | ||
} | ||
} | ||
|
||
yield return new ChatMessage(ChatRole.System, summarizationPrompt); | ||
|
Uh oh!
There was an error while loading. Please reload this page.