65 changes: 63 additions & 2 deletions lib/llm/src/protocols/openai/chat_completions/jail.rs
@@ -370,12 +370,17 @@ impl ChoiceJailState {
struct ChoiceJailStateCollection {
/// Vec of states, always kept sorted by choice index for deterministic iteration
states: Vec<ChoiceJailState>,
/// Track if any choice has emitted a finish_reason (per choice index)
finish_reason_emitted: std::collections::HashMap<u32, bool>,
}

impl ChoiceJailStateCollection {
/// Create a new empty collection
fn new() -> Self {
Self { states: Vec::new() }
Self {
states: Vec::new(),
finish_reason_emitted: std::collections::HashMap::new(),
}
}

/// Get or create state for a choice index
@@ -394,6 +399,19 @@ impl ChoiceJailStateCollection {
}
}
}

/// Check if a finish_reason has already been emitted for this choice
fn has_emitted_finish_reason(&self, index: u32) -> bool {
self.finish_reason_emitted
.get(&index)
.copied()
.unwrap_or(false)
}

/// Mark that a finish_reason has been emitted for this choice
fn mark_finish_reason_emitted(&mut self, index: u32) {
self.finish_reason_emitted.insert(index, true);
}
}

/// Emission mode for handling multiple choices
@@ -456,6 +474,17 @@ impl JailedStream {

// Process each choice independently using the new architecture
for choice in &chat_response.choices {
// if we've already emitted a finish_reason for this choice,
// skip any subsequent chunks with finish_reason
if choice.finish_reason.is_some() && choice_states.has_emitted_finish_reason(choice.index) {
tracing::debug!(
"Skipping chunk with finish_reason {:?} for choice {} - already emitted finish_reason",
choice.finish_reason,
choice.index
);
continue;
}
Contributor:

At a glance, the logic in vllm seems to be that they actually emit finish_reason=stop, but they replace it with finish_reason=tool_calls if it came from a tool calls response: https://github.com/vllm-project/vllm/blob/a404e2c0f1bf100d28453a5a2ab7bd2a29d9aa31/vllm/entrypoints/openai/serving_chat.py#L1512-L1529

Here we seem to generate an extra chunk even though we've already "finished" the response - are we doing something wrong? Are we hiding a bug by doing this marking/filtering? Why are we emitting 2 "finish" responses in general?

Contributor @rmccorm4 commented on Nov 6, 2025:

TL;DR:

  • It seems like vllm emits 1 final response and contextually rewrites its finish_reason for tool calling.
  • It seems like we are emitting 2 or more final responses, and just skipping/hiding the extras here. This feels off to me, unless I'm missing something and other solutions do this too. Why don't we (aggregator, postprocessor, engine, etc.) know that we're done after emitting the finish_reason=tool_calls response?
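The vLLM behavior described above can be sketched in simplified form. The types below are hypothetical stand-ins (not the actual dynamo or vllm types); the point is only that vllm rewrites the single final finish_reason instead of emitting a second final chunk:

```rust
// Hypothetical sketch of vLLM's approach: the engine emits one final chunk
// with finish_reason = Stop, and the serving layer rewrites it to ToolCalls
// when the response produced tool calls. Simplified types for illustration.
#[derive(Debug, PartialEq, Clone, Copy)]
enum FinishReason {
    Stop,
    ToolCalls,
}

// Rewrite the engine's final finish_reason contextually, mirroring the
// linked serving_chat.py logic.
fn final_finish_reason(engine_reason: FinishReason, emitted_tool_calls: bool) -> FinishReason {
    if emitted_tool_calls && engine_reason == FinishReason::Stop {
        FinishReason::ToolCalls
    } else {
        engine_reason
    }
}

fn main() {
    // Tool-call stream: the single Stop chunk becomes ToolCalls.
    assert_eq!(
        final_finish_reason(FinishReason::Stop, true),
        FinishReason::ToolCalls
    );
    // Plain stream: Stop passes through unchanged.
    assert_eq!(
        final_finish_reason(FinishReason::Stop, false),
        FinishReason::Stop
    );
}
```

With this shape there is only ever one finish_reason chunk per choice, so no downstream filtering is needed.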

Contributor (PR author):

Actually, yes. There is always one empty chunk emitted at the end of the stream, and in some cases trailing leftover markers are emitted as well.

I haven't seen any stream continue after tool calls, so for now this is a safe fix to have.

Contributor:

Normally, SGLang/vLLM returns a chunk with empty content carrying finish_reason=stop at the end of a streaming request. (In special cases, such as when speculative sampling is enabled or when the output reaches max_tokens, the last chunk's content is not empty.)

When we enable tool calling and JailedStream, chunks with non-empty content are processed by JailedStream and merged into a single tool-call chunk with finish_reason == "tool_calls", but the empty-content chunk (carrying finish_reason == "stop") is passed through directly. This is why we observe two chunks with a finish_reason.
@rmccorm4 @ayushag-nv
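A minimal model of the marking/filtering the PR implements, using hypothetical simplified types (the real code tracks this in ChoiceJailStateCollection):

```rust
use std::collections::HashSet;

// Hypothetical minimal model of the PR's filtering: once a choice has
// emitted a finish_reason (e.g. the merged tool_calls chunk), any later
// chunk carrying a finish_reason for that choice (the engine's trailing
// empty stop chunk) is dropped.
#[derive(Default)]
struct FinishTracker {
    emitted: HashSet<u32>,
}

impl FinishTracker {
    /// Returns true if a chunk with a finish_reason for `choice_index`
    /// should be forwarded; the first call marks the choice as finished.
    /// (HashSet::insert returns true only on first insertion.)
    fn should_emit(&mut self, choice_index: u32) -> bool {
        self.emitted.insert(choice_index)
    }
}

fn main() {
    let mut tracker = FinishTracker::default();
    assert!(tracker.should_emit(0)); // first finish_reason: forwarded
    assert!(!tracker.should_emit(0)); // trailing stop chunk: filtered
    assert!(tracker.should_emit(1)); // tracked independently per choice
}
```

A HashSet suffices here because only the presence of an index matters; the PR's HashMap<u32, bool> stores an always-true value, which is equivalent.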

Contributor:

[screenshot attached] Is there a simpler way to solve this problem by directly skipping the empty packet?
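That suggestion might look roughly like the sketch below (hypothetical simplified types). Whether it is safe depends on the caveat raised earlier: with speculative sampling or a max_tokens cutoff, the final packet's content may be non-empty, so an empty-content check alone would miss it.

```rust
// Hypothetical sketch of the alternative: drop the trailing packet directly
// when its content is empty and it carries finish_reason = Stop, instead of
// tracking per-choice emission state. Simplified types for illustration.
#[derive(Debug, PartialEq, Clone, Copy)]
#[allow(dead_code)]
enum FinishReason {
    Stop,
    ToolCalls,
}

struct Choice {
    content: Option<String>,
    finish_reason: Option<FinishReason>,
}

// True for the engine's usual trailing packet: no content, finish_reason=stop.
// Caveat: a non-empty final packet (speculative sampling, max_tokens) would
// not match this check and its Stop finish_reason would still pass through.
fn is_trailing_empty_stop(choice: &Choice) -> bool {
    choice.content.as_deref().map_or(true, str::is_empty)
        && choice.finish_reason == Some(FinishReason::Stop)
}

fn main() {
    let trailing = Choice {
        content: None,
        finish_reason: Some(FinishReason::Stop),
    };
    let normal = Choice {
        content: Some("hi".into()),
        finish_reason: None,
    };
    assert!(is_trailing_empty_stop(&trailing)); // would be skipped
    assert!(!is_trailing_empty_stop(&normal)); // forwarded as usual
}
```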


if let Some(ref content) = choice.delta.content {
let choice_state = choice_states.get_or_create_state(choice.index);

@@ -509,8 +538,16 @@ impl JailedStream {
last_annotated_event.clone(),
last_annotated_comment.clone(),
);
let responses = self.emit_choice_emissions(tool_content_emissions, chat_response, preserved_metadata);
let responses = self.emit_choice_emissions(tool_content_emissions.clone(), chat_response, preserved_metadata);
for emitted_response in responses {
// Mark finish_reason as emitted for choices that have it
if let Some(ref data) = emitted_response.data {
for choice in &data.choices {
if choice.finish_reason.is_some() {
choice_states.mark_finish_reason_emitted(choice.index);
}
}
}
yield emitted_response;
}
}
@@ -524,6 +561,14 @@ impl JailedStream {
);
let responses = self.emit_choice_emissions(trailing_emissions, chat_response, preserved_metadata);
for emitted_response in responses {
// Mark finish_reason as emitted for choices that have it
if let Some(ref data) = emitted_response.data {
for choice in &data.choices {
if choice.finish_reason.is_some() {
choice_states.mark_finish_reason_emitted(choice.index);
}
}
}
yield emitted_response;
}
}
@@ -533,6 +578,14 @@ impl JailedStream {
let current_metadata = (response.id.clone(), response.event.clone(), response.comment.clone());
let responses = self.emit_choice_emissions(passthrough_emissions, chat_response, current_metadata);
for emitted_response in responses {
// Mark finish_reason as emitted for choices that have it
if let Some(ref data) = emitted_response.data {
for choice in &data.choices {
if choice.finish_reason.is_some() {
choice_states.mark_finish_reason_emitted(choice.index);
}
}
}
yield emitted_response;
}
}
@@ -568,6 +621,14 @@ impl JailedStream {
let final_metadata = (last_annotated_id, last_annotated_event, last_annotated_comment);
let responses = self.emit_choice_emissions(final_emissions, &dummy_response, final_metadata);
for emitted_response in responses {
// Mark finish_reason as emitted for choices that have it
if let Some(ref data) = emitted_response.data {
for choice in &data.choices {
if choice.finish_reason.is_some() {
choice_states.mark_finish_reason_emitted(choice.index);
}
}
}
yield emitted_response;
}
}
133 changes: 132 additions & 1 deletion lib/llm/tests/test_streaming_tool_parsers.rs
Original file line number Diff line number Diff line change
@@ -26,7 +26,7 @@ across backends.

*/

use dynamo_async_openai::types::ChatChoiceStream;
use dynamo_async_openai::types::{ChatChoiceStream, FinishReason};
use dynamo_llm::preprocessor::OpenAIPreprocessor;
use dynamo_llm::protocols::openai::chat_completions::NvCreateChatCompletionStreamResponse;
use dynamo_runtime::protocols::annotated::Annotated;
@@ -304,6 +304,18 @@ mod tests {
aggregated.has_tool_calls, expected_has_tool_calls,
"Tool calls presence should match expected value"
);

// Verify last chunk has Stop finish_reason for no-tool cases
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::Stop),
"Last chunk should have Stop finish_reason for non-tool call case"
);
}
}

#[tokio::test]
@@ -360,6 +372,22 @@ mod tests {

// Verify tool calls
assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify the last chunk has ToolCalls finish_reason (empty Stop chunks should be filtered)
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::ToolCalls),
"Last chunk should have ToolCalls finish_reason (empty Stop chunks should be filtered)"
);
assert!(
choice.delta.tool_calls.is_some(),
"Last chunk with ToolCalls finish_reason must have tool_calls data"
);
}
}

#[tokio::test]
@@ -403,6 +431,18 @@ mod tests {
aggregated.has_tool_calls, expected_has_tool_calls,
"Tool calls presence should match expected value"
);

// Verify last chunk has Stop finish_reason for no-tool cases
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::Stop),
"Last chunk should have Stop finish_reason for non-tool call case"
);
}
}

#[tokio::test]
@@ -455,6 +495,22 @@ mod tests {

// Verify tool calls
assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify the last chunk has ToolCalls finish_reason (empty Stop chunks should be filtered)
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::ToolCalls),
"Last chunk should have ToolCalls finish_reason (empty Stop chunks should be filtered)"
);
assert!(
choice.delta.tool_calls.is_some(),
"Last chunk with ToolCalls finish_reason must have tool_calls data"
);
}
}

#[tokio::test]
@@ -511,6 +567,18 @@ mod tests {
);

assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify last chunk has Stop finish_reason for no-tool cases
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::Stop),
"Last chunk should have Stop finish_reason for non-tool call case"
);
}
}

#[tokio::test]
@@ -567,6 +635,23 @@ mod tests {
);

assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify there is a chunk with ToolCalls finish_reason and tool call data
let has_tool_calls_chunk = output_chunks.iter().any(|chunk| {
chunk
.data
.as_ref()
.and_then(|d| d.choices.first())
.map(|c| {
c.finish_reason == Some(FinishReason::ToolCalls)
&& c.delta.tool_calls.is_some()
})
.unwrap_or(false)
});
assert!(
has_tool_calls_chunk,
"Should have a chunk with ToolCalls finish_reason and tool_calls data"
);
}

#[tokio::test]
@@ -620,6 +705,18 @@ mod tests {
);

assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify last chunk has Stop finish_reason for no-tool cases
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::Stop),
"Last chunk should have Stop finish_reason for non-tool call case"
);
}
}

#[tokio::test]
@@ -674,6 +771,23 @@ mod tests {
"Tool calls presence should match expected value"
);
assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify there is a chunk with ToolCalls finish_reason and tool call data
let has_tool_calls_chunk = output_chunks.iter().any(|chunk| {
chunk
.data
.as_ref()
.and_then(|d| d.choices.first())
.map(|c| {
c.finish_reason == Some(FinishReason::ToolCalls)
&& c.delta.tool_calls.is_some()
})
.unwrap_or(false)
});
assert!(
has_tool_calls_chunk,
"Should have a chunk with ToolCalls finish_reason and tool_calls data"
);
}

#[tokio::test]
@@ -726,5 +840,22 @@ mod tests {

// Verify tool calls
assert_tool_calls(&aggregated.tool_calls, &test_data.expected_tool_calls);

// Verify the last chunk has ToolCalls finish_reason (empty Stop chunks should be filtered)
let last_chunk = output_chunks.last().expect("Should have at least one chunk");
if let Some(data) = &last_chunk.data
&& let Some(choice) = data.choices.first()
{
assert_eq!(
choice.finish_reason,
Some(FinishReason::ToolCalls),
"Last chunk should have ToolCalls finish_reason (empty Stop chunks should be filtered)"
);
assert!(
choice.delta.tool_calls.is_some(),
"Last chunk with ToolCalls finish_reason must have tool_calls data"
);
}
}

}