
Commit 3f6bff0

minor clean up
Signed-off-by: Balaram Buddharaju <169953907+brb-nv@users.noreply.github.com>
1 parent: 63b55f5

2 files changed (+3, -6 lines)

tensorrt_llm/_torch/distributed/communicator.py

Lines changed: 0 additions & 1 deletion

@@ -1,4 +1,3 @@
-import copy
 import math
 import pickle  # nosec B403
 from abc import ABC, abstractmethod

tensorrt_llm/_torch/pyexecutor/executor_request_queue.py

Lines changed: 3 additions & 5 deletions

@@ -372,8 +372,6 @@ def _fetch_new_requests_attention_dp(
             responses_list = self.dist.tp_cp_allgather(
                 [len(activate_requests), num_active_tokens])
 
-            # @B: Do we really need to check for all CP ranks? Should num_tokens be 1
-            # for all generation requests?
             aggregated_responses = []
             for dp_group_idx in range(self.dist.tp_size):
                 # Get all entries for this DP group (cp_size entries per group).
@@ -385,9 +383,9 @@ def _fetch_new_requests_attention_dp(
                 assert all(entry[0] == group_entries[0][0] for entry in group_entries), \
                     f"CP ranks within DP group {dp_group_idx} have mismatched request counts: " \
                     f"{[entry[0] for entry in group_entries]}"
-                # Sum the token counts across CP ranks (sequence is split).
-                total_tokens = sum(entry[1] for entry in group_entries)
-                aggregated_responses.append([group_entries[0][0], total_tokens])
+                # Use token count from cp_rank0.
+                aggregated_responses.append(
+                    [group_entries[0][0], group_entries[0][1]])
             responses_list = aggregated_responses
         else:
             responses_list = self.dist.tp_allgather(
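For readers skimming the diff: the change replaces summing token counts across CP ranks with taking cp_rank0's token count when collapsing the allgathered per-rank stats into one entry per DP group. Below is a minimal, self-contained sketch of that aggregation; the standalone function name, the flat cp_size-entries-per-group layout, and the example numbers are assumptions for illustration, not the actual TensorRT-LLM code.

```python
# Hypothetical sketch of the post-commit aggregation in
# _fetch_new_requests_attention_dp (not the real TensorRT-LLM code).
# Assumes the allgather yields one [request_count, token_count] pair
# per rank, with cp_size consecutive entries per DP group.

def aggregate_responses(responses_list, tp_size, cp_size):
    aggregated = []
    for dp_group_idx in range(tp_size):
        # Slice out the cp_size entries belonging to this DP group.
        start = dp_group_idx * cp_size
        group_entries = responses_list[start:start + cp_size]
        # All CP ranks within a DP group must report the same request count.
        assert all(e[0] == group_entries[0][0] for e in group_entries), \
            f"CP ranks within DP group {dp_group_idx} have mismatched " \
            f"request counts: {[e[0] for e in group_entries]}"
        # Post-commit behavior: use cp_rank0's token count rather than
        # summing token counts across CP ranks.
        aggregated.append([group_entries[0][0], group_entries[0][1]])
    return aggregated

# Two DP groups with two CP ranks each (made-up numbers).
responses = [[3, 128], [3, 128], [1, 32], [1, 32]]
print(aggregate_responses(responses, tp_size=2, cp_size=2))
# -> [[3, 128], [1, 32]]
```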
