We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f520182 commit 799a339 (Copy full SHA for 799a339)
tensorrt_llm/_torch/pyexecutor/executor_request_queue.py
@@ -384,8 +384,7 @@ def _fetch_new_requests_attention_dp(
384
f"CP ranks within DP group {dp_group_idx} have mismatched request counts: " \
385
f"{[entry[0] for entry in group_entries]}"
386
# Use token count from cp_rank0.
387
- aggregated_responses.append(
388
- [group_entries[0][0], group_entries[0][1]])
+ aggregated_responses.append(group_entries[0])
389
responses_list = aggregated_responses
390
else:
391
responses_list = self.dist.tp_allgather(
0 commit comments