Skip to content

Commit fa9bee7

Browse files
suyoggupta authored and lucaslie committed
[None][chore] AutoDeploy update cuda stream manager for multi-device (NVIDIA#9575)
Signed-off-by: Suyog Gupta <41447211+suyoggupta@users.noreply.github.com>
1 parent 0032fe0 commit fa9bee7

File tree

4 files changed

+270
-252
lines changed

4 files changed

+270
-252
lines changed

tensorrt_llm/_torch/auto_deploy/custom_ops/attention_interface.py

Lines changed: 1 addition & 9 deletions
Original file line number | Diff line number | Diff line change
@@ -615,15 +615,7 @@ def _store_extra_arg(
615615

616616
@nvtx_range("ad_get_unique_value")
617617
def _get_unique_value(self, occupied: Set[int], max_val: int) -> int:
618-
"""Get un unoccupied value from the range indicated by max_val.
619-
620-
In addition, this function performs a sanity check to ensure that no value in the occupied
621-
set is out of bounds.
622-
"""
623-
# Validate without materializing the full range set
624-
out_of_range = [v for v in occupied if v < 0 or v >= max_val]
625-
assert not out_of_range, f"Out of range values: {out_of_range}"
626-
618+
"""Get un unoccupied value from the range indicated by max_val."""
627619
# Return the smallest free value; fall back to 0 if none
628620
for candidate in range(max_val):
629621
if candidate not in occupied:

tensorrt_llm/_torch/auto_deploy/custom_ops/multi_stream.py

Lines changed: 0 additions & 235 deletions
This file was deleted.

0 commit comments

Comments
 (0)