Skip to content

Commit f01c674

Browse files
committed
[TRTLLM-9493][feat] Custom AllToAll for helix parallelism
Signed-off-by: Balaram Buddharaju <169953907+brb-nv@users.noreply.github.com>
1 parent 20b69a9 commit f01c674

File tree

9 files changed

+1522
-38
lines changed

9 files changed

+1522
-38
lines changed

cpp/tensorrt_llm/common/envUtils.cpp

Lines changed: 6 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -554,6 +554,12 @@ bool getEnvEplbForceGdrcopy()
554554
return getBoolEnv("TRTLLM_EPLB_FORCE_GDRCOPY");
555555
}
556556

557+
// Reports the value of the TRTLLM_USE_NCCL_FOR_HELIX environment variable as
// interpreted by getBoolEnv.
bool getEnvUseNcclForHelix()
558+
{
559+
// Function-local static: the initializer runs on the first call only, so later
// changes to the environment variable are not observed by this function.
static bool const useNcclForHelix = getBoolEnv("TRTLLM_USE_NCCL_FOR_HELIX");
560+
return useNcclForHelix;
561+
}
562+
557563
} // namespace common
558564

559565
TRTLLM_NAMESPACE_END

cpp/tensorrt_llm/common/envUtils.h

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -161,6 +161,9 @@ bool getEnvKVCacheTransferAllBlocksForWindow();
161161

162162
bool getEnvEplbForceGdrcopy();
163163

164+
// Whether to use NCCL-based all-to-all for Helix parallelism; controlled by the TRTLLM_USE_NCCL_FOR_HELIX environment variable.
165+
bool getEnvUseNcclForHelix();
166+
164167
} // namespace common
165168

166169
TRTLLM_NAMESPACE_END

0 commit comments

Comments
 (0)