Skip to content

Commit 5f55640

Browse files
committed
fix gen_cubins.py
Signed-off-by: Pengbo Wang <221450789+pengbowang-nv@users.noreply.github.com>
1 parent 8c3aab8 commit 5f55640

File tree

1 file changed

+6
-4
lines changed

1 file changed

+6
-4
lines changed

cpp/kernels/xqa/gen_cubins.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -89,7 +89,8 @@
8989
9090
#include "tensorrt_llm/common/config.h"
9191
92-
TRTLLM_NAMESPACE_BEGIN
92+
namespace tensorrt_llm
93+
{
9394
namespace kernels
9495
{
9596
// clang-format off
@@ -98,7 +99,7 @@
9899
cpp_file_suffex_text = R"""
99100
// clang-format on
100101
} // namespace kernels
101-
TRTLLM_NAMESPACE_END
102+
}
102103
"""
103104

104105
cubin_meta_info_struct_prefix_text = R"""
@@ -438,8 +439,9 @@ def generate_header_file_contents(
438439
CompileMacroOption('HEAD_ELEMS', 'd', [128]),
439440
CompileMacroOption('BEAM_WIDTH', 'beam', [1]),
440441
CompileMacroOption('CACHE_ELEM_ENUM', 'kvt', [0, 1, 2]),
441-
CompileMacroOption('TOKENS_PER_PAGE', 'pagedKV',
442-
[0, 64, 128]), # 0 denotes contiguous kv cache.
442+
CompileMacroOption(
443+
'TOKENS_PER_PAGE', 'pagedKV',
444+
[0, 32, 64, 128]), # 0 denotes contiguous kv cache.
443445
CompileMacroOption('HEAD_GRP_SIZE', 'nqpkv', [0]),
444446
CompileMacroOption('M_TILESIZE', 'm', [16, 32]),
445447
]]

0 commit comments

Comments
 (0)