We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c3261f2, commit e68d9a5. Copy full SHA for e68d9a5
vllm/v1/attention/backends/mla/rocm_aiter_mla_sparse.py
@@ -143,7 +143,7 @@ class ROCMAiterMLASparseMetadata:
143
class ROCMAiterMLASparseMetadataBuilder(
144
AttentionMetadataBuilder[ROCMAiterMLASparseMetadata]
145
):
146
- cudagraph_support: ClassVar[AttentionCGSupport] = (
+ _cudagraph_support: ClassVar[AttentionCGSupport] = (
147
AttentionCGSupport.UNIFORM_SINGLE_TOKEN_DECODE
148
)
149
0 commit comments