We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 5c71cce, commit 506a32c (Copy full SHA for 506a32c)
lightllm/common/basemodel/triton_kernel/kv_cache_offload.py
@@ -173,9 +173,9 @@ def _offload_gpu_kv_to_cpu(
 def offload_gpu_kv_to_cpu(
     token_indexes: torch.Tensor,
     gpu_kv_cache: torch.Tensor,
-    gpu_kv_cache_scale: torch.Tensor,
+    gpu_kv_cache_scale: Optional[torch.Tensor],
     cpu_kv_cache: torch.Tensor,
-    cpu_kv_cache_scale: torch.Tensor,
+    cpu_kv_cache_scale: Optional[torch.Tensor],
     page_indexes: torch.Tensor,
     page_readies: torch.Tensor,
     tp_index: int,
0 commit comments