We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent eab8bf7, commit 495fcdf. Copy full SHA for 495fcdf.
src/llmcompressor/modifiers/quantization/cache.py
@@ -9,7 +9,7 @@
9
10
from typing import Any, Dict, List, Optional, Tuple
11
12
-from compressed_tensors.quantization.lifecycle import KVCacheScaleType
+from compressed_tensors.quantization import KVCacheScaleType
13
from compressed_tensors.quantization.quant_args import QuantizationArgs
14
from torch import Tensor
15
from transformers import DynamicCache
0 commit comments