File tree Expand file tree Collapse file tree 2 files changed +7
-0
lines changed Expand file tree Collapse file tree 2 files changed +7
-0
lines changed Original file line number Diff line number Diff line change @@ -127,6 +127,12 @@ def _init_cache(self) -> None:
127127 # FIXME(woosuk): Change to debug log.
128128 logger .info (f'# GPU blocks: { num_gpu_blocks } , '
129129 f'# CPU blocks: { num_cpu_blocks } ' )
130+
131+ if num_gpu_blocks <= 0 or num_cpu_blocks <= 0 :
132+ raise ValueError ("No available memory for the cache blocks. "
133+ "Try increasing `gpu_memory_utilization` when "
134+ "initializing the engine." )
135+
130136 self .cache_config .num_gpu_blocks = num_gpu_blocks
131137 self .cache_config .num_cpu_blocks = num_cpu_blocks
132138
Original file line number Diff line number Diff line change @@ -53,6 +53,7 @@ class RequestOutput:
5353 prompt: The prompt string of the request.
5454 prompt_token_ids: The token IDs of the prompt.
5555 outputs: The output sequences of the request.
56+ finished: Whether the whole request is finished.
5657 """
5758 def __init__ (
5859 self ,
You can’t perform that action at this time.
0 commit comments