File tree Expand file tree Collapse file tree 2 files changed +7
-0
lines changed Expand file tree Collapse file tree 2 files changed +7
-0
lines changed Original file line number Diff line number Diff line change @@ -127,6 +127,12 @@ def _init_cache(self) -> None:
127
127
# FIXME(woosuk): Change to debug log.
128
128
logger .info (f'# GPU blocks: { num_gpu_blocks } , '
129
129
f'# CPU blocks: { num_cpu_blocks } ' )
130
+
131
+ if num_gpu_blocks <= 0 or num_cpu_blocks <= 0 :
132
+ raise ValueError ("No available memory for the cache blocks. "
133
+ "Try increasing `gpu_memory_utilization` when "
134
+ "initializing the engine." )
135
+
130
136
self .cache_config .num_gpu_blocks = num_gpu_blocks
131
137
self .cache_config .num_cpu_blocks = num_cpu_blocks
132
138
Original file line number Diff line number Diff line change @@ -53,6 +53,7 @@ class RequestOutput:
53
53
prompt: The prompt string of the request.
54
54
prompt_token_ids: The token IDs of the prompt.
55
55
outputs: The output sequences of the request.
56
+ finished: Whether the whole request is finished.
56
57
"""
57
58
def __init__ (
58
59
self ,
You can’t perform that action at this time.
0 commit comments