Skip to content

Commit 141afe9

Browse files
committed
[Core] Add max-waiting-queue-length parameter to reject requests when waiting queue is full
Signed-off-by: chaunceyjiang <[email protected]>
1 parent fe7708c commit 141afe9

File tree

2 files changed: +4 −4 lines changed

2 files changed

+4
-4
lines changed

vllm/entrypoints/openai/serving_completion.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -229,7 +229,7 @@ async def create_completion(
                 generators.append(generator)
         except ValueError as e:
             # TODO: Use a vllm-specific Validation Error
-            return self.create_error_response(str(e))
+            return self.create_error_response(e)

         result_generator = merge_async_iterators(*generators)

@@ -293,7 +293,7 @@ async def create_completion(
             return self.create_error_response("Client disconnected")
         except ValueError as e:
             # TODO: Use a vllm-specific Validation Error
-            return self.create_error_response(str(e))
+            return self.create_error_response(e)

         # When user requests streaming but we don't stream, we still need to
         # return a streaming response with a single event.

vllm/entrypoints/openai/serving_responses.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -187,7 +187,7 @@ async def create_responses(
                 generators.append(generator)
         except ValueError as e:
             # TODO: Use a vllm-specific Validation Error
-            return self.create_error_response(str(e))
+            return self.create_error_response(e)

         assert len(generators) == 1
         result_generator, = generators
@@ -267,7 +267,7 @@ async def responses_full_generator(
             return self.create_error_response("Client disconnected")
         except ValueError as e:
             # TODO: Use a vllm-specific Validation Error
-            return self.create_error_response(str(e))
+            return self.create_error_response(e)

         assert final_res is not None
         assert len(final_res.outputs) == 1

0 commit comments

Comments
 (0)