diff --git a/fastdeploy/scheduler/splitwise_scheduler.py b/fastdeploy/scheduler/splitwise_scheduler.py index 94c947ea49f..83f763ad454 100644 --- a/fastdeploy/scheduler/splitwise_scheduler.py +++ b/fastdeploy/scheduler/splitwise_scheduler.py @@ -859,7 +859,7 @@ def get_requests( self.reqs_queue.appendleft(req) break else: - if current_prefill_tokens > max_num_batched_tokens: + if current_prefill_tokens > max_num_batched_tokens and len(reqs) > 0: self.reqs_queue.appendleft(req) break # logger.info(f"Get Requests from Scheduler: {req.request_id}")