1 file changed (+6 -4 lines changed)
Original file line number | Diff line number | Diff line change
@@ -1437,10 +1437,7 @@ def schedule(self) -> SchedulerOutput:
1437
1437
token_budget = self ._estimate_token_budget ()
1438
1438
req_index = 0
1439
1439
while self .scheduled_queue :
1440
- if token_budget <= 0 :
1441
- break
1442
-
1443
- scheduled_request = self .scheduled_queue .popleft ()
1440
+ scheduled_request = self .scheduled_queue [0 ]
1444
1441
1445
1442
req_id = scheduled_request .request_id
1446
1443
num_new_tokens = scheduled_request .num_new_tokens
@@ -1451,6 +1448,11 @@ def schedule(self) -> SchedulerOutput:
1451
1448
spec_token_ids = scheduled_request .spec_token_ids
1452
1449
request_data = scheduled_request .request_data
1453
1450
1451
+ if num_scheduled_tokens and token_budget < num_new_tokens :
1452
+ break
1453
+
1454
+ self .scheduled_queue .popleft ()
1455
+
1454
1456
# requests in the scheduled_queue can also be preempted or finished.
1455
1457
if self .requests [req_id ].status >= RequestStatus .PREEMPTED :
1456
1458
continue
You can’t perform that action at this time.
0 commit comments