diff --git a/python/sglang/srt/managers/schedule_policy.py b/python/sglang/srt/managers/schedule_policy.py index 9a43121e7ab..dd663e4fed7 100644 --- a/python/sglang/srt/managers/schedule_policy.py +++ b/python/sglang/srt/managers/schedule_policy.py @@ -697,7 +697,7 @@ def preempt_to_schedule(self, req: Req, server_args: ServerArgs) -> bool: for i, running_req in enumerate(self.running_batch.reqs): if running_req in preemptible_reqs: self.rem_total_token_offset -= ( - self._get_running_request_total_token_offset(req) + self._get_running_request_total_token_offset(running_req) ) release_counter += 1 self.running_batch.release_req(