diff --git a/nanovllm/engine/scheduler.py b/nanovllm/engine/scheduler.py index 5bc19fe..f2eabdf 100644 --- a/nanovllm/engine/scheduler.py +++ b/nanovllm/engine/scheduler.py @@ -62,7 +62,7 @@ class Scheduler: self.block_manager.deallocate(seq) self.waiting.appendleft(seq) - def postprocess(self, seqs: list[Sequence], token_ids: list[int]) -> list[bool]: + def postprocess(self, seqs: list[Sequence], token_ids: list[int]): for seq, token_id in zip(seqs, token_ids): seq.append_token(token_id) if (not seq.ignore_eos and token_id == self.eos) or seq.num_completion_tokens == seq.max_tokens: