From 8fae5ed7f6bfd63b81310fcb24b310d9205c9687 Mon Sep 17 00:00:00 2001 From: Woo-Yeon Lee Date: Wed, 25 Sep 2024 16:53:03 +0900 Subject: [PATCH] [Misc] Fix minor typo in scheduler (#8765) --- vllm/core/scheduler.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/vllm/core/scheduler.py b/vllm/core/scheduler.py index b707d87c..873decff 100644 --- a/vllm/core/scheduler.py +++ b/vllm/core/scheduler.py @@ -1554,14 +1554,14 @@ class Scheduler: # the number of new tokens that is dividable by the block size # to avoid partial block matching. block_size = self.cache_config.block_size - reminder = budget.token_budget % block_size - if reminder != 0: + remainder = budget.token_budget % block_size + if remainder != 0: raise ValueError("When enabling chunked prefill and " "prefix caching, max_num_batched_tokens " "(chunk size) must be dividable by " "block size, but got chunk_size " f"({budget.token_budget}) % block_size " - f"({block_size}) = {reminder}") + f"({block_size}) = {remainder}") if remaining_token_budget < num_new_tokens: num_new_tokens = (remaining_token_budget // block_size) * block_size