From 6cd5a7be01baabf9e224611e7c2b457894e287bf Mon Sep 17 00:00:00 2001 From: homeffjy <74026382+homeffjy@users.noreply.github.com> Date: Sat, 12 Oct 2024 02:02:03 +0800 Subject: [PATCH] [Doc] Remove outdated comment to avoid misunderstanding (#9287) --- vllm/core/block_manager_v2.py | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/vllm/core/block_manager_v2.py b/vllm/core/block_manager_v2.py index c7ee6609306d7..cb047c832e6cb 100644 --- a/vllm/core/block_manager_v2.py +++ b/vllm/core/block_manager_v2.py @@ -24,9 +24,8 @@ class BlockSpaceManagerV2(BlockSpaceManager): autoregressively-generated tokens, and other advanced features such as prefix caching, forking/copy-on-write, and sliding-window memory allocation. - The current implementation is partial; in particular prefix caching and - sliding-window are not feature complete. This class implements the design - described in https://github.com/vllm-project/vllm/pull/3492. + This class implements the design described in + https://github.com/vllm-project/vllm/pull/3492. Lookahead slots The block manager has the notion of a "lookahead slot". These are slots @@ -190,7 +189,7 @@ def allocate(self, seq_group: SequenceGroup) -> None: assert (request_id not in self.cross_block_tables), \ - "block table already exists" + "block table already exists" check_no_caching_or_swa_for_blockmgr_encdec(self, seq_group)