diff --git a/vllm/core/interfaces.py b/vllm/core/interfaces.py
index ba290eeda12b..69b9169ddd8a 100644
--- a/vllm/core/interfaces.py
+++ b/vllm/core/interfaces.py
@@ -133,3 +133,12 @@ def reset_prefix_cache(self, device: Optional[Device] = None) -> bool:
     @abstractmethod
     def get_num_cached_tokens(self, seq: Sequence) -> int:
         pass
+
+    @abstractmethod
+    def remove_seq_from_computed_blocks_tracker(self, seq: Sequence) -> None:
+        """Remove ``seq`` from the computed-blocks tracker.
+
+        NOTE(review): contract inferred from the method name; the tracker
+        itself is not visible in this patch -- confirm against implementers.
+        """
+        pass
diff --git a/vllm/core/placeholder_block_space_manager.py b/vllm/core/placeholder_block_space_manager.py
index 71b22942a3ed..679515924e85 100644
--- a/vllm/core/placeholder_block_space_manager.py
+++ b/vllm/core/placeholder_block_space_manager.py
@@ -98,3 +98,7 @@ def reset_prefix_cache(self, device: Optional[Device] = None) -> bool:
 
     def get_num_cached_tokens(self, seq: Sequence) -> int:
         return 0
+
+    def remove_seq_from_computed_blocks_tracker(self, seq: Sequence) -> None:
+        """No-op: return immediately without using ``seq``."""
+        return