Apply pre-commit lint fixes and code formatting

jthomson04 · jthomson04 · commit 7fe54de25e09 · 2025-07-02T13:03:59.000-07:00
diff --git a/lib/bindings/python/rust/llm/block_manager.rs b/lib/bindings/python/rust/llm/block_manager.rs
@@ -97,7 +97,7 @@ impl BlockManager {
                         .map_err(to_pyerr)?,
                 );
             }
-    
+
             if leader.num_disk_blocks() > 0 {
                 tracing::info!("Using {} disk blocks", leader.num_disk_blocks());
                 config = config.disk_layout(
@@ -111,7 +111,15 @@ impl BlockManager {
             (Some(leader), rt)
         } else {
             tracing::info!("Leader not provided. Block transfer functionality will be disabled.");
-            (None, Arc::new(tokio::runtime::Builder::new_multi_thread().enable_all().build().map_err(to_pyerr)?))
+            (
+                None,
+                Arc::new(
+                    tokio::runtime::Builder::new_multi_thread()
+                        .enable_all()
+                        .build()
+                        .map_err(to_pyerr)?,
+                ),
+            )
         };
 
         let config = config.build().map_err(to_pyerr)?;
diff --git a/lib/bindings/python/tests/test_kvbm.py b/lib/bindings/python/tests/test_kvbm.py
@@ -15,6 +15,7 @@
 try:
     from dynamo.llm import BlockManager
     from dynamo.llm.vllm_integration.kv_cache_manager import KvbmCacheManager
+
     KVBM_NOT_AVAILABLE = False
 except ImportError:
     KVBM_NOT_AVAILABLE = True
@@ -24,6 +25,7 @@
 PAGE_SIZE = 4
 DEVICE_NUM_BLOCKS = 16
 
+
 def new_request():
     return Request(
         request_id=str(uuid.uuid4()),
diff --git a/lib/bindings/python/tests/test_kvbm_vllm_integration.py b/lib/bindings/python/tests/test_kvbm_vllm_integration.py
@@ -1,7 +1,6 @@
 # SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 # SPDX-License-Identifier: Apache-2.0
 
-import time
 from typing import Optional
 
 import pytest
@@ -24,14 +23,13 @@
 try:
     from dynamo.llm import BlockManager
     from dynamo.llm.vllm_integration.kv_cache_manager import KvbmCacheManager
+
     KVBM_NOT_AVAILABLE = False
-except:
+except ImportError:
     KVBM_NOT_AVAILABLE = True
 
-def new_kv_cache_manager(
-    num_blocks: int = 11,
-    page_size: int = 16
-):
+
+def new_kv_cache_manager(num_blocks: int = 11, page_size: int = 16):
     """
     Creates a new KVBM cache manager.
 
@@ -89,7 +87,10 @@ def make_kv_cache_config(block_size: int, num_blocks: int) -> KVCacheConfig:
     )
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_prefill():
     """
     Tests the KvbmCacheManager's prefill functionality.
@@ -282,7 +283,10 @@ def test_prefill_plp():
     manager.free(req2)
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_decode():
     manager = new_kv_cache_manager()
 
@@ -350,7 +354,10 @@ def test_decode():
     manager.free_block_hashes(req0)
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_evict():
     manager = new_kv_cache_manager()
     used_blocks = set()
@@ -416,10 +423,13 @@ def test_evict():
     # assert manager.block_pool.free_block_queue.num_free_blocks == 7
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_hash_block_correct_reuse():
     """
-    This tests when a previously cached block is reused as a new block, 
+    This tests when a previously cached block is reused as a new block,
     its hash metadata should be correctly reset.
     """
     block_size = 16
@@ -467,7 +477,10 @@ def test_hash_block_correct_reuse():
     assert blocks.blocks[1].block_hash is None
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_computed_blocks_not_evicted():
     """
     Test that the computed blocks are not evicted when getting new blocks
@@ -564,7 +577,10 @@ def _test_mm_prefix_caching():
     pass
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_cache_key_salting():
     """
     This tests that cache salts are applied during hashing and the cache
@@ -635,7 +651,10 @@ def test_cache_key_salting():
     """
 
 
-@pytest.mark.skipif(VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE, reason="VLLM not available or KVBM not available")
+@pytest.mark.skipif(
+    VLLM_NOT_AVAILABLE or KVBM_NOT_AVAILABLE,
+    reason="VLLM not available or KVBM not available",
+)
 def test_prefill_not_enough_free_blocks_with_computed_blocks():
     """
     This is a unit test that tests the correctness of the allocate_slots
@@ -758,6 +777,7 @@ def _test_eagle_with_sliding_window():
     Test Eagle behavior with sliding window."""
     pass
 
+
 @pytest.mark.skipif(KVBM_NOT_AVAILABLE, reason="KVBM not available")
 def test_kvbm_wrong_blocks_provided():
     """