fix ruff rejections

Kfir Wolfson · Kfir Wolfson · commit e391053e4d6b · 2025-10-16T11:32:22.000+03:00
Signed-off-by: Kfir Wolfson <kfirw@pliops.com>
diff --git a/requirements/test.txt b/requirements/test.txt
@@ -1224,7 +1224,6 @@ typeshed-client==2.8.2
     # via jsonargparse
 typing-extensions==4.15.0
     # via
-    #   aiosignal
     #   albumentations
     #   alembic
     #   chz
diff --git a/tests/v1/core/test_scheduler.py b/tests/v1/core/test_scheduler.py
@@ -1279,7 +1279,7 @@ def test_cache_hit_threshold(
     # number of blocks hit in external cache per request
     request_external_hit_blocks: list[int],
     # optional cache_hit_threshold for each request
-    request_thresholds: list[Optional[float]],
+    request_thresholds: list[float | None],
     # bool per request indicating if it is expected to be scheduled
     request_expected_scehduled: list[bool],
 ):
@@ -1326,7 +1326,7 @@ def test_cache_hit_threshold(
 
 def _create_and_schedule_requests(
     request_num_tokens: list[int],
-    request_thresholds: list[Optional[float]],
+    request_thresholds: list[float | None],
     scheduler: Scheduler,
 ):
     num_requests = len(request_num_tokens)
@@ -1373,7 +1373,7 @@ def _insert_to_local_cache(request_local_hit_blocks, scheduler: Scheduler):
     scheduler.connector.get_num_new_matched_tokens.return_value = (0, False)
 
     # set threshold to 0.0 to ensure all are scheduled
-    zero_thresholds: list[Optional[float]] = [0.0] * num_total_requests
+    zero_thresholds: list[float | None] = [0.0] * num_total_requests
 
     # Only requests with local hits should run and populate the cache
     # We create all requests to make sure the correct tokens are cached
diff --git a/vllm/entrypoints/logger.py b/vllm/entrypoints/logger.py
@@ -46,8 +46,7 @@ def log_inputs(
         )
 
         logger.info(
-            "Received request %s: params: %s, "
-            "lora_request: %s ",
+            "Received request %s: params: %s, lora_request: %s ",
             "cache_hit_threshold: %s.",
             request_id,
             params,
diff --git a/vllm/entrypoints/openai/protocol.py b/vllm/entrypoints/openai/protocol.py
@@ -1308,7 +1308,7 @@ class CompletionRequest(OpenAIBaseModel):
         default=None,
         description="Minimum required KV-cache hit ratio to process the request.",
     )
-    
+
     vllm_xargs: dict[str, str | int | float] | None = Field(
         default=None,
         description=(
diff --git a/vllm/v1/core/sched/scheduler.py b/vllm/v1/core/sched/scheduler.py
@@ -428,10 +428,11 @@ def schedule(self) -> SchedulerOutput:
                         num_new_local_computed_tokens + num_external_computed_tokens
                     )
                     # Cache hit threshold in request overrides global setting
+                    scheduler_config = self.vllm_config.scheduler_config
                     cache_hit_threshold = (
                         request.cache_hit_threshold
                         if request.cache_hit_threshold is not None
-                        else self.vllm_config.scheduler_config.global_cache_hit_threshold  # noqa: E501
+                        else scheduler_config.global_cache_hit_threshold
                     )
 
                     # Check if cache hit is above threshold

Original file line number	Diff line number	Diff line change
`@@ -46,8 +46,7 @@ def log_inputs(`
`46`	`46`	`)`
`47`	`47`
`48`	`48`	`logger.info(`
`49`		`- "Received request %s: params: %s, "`
`50`		`- "lora_request: %s ",`
	`49`	`+ "Received request %s: params: %s, lora_request: %s ",`
`51`	`50`	`"cache_hit_threshold: %s.",`
`52`	`51`	`request_id,`
`53`	`52`	`params,`
Original file line number	Diff line number	Diff line change
`@@ -1308,7 +1308,7 @@ class CompletionRequest(OpenAIBaseModel):`
`1308`	`1308`	`default=None,`
`1309`	`1309`	`description="Minimum required KV-cache hit ratio to process the request.",`
`1310`	`1310`	`)`
`1311`		`-`
	`1311`	`+`
`1312`	`1312`	`vllm_xargs: dict[str, str \| int \| float] \| None = Field(`
`1313`	`1313`	`default=None,`
`1314`	`1314`	`description=(`
Original file line number	Diff line number	Diff line change
`@@ -428,10 +428,11 @@ def schedule(self) -> SchedulerOutput:`
`428`	`428`	`num_new_local_computed_tokens + num_external_computed_tokens`
`429`	`429`	`)`
`430`	`430`	`# Cache hit threshold in request overrides global setting`
	`431`	`+ scheduler_config = self.vllm_config.scheduler_config`
`431`	`432`	`cache_hit_threshold = (`
`432`	`433`	`request.cache_hit_threshold`
`433`	`434`	`if request.cache_hit_threshold is not None`
`434`		`- else self.vllm_config.scheduler_config.global_cache_hit_threshold # noqa: E501`
	`435`	`+ else scheduler_config.global_cache_hit_threshold`
`435`	`436`	`)`
`436`	`437`
`437`	`438`	`# Check if cache hit is above threshold`