Skip to content

Commit e2e4c4a

Browse files
committed
[CI] enable chunked prefill by default
Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
1 parent f10acdd commit e2e4c4a

File tree

3 files changed

+1
-3
lines changed

3 files changed

+1
-3
lines changed

tests/e2e/conftest.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -280,7 +280,7 @@ def __init__(
280280
disable_log_stats: bool = True,
281281
tensor_parallel_size: int = 1,
282282
block_size: int = 16,
283-
enable_chunked_prefill: bool = False,
283+
enable_chunked_prefill: bool = True,
284284
swap_space: int = 4,
285285
enforce_eager: Optional[bool] = False,
286286
quantization: Optional[str] = None,

tests/e2e/multicard/test_prefix_caching.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -58,7 +58,6 @@
5858
]
5959

6060

61-
@pytest.mark.skip(reason="Fix me, the accuracy is not correct")
6261
@pytest.mark.parametrize("model", MODELS)
6362
@pytest.mark.parametrize("max_tokens", [50])
6463
def test_prefix_cache_with_v1_scheduler(model: str, max_tokens: int) -> None:

tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -117,7 +117,6 @@ def test_eagle_correctness(
117117
spec_model_name = eagle3_model_name() if use_eagle3 else eagle_model_name()
118118
with VllmRunner(
119119
model_name,
120-
enable_chunked_prefill=True,
121120
max_num_seqs=1,
122121
max_num_batched_tokens=2048,
123122
gpu_memory_utilization=0.6,

0 commit comments

Comments (0)