Enable mrope and LoRA in the CPU model runner

bigPYJ1151 · bigPYJ1151 · commit cceb5f0fa7f8 · 2025-06-03T09:58:48.000Z
Signed-off-by: jiang.li <jiang1.li@intel.com>
diff --git a/vllm/platforms/cpu.py b/vllm/platforms/cpu.py
@@ -159,7 +159,7 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
         compilation_config = vllm_config.compilation_config
         if vllm_config.compilation_config.level == CompilationLevel.PIECEWISE:
             compilation_config.level = CompilationLevel.DYNAMO_ONCE
-            compilation_config.backend = "inductor"
+            compilation_config.backend = "eager"
             compilation_config.custom_ops += ["none"]
             compilation_config.inductor_compile_config.update({
                 "dce":
diff --git a/vllm/v1/worker/cpu_model_runner.py b/vllm/v1/worker/cpu_model_runner.py
@@ -19,8 +19,6 @@ def __init__(self, vllm_config: VllmConfig, device: torch.device):
 
         assert device == torch.device("cpu")
         assert self.speculative_config is None, "spec decode is not supported."
-        assert not self.model_config.uses_mrope, "mrope is not supported."
-        assert self.lora_config is None, "lora is not supported."
 
         self.use_cuda_graph = False
         self.cascade_attn_enabled = False