Skip to content

Commit cceb5f0

Browse files
committed
enable mrope and lora
Signed-off-by: jiang.li <jiang1.li@intel.com>
1 parent cce8031 commit cceb5f0

File tree

2 files changed: 1 addition and 3 deletions (+1 -3 lines changed)

vllm/platforms/cpu.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -159,7 +159,7 @@ def check_and_update_config(cls, vllm_config: VllmConfig) -> None:
159 159   compilation_config = vllm_config.compilation_config
160 160   if vllm_config.compilation_config.level == CompilationLevel.PIECEWISE:
161 161   compilation_config.level = CompilationLevel.DYNAMO_ONCE
162     - compilation_config.backend = "inductor"
    162 + compilation_config.backend = "eager"
163 163   compilation_config.custom_ops += ["none"]
164 164   compilation_config.inductor_compile_config.update({
165 165   "dce":

vllm/v1/worker/cpu_model_runner.py

Lines changed: 0 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -19,8 +19,6 @@ def __init__(self, vllm_config: VllmConfig, device: torch.device):
19 19
20 20   assert device == torch.device("cpu")
21 21   assert self.speculative_config is None, "spec decode is not supported."
22    - assert not self.model_config.uses_mrope, "mrope is not supported."
23    - assert self.lora_config is None, "lora is not supported."
24 22
25 23   self.use_cuda_graph = False
26 24   self.cascade_attn_enabled = False

0 commit comments

Comments
 (0)