We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b614e0f commit 3331ced Copy full SHA for 3331ced
vllm/platforms/rocm.py
@@ -340,7 +340,8 @@ def check_and_update_config(cls, vllm_config: "VllmConfig") -> None:
340
else:
341
parallel_config.worker_cls = "vllm.worker.worker.Worker"
342
# Aiter rms norm performs best when CUDA Graph capture is enabled.
343
- if use_v1 and use_aiter_rms_norm and not is_eager_execution:
+ if (use_v1 and use_aiter_rms_norm and not is_eager_execution
344
+ and "-rms_norm" not in compilation_config.custom_ops):
345
compilation_config.custom_ops.append("+rms_norm")
346
347
@classmethod
0 commit comments