We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7efa6e0 commit 405e730 (Copy full SHA for 405e730)
vllm/engine/arg_utils.py
@@ -1063,7 +1063,8 @@ def create_engine_config(self,
1063
if (is_gpu and not use_sliding_window and not use_spec_decode
1064
and not self.enable_lora
1065
and not self.enable_prompt_adapter
1066
- and model_config.task != "embedding"):
+ and model_config.task != "embedding"
1067
+ and not current_platform.is_rocm()):
1068
self.enable_chunked_prefill = True
1069
logger.warning(
1070
"Chunked prefill is enabled by default for models with "
0 commit comments