File tree Expand file tree Collapse file tree 1 file changed +2
-5
lines changed
vllm/model_executor/models Expand file tree Collapse file tree 1 file changed +2
-5
lines changed Original file line number Diff line number Diff line change @@ -481,12 +481,9 @@ def verify_and_update_config(cls, vllm_config: "VllmConfig") -> None:
481481 is_v32 = hasattr (hf_config , "index_topk" )
482482 assert is_v32
483483
484- # For DeepSeekV3.2, we use a custom fp8 format as default (i.e.
485- # "auto")
484+ # For DeepSeekV3.2, a custom fp8 format is used when fp8 kv-cache is enabled.
486485 cache_config = vllm_config .cache_config
487- if cache_config .cache_dtype == "auto" or cache_config .cache_dtype .startswith (
488- "fp8"
489- ):
486+ if cache_config .cache_dtype .startswith ("fp8" ):
490487 cache_config .cache_dtype = "fp8_ds_mla"
491488 logger .info ("Using custom fp8 kv-cache format for DeepSeekV3.2" )
492489 if cache_config .cache_dtype == "bfloat16" :
You can’t perform that action at this time.
0 commit comments