Skip to content

Commit ffdb93b

Browse files
committed
tiny fix
Signed-off-by: Icey <1790571317@qq.com>
1 parent c4ad2bf commit ffdb93b

File tree

1 file changed

+9
-3
lines changed

1 file changed

+9
-3
lines changed

vllm_ascend/spec_decode/mtp_proposer.py

Lines changed: 9 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -9,8 +9,8 @@
 from vllm.forward_context import BatchDescriptor, get_forward_context
 from vllm.model_executor.layers.attention_layer_base import AttentionLayerBase
 from vllm.model_executor.model_loader import get_model_loader
-from vllm.model_executor.model_loader.utils import (
-    process_weights_after_loading, set_default_torch_dtype)
+from vllm.model_executor.model_loader.utils import \
+    process_weights_after_loading
 from vllm.v1.core.sched.output import SchedulerOutput
 from vllm.v1.sample.metadata import SamplingMetadata
 from vllm.v1.spec_decode.metadata import SpecDecodeMetadata
@@ -24,7 +24,13 @@
     TorchairDeepSeekMTP
 from vllm_ascend.torchair.utils import (TORCHAIR_CACHE_DIR,
                                         TorchairCommonAttentionMetadata)
-from vllm_ascend.utils import ProfileExecuteDuration, lmhead_tp_enable
+from vllm_ascend.utils import (ProfileExecuteDuration, lmhead_tp_enable,
+                               vllm_version_is)
+
+if vllm_version_is("0.11.0"):
+    from vllm.model_executor.model_loader.utils import set_default_torch_dtype
+else:
+    from vllm.utils.torch_utils import set_default_torch_dtype
 
 PADDING_SLOT_ID = -1
 
0 commit comments

Comments
 (0)