Skip to content

Commit 0cc6f23

Browse files
committed
[fix]: support deepseek-v3-dbo when DBO is enabled and fix known issues
Signed-off-by: zhuohuan <zxdu1997@gmail.com>
1 parent 2cd8ecd commit 0cc6f23

File tree

2 files changed

+9
-4
lines changed

vllm_ascend/models/__init__.py

Lines changed: 8 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -35,14 +35,19 @@ def register_model():
         ModelRegistry.register_model(
             "DeepseekV2ForCausalLM",
             "vllm_ascend.models.deepseek_dbo:CustomDeepseekDBOForCausalLM")
+
+        ModelRegistry.register_model(
+            "DeepseekV3ForCausalLM",
+            "vllm_ascend.models.deepseek_dbo:CustomDeepseekDBOForCausalLM")
+
     else:
         ModelRegistry.register_model(
             "DeepseekV2ForCausalLM",
             "vllm_ascend.models.deepseek_v2:CustomDeepseekV2ForCausalLM")
 
-    ModelRegistry.register_model(
-        "DeepseekV3ForCausalLM",
-        "vllm_ascend.models.deepseek_v2:CustomDeepseekV3ForCausalLM")
+        ModelRegistry.register_model(
+            "DeepseekV3ForCausalLM",
+            "vllm_ascend.models.deepseek_v2:CustomDeepseekV3ForCausalLM")
 
     ModelRegistry.register_model(
         "Qwen3MoeForCausalLM",

vllm_ascend/models/deepseek_dbo.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -641,7 +641,7 @@ def _forward_ms_layer(
 
             if self.mlp.tp_size > 1:
                 num_token, _ = hidden_states[i].shape
-                padded_num_tokens = (self.mlp.tp_size - num_token %
+                padded_num_tokens = (self.mlp.tp_size - num_tokens[i] %
                                      self.mlp.tp_size) % self.mlp.tp_size
                 if padded_num_tokens > 0:
                     hidden_states[i] = nn.functional.pad(

0 commit comments

Comments
 (0)