2 files changed: +9 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -35,14 +35,19 @@ def register_model():
3535 ModelRegistry .register_model (
3636 "DeepseekV2ForCausalLM" ,
3737 "vllm_ascend.models.deepseek_dbo:CustomDeepseekDBOForCausalLM" )
38+
39+ ModelRegistry .register_model (
40+ "DeepseekV3ForCausalLM" ,
41+ "vllm_ascend.models.deepseek_dbo:CustomDeepseekDBOForCausalLM" )
42+
3843 else :
3944 ModelRegistry .register_model (
4045 "DeepseekV2ForCausalLM" ,
4146 "vllm_ascend.models.deepseek_v2:CustomDeepseekV2ForCausalLM" )
4247
43- ModelRegistry .register_model (
44- "DeepseekV3ForCausalLM" ,
45- "vllm_ascend.models.deepseek_v2:CustomDeepseekV3ForCausalLM" )
48+ ModelRegistry .register_model (
49+ "DeepseekV3ForCausalLM" ,
50+ "vllm_ascend.models.deepseek_v2:CustomDeepseekV3ForCausalLM" )
4651
4752 ModelRegistry .register_model (
4853 "Qwen3MoeForCausalLM" ,
Original file line number | Diff line number | Diff line change
@@ -641,7 +641,7 @@ def _forward_ms_layer(
641641
642642 if self .mlp .tp_size > 1 :
643643 num_token , _ = hidden_states [i ].shape
644- padded_num_tokens = (self .mlp .tp_size - num_token %
644+ padded_num_tokens = (self .mlp .tp_size - num_tokens [ i ] %
645645 self .mlp .tp_size ) % self .mlp .tp_size
646646 if padded_num_tokens > 0 :
647647 hidden_states [i ] = nn .functional .pad (
You can’t perform that action at this time.
0 commit comments