File tree Expand file tree Collapse file tree 3 files changed +22
-4
lines changed
patch/platform/patch_common Expand file tree Collapse file tree 3 files changed +22
-4
lines changed Original file line number Diff line number Diff line change 5555 ParallelLMHead , VocabParallelEmbedding )
5656from vllm .model_executor .model_loader .weight_utils import (
5757 default_weight_loader , maybe_remap_kv_scale_name )
58- from vllm .model_executor .models import deepseek_v2
5958from vllm .model_executor .models .deepseek_v2 import \
6059 DeepseekV2ForCausalLM # noqa: E501
6160from vllm .model_executor .models .deepseek_v2 import \
6968from vllm .sequence import IntermediateTensors
7069
7170from vllm_ascend .ascend_config import get_ascend_config
72- from vllm_ascend .ops .common_fused_moe import AscendSharedFusedMoE
7371from vllm_ascend .ops .fused_moe import AscendFusedMoE
7472from vllm_ascend .quantization .quant_config import AscendLinearMethod
7573from vllm_ascend .quantization .w8a8_dynamic import AscendW8A8DynamicLinearMethod
7674from vllm_ascend .utils import dispose_tensor
7775
78- deepseek_v2 .SharedFusedMoE = AscendSharedFusedMoE
79-
8076
8177class CustomDeepseekV2SiluAndMul (SiluAndMul ):
8278
Original file line number Diff line number Diff line change 1616#
1717
1818import vllm_ascend .patch .platform .patch_common .patch_distributed # noqa
19+ import vllm_ascend .patch .platform .patch_common .patch_shared_fused_moe # noqa
Original file line number Diff line number Diff line change 1+ # Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
2+ # Copyright 2023 The vLLM team.
3+ #
4+ # Licensed under the Apache License, Version 2.0 (the "License");
5+ # you may not use this file except in compliance with the License.
6+ # You may obtain a copy of the License at
7+ #
8+ # http://www.apache.org/licenses/LICENSE-2.0
9+ #
10+ # Unless required by applicable law or agreed to in writing, software
11+ # distributed under the License is distributed on an "AS IS" BASIS,
12+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+ # See the License for the specific language governing permissions and
14+ # limitations under the License.
15+
16+ from vllm .model_executor .models import deepseek_v2 , llama4
17+
18+ from vllm_ascend .ops .common_fused_moe import AscendSharedFusedMoE
19+
20+ deepseek_v2 .SharedFusedMoE = AscendSharedFusedMoE
21+ llama4 .SharedFusedMoE = AscendSharedFusedMoE
You can’t perform that action at this time.
0 commit comments