We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 64f688e, commit aded6ea. Copy full SHA for aded6ea.
vllm_ascend/quantization/quant_config.py
@@ -38,7 +38,6 @@
38
from vllm_ascend.distributed.parallel_state import (get_mlp_tp_group,
39
get_otp_group)
40
from vllm_ascend.ops.common_fused_moe import AscendUnquantizedFusedMoEMethod
41
-from vllm_ascend.ops.linear import AscendUnquantizedLinearMethod
42
from vllm_ascend.utils import (ASCEND_QUANTIZATION_METHOD, mlp_tp_enable,
43
oproj_tp_enable)
44
0 commit comments