Skip to content

Commit 85bda9e

Browse files
Remove incorrect GLM-4.5 quantization code (#21435)
1 parent 610852a commit 85bda9e

File tree

3 files changed

+2
-3
lines changed

3 files changed

+2
-3
lines changed

vllm/entrypoints/openai/tool_parsers/glm4_moe_tool_parser.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@
 logger = init_logger(__name__)
 
 
-@ToolParserManager.register_module("glm4_moe")
+@ToolParserManager.register_module("glm45")
 class Glm4MoeModelToolParser(ToolParser):
 
     def __init__(self, tokenizer: AnyTokenizer):

vllm/model_executor/models/glm4_moe.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -390,7 +390,6 @@ def __init__(self, *, vllm_config: VllmConfig, prefix: str = ""):
             self.embed_tokens = VocabParallelEmbedding(
                 config.vocab_size,
                 config.hidden_size,
-                quant_config=quant_config,
                 prefix=f"{prefix}.embed_tokens")
         else:
             self.embed_tokens = PPMissingLayer()

vllm/reasoning/glm4_moe_reasoning_parser.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
 logger = init_logger(__name__)
 
 
-@ReasoningParserManager.register_module("glm4_moe")
+@ReasoningParserManager.register_module("glm45")
 class Glm4MoeModelReasoningParser(ReasoningParser):
     """
     Reasoning parser for the Glm4MoeModel model.

0 commit comments

Comments
 (0)