We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d52358c, commit fdeb3da (Copy full SHA for fdeb3da)
vllm/model_executor/models/deepseek_v2.py
@@ -126,7 +126,7 @@ def __init__(
126
prefix=f"{prefix}.gate")
127
if config.topk_method == "noaux_tc":
128
self.gate.e_score_correction_bias = nn.Parameter(
129
- torch.empty(config.n_routed_experts))
+ torch.empty(config.n_routed_experts, dtype=torch.float32))
130
else:
131
self.gate.e_score_correction_bias = None
132
0 commit comments