We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c4075b8 commit 2ecf4ba (Copy full SHA for 2ecf4ba)
vllm/model_executor/layers/fused_moe/layer.py
@@ -503,7 +503,6 @@ def forward_cuda(
503
indices_type=torch.uint32 if self.moe.use_pplx_kernels else None)
504
505
if self.rocm_aiter_moe_enabled:
506
- assert not apply_router_weight_on_input
507
assert expert_map is None
508
return self.rocm_aiter_fused_experts(
509
hidden_states=x,
0 commit comments