Skip to content

Commit 7200a21

Browse files
authored
[Bug] Fix Assertion error DeepEP/csrc/kernels/intranode.cu:928: 'false and Unsupported type' (#26532)
Signed-off-by: yewentao256 <zhyanwentao@126.com>
1 parent: 577c72a · commit: 7200a21

File tree

2 files changed

+5
-1
lines changed

2 files changed

+5
-1
lines changed

vllm/model_executor/layers/fused_moe/deepep_ht_prepare_finalize.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -336,7 +336,11 @@ def _finalize(
336 336   apply_router_weight_on_input=apply_router_weight_on_input,
337 337   )
338 338   dbo_yield_and_switch_from_compute_to_comm()
    339 + assert fused_expert_output.dtype == torch.bfloat16, (
    340 + f"Expected fused_expert_output bfloat16, got {fused_expert_output.dtype}"
    341 + )
339 342   combined_x, _, event = self.buffer.combine(
    343 + # HT combine only supports BF16
340 344   x=fused_expert_output,
341 345   handle=handle,
342 346   topk_weights=None,

vllm/model_executor/layers/fused_moe/modular_kernel.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -984,7 +984,7 @@ def input_chunk_range(chunk_idx: int) -> tuple[int, int]:
984 984   assert num_chunks == 0
985 985   workspace13 = None
986 986   workspace2 = None
987     - fused_out = torch.empty_like(a1q)
    987 + fused_out = torch.empty_like(a1q, dtype=in_dtype)
988 988   else:
989 989   assert num_chunks > 0
990 990   workspace13, workspace2, fused_out = self._allocate_buffers(

0 commit comments

Comments
 (0)