We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d5d2950, commit ea3ecbf (Copy full SHA for ea3ecbf)
vllm/model_executor/layers/fused_moe/layer.py
@@ -426,7 +426,7 @@ def apply(
426   w2=layer.w2_weight,
427   topk_weights=topk_weights,
428   topk_ids=topk_ids,
429 - inplace=True,
429 + inplace=True, # TODO(bnell): make sure this is handled properly
430   activation=activation,
431   global_num_experts=global_num_experts,
432   apply_router_weight_on_input=apply_router_weight_on_input,
0 commit comments