We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b584b1b, commit bb462a9 (Copy full SHA for bb462a9)
vllm/model_executor/layers/fused_moe/mori_prepare_finalize.py
@@ -81,7 +81,10 @@ def finalize(
81
self,
82
output: torch.Tensor,
83
fused_expert_output: torch.Tensor,
84
+ topk_weights: torch.Tensor,
85
topk_ids: torch.Tensor,
86
+ apply_router_weight_on_input: None,
87
+ weight_and_reduce_impl: None,
88
) -> None:
89
num_token = output.shape[0]
90
result = self.mori_op.combine(
0 commit comments