Fix autotuning when routing_logits is None (routed mode) by passing a meta-device placeholder tensor

zyongye · zyongye · commit 9f3a99dee5d4 · 2026-03-05T01:24:20.000Z
diff --git a/flashinfer/fused_moe/core.py b/flashinfer/fused_moe/core.py
@@ -2154,9 +2154,17 @@ def trtllm_mxint4_block_scale_moe_op(
             use_shuffled_weight=True,
         )
         tunning_config = MoERunner.tuning_config_no_hidden_states_scales
+        # Create placeholder for tuning when routing_logits is None (routed mode)
+        routing_logits_for_tuning = (
+            routing_logits
+            if routing_logits is not None
+            else torch.empty(
+                num_tokens, num_experts, dtype=routing_dtype, device="meta"
+            )
+        )
         inputs = [
             output,
-            routing_logits,
+            routing_logits_for_tuning,
             topk_ids,
             expert_weights,
             hidden_states,