vllm-project · czhu-cohere · Mar 12, 2026 · Mar 12, 2026 · gemini-code-assist · Mar 12, 2026
@@ -97,7 +97,6 @@ def _make_log_backend(backend: UnquantizedMoeBackend):
     flashinfer_cutlass_available = (
         has_flashinfer_cutlass_fused_moe()
         and use_ep
-        and (not use_dp)
         and current_platform.has_device_capability(90)
     )
     flashinfer_trtllm_moe_enabled = (
@@ -161,18 +160,13 @@ def _make_log_backend(backend: UnquantizedMoeBackend):
                     "to enable it for better performance.",
                     scope="local",
                 )
-            elif use_ep and (not use_dp):
+            elif use_ep:
                 logger.info_once(
                     "FlashInfer MoE is available for EP"
                     " but not enabled, consider setting"
                     " VLLM_USE_FLASHINFER_MOE_FP16=1 to enable it.",
                     scope="local",
                 )
-            elif use_dp:
-                logger.info_once(
-                    "FlashInfer CUTLASS MoE is currently not available for DP.",
-                    scope="local",
-                )
             backend = UnquantizedMoeBackend.TRITON
     if current_platform.is_xpu():
         backend = UnquantizedMoeBackend.XPU