File tree: 1 file changed (+6 / -6 lines changed)
vllm/model_executor/layers/fused_moe Expand file tree Collapse file tree 1 file changed +6
-6
lines changed Original file line number Diff line number Diff line change @@ -724,12 +724,12 @@ def __init__(
724724
725725 # we padding globally so EP buffer allocation works
726726 if quant_config and quant_config .get_name () == "mxfp4" :
727- if not is_torch_equal_or_newer ( "2.8.0" ):
728- raise RuntimeError ( "Mxfp4 on hopper requires torch >= 2.8.0" )
729- if current_platform . is_device_capability (
730- 90 ) and not has_triton_kernels ():
731- raise NotImplementedError (
732- "Triton kernels must be installed for mxfp4 on hopper" )
727+ if current_platform . is_device_capability ( 90 ):
728+ if not is_torch_equal_or_newer ( "2.8.0" ):
729+ raise RuntimeError ( "Mxfp4 on hopper requires torch >= 2.8.0" )
730+ if not has_triton_kernels ():
731+ raise NotImplementedError (
732+ "Triton kernels must be installed for mxfp4 on hopper" )
733733 if (current_platform .is_rocm ()
734734 or envs .VLLM_USE_FLASHINFER_MOE_MXFP4_MXFP8
735735 or envs .VLLM_USE_FLASHINFER_MOE_MXFP4_BF16 ):
You can’t perform that action at this time.
0 commit comments