diff --git a/vllm/model_executor/layers/quantization/quark/quark_moe.py b/vllm/model_executor/layers/quantization/quark/quark_moe.py index 0a5db4e71fdb..a3e0f24fb662 100644 --- a/vllm/model_executor/layers/quantization/quark/quark_moe.py +++ b/vllm/model_executor/layers/quantization/quark/quark_moe.py @@ -730,10 +730,12 @@ def __init__( get_current_vllm_config().model_config.hf_config, "model_type", None ) - self.emulate = ( - not current_platform.supports_mx() - or not self.ocp_mx_scheme.startswith("w_mxfp4") - ) and (self.mxfp4_backend is None or not self.use_rocm_aiter_moe) + self.emulate = not ( + current_platform.supports_mx() + and self.ocp_mx_scheme.startswith("w_mxfp4") + and self.mxfp4_backend is not None + and self.use_rocm_aiter_moe + ) # CK's pre-compiled MXFP4 MoE GEMM kernel instances have dimension # alignment requirements. When violated (e.g. MiniMax-M2.1 with