Skip to content

Commit 9748c51

Browse files
sarckk and ywang96 authored
[CI] Fix broken compile tests due to unsupported SiluMul+Nvfp4Quant fusion (#23973)
Signed-off-by: Yong Hoon Shin <[email protected]>
Co-authored-by: Roger Wang <[email protected]>
1 parent ee52a32 commit 9748c51

File tree

1 file changed

+6
-4
lines changed

1 file changed

+6
-4
lines changed

vllm/compilation/activation_quant_fusion.py

Lines changed: 6 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -29,8 +29,9 @@
2929
FUSED_OPS: dict[QuantKey, OpOverload] = {
3030
kFp8StaticTensorSym: torch.ops._C.silu_and_mul_quant.default, # noqa: E501
3131
}
32-
if current_platform.is_cuda() and hasattr(torch.ops._C,
33-
"silu_and_mul_nvfp4_quant"):
32+
silu_and_mul_nvfp4_quant_supported = (current_platform.is_cuda() and hasattr(
33+
torch.ops._C, "silu_and_mul_nvfp4_quant"))
34+
if silu_and_mul_nvfp4_quant_supported:
3435
FUSED_OPS[
3536
kNvfp4Quant] = torch.ops._C.silu_and_mul_nvfp4_quant.default # noqa: E501
3637

@@ -171,8 +172,9 @@ def __init__(self, config: VllmConfig):
171172
pattern_silu_mul_fp8 = SiluMulFp8StaticQuantPattern()
172173
pattern_silu_mul_fp8.register(self.patterns)
173174

174-
pattern_silu_mul_nvfp4 = SiluMulNvfp4QuantPattern()
175-
pattern_silu_mul_nvfp4.register(self.patterns)
175+
if silu_and_mul_nvfp4_quant_supported:
176+
pattern_silu_mul_nvfp4 = SiluMulNvfp4QuantPattern()
177+
pattern_silu_mul_nvfp4.register(self.patterns)
176178

177179
def __call__(self, graph: torch.fx.Graph):
178180
self.begin()

0 commit comments

Comments
 (0)