1 file changed: +6 -4 lines changed
Original file line number | Diff line number | Diff line change
2929FUSED_OPS : dict [QuantKey , OpOverload ] = {
3030 kFp8StaticTensorSym : torch .ops ._C .silu_and_mul_quant .default , # noqa: E501
3131}
32- if current_platform .is_cuda () and hasattr (torch .ops ._C ,
33- "silu_and_mul_nvfp4_quant" ):
32+ silu_and_mul_nvfp4_quant_supported = (current_platform .is_cuda () and hasattr (
33+ torch .ops ._C , "silu_and_mul_nvfp4_quant" ))
34+ if silu_and_mul_nvfp4_quant_supported :
3435 FUSED_OPS [
3536 kNvfp4Quant ] = torch .ops ._C .silu_and_mul_nvfp4_quant .default # noqa: E501
3637
@@ -171,8 +172,9 @@ def __init__(self, config: VllmConfig):
171172 pattern_silu_mul_fp8 = SiluMulFp8StaticQuantPattern ()
172173 pattern_silu_mul_fp8 .register (self .patterns )
173174
174- pattern_silu_mul_nvfp4 = SiluMulNvfp4QuantPattern ()
175- pattern_silu_mul_nvfp4 .register (self .patterns )
175+ if silu_and_mul_nvfp4_quant_supported :
176+ pattern_silu_mul_nvfp4 = SiluMulNvfp4QuantPattern ()
177+ pattern_silu_mul_nvfp4 .register (self .patterns )
176178
177179 def __call__ (self , graph : torch .fx .Graph ):
178180 self .begin ()
You can’t perform that action at this time.
0 commit comments