
Commit 1dd4c12

zzhx1 and Kurumi5210 committed
UT fix
Co-authored-by: chenxiao <[email protected]>
Signed-off-by: zzhx1 <[email protected]>
1 parent 4612e8f commit 1dd4c12

File tree

1 file changed: +8 −0 lines changed

tests/ut/attention/test_mla_v1.py

Lines changed: 8 additions & 0 deletions
@@ -6,6 +6,7 @@
 from vllm.model_executor.layers.linear import LinearBase
 
 from tests.ut.base import TestBase
+from vllm_ascend.ascend_config import init_ascend_config
 from vllm_ascend.attention.attention_v1 import AscendAttentionState
 from vllm_ascend.attention.mla_v1 import (AscendMLABackend,
                                           AscendMLADecodeMetadata,
@@ -723,6 +724,13 @@ def setUp(self, ascend_config, get_current_vllm_config, mock_get_tp_size,
         model_config.dtype = torch.float16
         vllm_config.model_config = model_config
         get_current_vllm_config.return_value = vllm_config
+        vllm_config.additional_config = {
+            "torchair_graph_config": {
+                "enabled": False,
+            },
+            "refresh": True
+        }
+        init_ascend_config(vllm_config)
 
         num_heads = 256
         head_size = 1024
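
For context, a minimal sketch of the setup pattern this diff introduces, assuming init_ascend_config reads vllm_config.additional_config and that "refresh": True forces the cached ascend config to be rebuilt across tests; the MagicMock stand-in mirrors the mocked config used in setUp and is illustrative, not the test's exact fixture:

from unittest.mock import MagicMock

from vllm_ascend.ascend_config import init_ascend_config

# Mocked stand-in for vllm's VllmConfig, as in the unit test's setUp.
vllm_config = MagicMock()
# additional_config is a plain dict so init_ascend_config can read it.
vllm_config.additional_config = {
    "torchair_graph_config": {
        "enabled": False,  # keep the torchair graph path off in this UT
    },
    "refresh": True,  # rebuild the global ascend config even if already set
}
init_ascend_config(vllm_config)

Initializing the ascend config up front means later code in the test that queries the torchair graph settings sees an explicit, deterministic value instead of whatever a previous test left behind.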
