Commit 56330f9

Author: weijinqian_v1

[Refactor] add fia_v3 attention & remove other attention operator.

Signed-off-by: weijinqian_v1 <[email protected]>

1 parent 959a630 commit 56330f9

File tree: 1 file changed (+3, -3 lines)


vllm_ascend/attention/attention_v1.py (3 additions, 3 deletions)
@@ -547,9 +547,9 @@ def forward(
 
         if hasattr(layer, 'quant_method') and use_kv_cache_int8:
             attn_output = layer.quant_method.apply(layer, query, key, value,
-                                                   kv_cache, attn_metadata,
-                                                   self.attn_type, self.scale,
-                                                   output)
+                                                   kv_cache, attn_metadata,
+                                                   self.attn_type, self.scale,
+                                                   output)
             output[:num_tokens] = attn_output[:num_tokens]
             return output
 
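The touched lines implement a dispatch pattern: when the attention layer carries a `quant_method` and the KV cache is int8-quantized, the forward pass delegates to `quant_method.apply(...)` and copies the first `num_tokens` rows into the preallocated output buffer. A minimal self-contained sketch of that pattern is below; `DummyQuantMethod` and the `Attn` class are hypothetical stand-ins for illustration, not vLLM Ascend APIs.

```python
class DummyQuantMethod:
    """Hypothetical stand-in for a layer's KV-cache-int8 quant method."""

    def apply(self, layer, query, key, value, kv_cache, attn_metadata,
              attn_type, scale, output):
        # A real quant method would dequantize the int8 KV cache and run
        # fused attention on the NPU; here we simply echo the query back
        # so the dispatch path is observable.
        return query


class Attn:
    """Sketch of the conditional delegation seen in the diff above."""

    def __init__(self, attn_type="decoder", scale=1.0):
        self.attn_type = attn_type
        self.scale = scale

    def forward(self, layer, query, key, value, kv_cache, attn_metadata,
                output, use_kv_cache_int8, num_tokens):
        # Same guard as the diff: only take the quantized path when the
        # layer exposes a quant_method AND the KV cache is int8.
        if hasattr(layer, 'quant_method') and use_kv_cache_int8:
            attn_output = layer.quant_method.apply(layer, query, key, value,
                                                   kv_cache, attn_metadata,
                                                   self.attn_type, self.scale,
                                                   output)
            # Copy only the valid token rows into the output buffer.
            output[:num_tokens] = attn_output[:num_tokens]
            return output
        # ...otherwise the regular (non-quantized) attention path would run.
        return output
```

Note that `output` is mutated in place and also returned, so callers that hold the preallocated buffer and callers that use the return value see the same data.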