@@ -122,7 +122,7 @@
 from vllm_ascend.utils import (ACL_FORMAT_FRACTAL_ND, ACL_FORMAT_FRACTAL_NZ,
                                AscendDeviceType, ProfileExecuteDuration,
                                enable_sp, get_ascend_device_type, is_enable_nz,
-                               is_moe_model, lmhead_tp_enable)
+                               is_moe_model, is_vl_model, lmhead_tp_enable)
 from vllm_ascend.worker.npu_input_batch import InputBatch
 
 if TYPE_CHECKING:
@@ -270,6 +270,9 @@ def __init__(self, vllm_config: VllmConfig, device: torch.device):
 
         set_cos_and_sin(vllm_config, self.max_num_reqs,
                         self.uniform_decode_query_len, self.dtype, self.device)
+        if not is_vl_model(self.vllm_config
+                           ) and not self.vllm_config.model_config.use_mla:
+            initialize_cos_sin(self.vllm_config, self.dtype, self.device)
         set_mc2_tokens_capacity(vllm_config, self.max_num_reqs,
                                 self.uniform_decode_query_len)
         set_mc2_mask(vllm_config, self.device)
@@ -2198,6 +2201,9 @@ def _dummy_run(
         else:
             positions = self.positions.gpu[:num_tokens_padded]
 
+        # update global cos, sin
+        update_cos_sin(positions)
+
         if get_pp_group().is_first_rank:
             intermediate_tensors = None
         else:
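The bodies of `initialize_cos_sin` and `update_cos_sin` are not part of this hunk. The sketch below is only an illustration of one way a global rotary cos/sin cache of this shape could work: a table precomputed once for all positions up to `max_model_len`, then indexed by the batch's position ids before each forward. The module-level variables, the rope base of 10000.0, and the use of `model_config.get_head_size()` are assumptions for the sketch, not details confirmed by the diff.

```python
from typing import Optional

import torch

# Hypothetical module-level cache; the real helpers live in vllm_ascend and
# may be structured differently.
_COS_CACHE: Optional[torch.Tensor] = None
_SIN_CACHE: Optional[torch.Tensor] = None
_COS: Optional[torch.Tensor] = None
_SIN: Optional[torch.Tensor] = None


def initialize_cos_sin(vllm_config, dtype: torch.dtype,
                       device: torch.device) -> None:
    """Precompute cos/sin tables for every position up to max_model_len.

    Sketch only: assumes rotary dim == head_size and the default rope base
    of 10000.0; the real values would come from the model's rope config.
    """
    global _COS_CACHE, _SIN_CACHE
    max_len = vllm_config.model_config.max_model_len
    head_size = vllm_config.model_config.get_head_size()
    inv_freq = 1.0 / (10000.0 ** (
        torch.arange(0, head_size, 2, dtype=torch.float32, device=device)
        / head_size))
    t = torch.arange(max_len, dtype=torch.float32, device=device)
    freqs = torch.outer(t, inv_freq)  # [max_len, head_size // 2]
    _COS_CACHE = freqs.cos().to(dtype)
    _SIN_CACHE = freqs.sin().to(dtype)


def update_cos_sin(positions: torch.Tensor) -> None:
    """Select the cos/sin rows matching the current batch's position ids."""
    global _COS, _SIN
    if _COS_CACHE is None or _SIN_CACHE is None:
        # Cache was never initialized (e.g. the VL or MLA path above).
        return
    _COS = _COS_CACHE.index_select(0, positions)
    _SIN = _SIN_CACHE.index_select(0, positions)
```

The diff gates initialization on `not is_vl_model(...)` and `not ...use_mla`, so the cache is presumably skipped on paths that handle rotary embeddings differently; the hunk itself does not show that reasoning.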