We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 24d2a20 commit 012f221 (Copy full SHA for 012f221)
vllm_ascend/worker/model_runner_v1.py
@@ -2837,7 +2837,7 @@ def _allocate_kv_cache_tensors(
2837
and "linear_attn" not in layer_name_inner):
2838
kv_cache_raw_tensors[layer_name_inner] = (k_tensor, v_tensor) if \
2839
not self.use_sparse else (k_tensor, v_tensor, k_cache_tensor)
2840
- break
+ break
2841
2842
layer_names = set()
2843
for group in kv_cache_config.kv_cache_groups:
0 commit comments