We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 1fe3431, commit 0e7ff1b (Copy full SHA for 0e7ff1b)
vllm_ascend/worker/model_runner_v1.py
@@ -2862,7 +2862,7 @@ def _allocate_kv_cache_tensors(
2862
and "linear_attn" not in layer_name_inner):
2863
kv_cache_raw_tensors[layer_name_inner] = (k_tensor, v_tensor) if \
2864
not self.use_sparse else (k_tensor, v_tensor, k_cache_tensor)
2865
- break
+ break
2866
2867
layer_names = set()
2868
for group in kv_cache_config.kv_cache_groups:
0 commit comments