We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6d2bc7a, commit 6b5ca13. Copy full SHA for 6b5ca13
vllm_ascend/worker/model_runner_v1.py
@@ -2271,6 +2271,9 @@ def _build_dummy_attn_metadata(
2271
self.seq_lens_np[:num_reqs] = seq_lens
2272
self.seq_lens_np[num_reqs:] = 0
2273
2274
+ self.query_start_loc[:num_reqs + 1] = torch.arange(num_reqs + 1)
2275
+ self.query_start_loc_cpu[:num_reqs + 1] = torch.arange(num_reqs + 1)
2276
+
2277
num_computed_tokens_cpu = (
2278
self.input_batch.num_computed_tokens_cpu_tensor[:num_reqs])
2279
0 commit comments