We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4a6f81c, commit 2541fd1 (Copy full SHA for 2541fd1)
vllm_ascend/worker/model_runner_v1.py
@@ -1431,10 +1431,8 @@ def _prepare_inputs(
1431
common_attn_metadata = AscendCommonAttentionMetadata(
1432
query_start_loc=self.query_start_loc[:num_reqs + 1],
1433
query_start_loc_cpu=self.query_start_loc_cpu[:num_reqs + 1],
1434
- query_start_loc_list=self.query_start_loc_cpu[:num_reqs + 1].cpu().int().tolist(),
1435
seq_lens_cpu=self.seq_lens_cpu,
1436
seq_lens=self.seq_lens_cpu[:num_reqs],
1437
- seq_lens_list=self.seq_lens_cpu[:num_reqs].cpu().int().tolist(),
1438
num_reqs=num_reqs,
1439
num_actual_tokens=total_num_scheduled_tokens,
1440
actual_seq_lengths_q=self.actual_seq_lengths_q,
0 commit comments