We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 242f084 commit 7f4e3b1 — Copy full SHA for 7f4e3b1
vllm_ascend/sample/rejection_sampler.py
@@ -616,7 +616,7 @@ def rejection_greedy_sample_spec_len_1_triton(
616
target_argmax_id = tl.load(target_argmax_ptr + offset, mask)
617
tl.store(output_token_ids_ptr + offset * 2, target_argmax_id, mask)
618
619
- for pos in tl.arange(0, BLOCK_SIZE):
+ for pos in tl.range(0, BLOCK_SIZE):
620
draft_token_id1 = tl.get_element(draft_token_id, (pos, ))
621
target_argmax1 = tl.get_element(target_argmax_id, (pos, ))
622
position = block_idx * BLOCK_SIZE + pos
0 commit comments