We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d1e2d13 commit 8a6d9b6Copy full SHA for 8a6d9b6
vllm_ascend/worker/model_runner_v1.py
@@ -2701,7 +2701,6 @@ def sample_tokens(
2701
req_id = self.input_batch.req_ids[req_idx]
2702
req_state = self.requests[req_id]
2703
req_state.output_token_ids.extend(sampled_ids.tolist())
2704
-
2705
2706
def propose_draft_token_ids(sampled_token_ids):
2707
assert self.spec_decode_common_attn_metadata is not None
0 commit comments