Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 2 additions & 1 deletion vllm_ascend/spec_decode/interface.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,7 +35,8 @@ def dummy_run(self,
num_reqs: int = 0,
num_tokens_across_dp: Optional[torch.Tensor] = None,
aclgraph_runtime_mode: CUDAGraphMode = CUDAGraphMode.NONE,
batch_descriptor=None):
batch_descriptor=None,
dummy_compute_logits=lambda hidden_states: None) -> None:
"""Called by dummy_run in model_runner"""
raise NotImplementedError

Expand Down
3 changes: 2 additions & 1 deletion vllm_ascend/spec_decode/ngram_proposer.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,8 @@ def dummy_run(self,
num_reqs=None,
num_tokens_across_dp=None,
aclgraph_runtime_mode: CUDAGraphMode = CUDAGraphMode.NONE,
batch_descriptor=None):
batch_descriptor=None,
dummy_compute_logits=lambda hidden_states: None):
pass

def generate_token_ids(self,
Expand Down
Loading