We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 83ffe59 · commit fe8f042 · Copy full SHA for fe8f042
vllm_ascend/worker/worker_v1.py
@@ -54,7 +54,7 @@
54
init_ascend_soc_version, is_enable_nz,
55
prefill_context_parallel_enable,
56
register_ascend_customop, sleep_mode_enabled,
57
- try_register_lib,)
+ try_register_lib)
58
from vllm_ascend.worker.model_runner_v1 import NPUModelRunner
59
60
torch._dynamo.trace_rules.clear_lru_cache() # noqa: E402
@@ -477,4 +477,4 @@ def get_supported_tasks(self) -> "tuple[SupportedTask, ...]":
477
return self.model_runner.get_supported_tasks()
478
479
def take_draft_token_ids(self) -> Optional[DraftTokenIds]:
480
- return self.model_runner.take_draft_token_ids()
+ return self.model_runner.take_draft_token_ids()
0 commit comments