Skip to content

Commit 5afce44

Browse files
committed
triton code vector core change rejection_sampler.py
Signed-off-by: yuxingcyx <[email protected]>
1 parent 20512f7 commit 5afce44

File tree

1 file changed

+10
-3
lines changed

1 file changed

+10
-3
lines changed

vllm_ascend/sample/rejection_sampler.py

Lines changed: 10 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,6 @@
33

44
import torch
55
import torch.nn as nn
6-
import triton.runtime.driver as driver
76
import vllm.v1.sample.rejection_sampler as rs
87
from vllm.triton_utils import HAS_TRITON, tl, triton
98
from vllm.v1.sample.metadata import SamplingMetadata
@@ -18,10 +17,18 @@
1817
# step. This value is chosen to be large enough to handle typical use cases.
1918
MAX_SPEC_LEN = 32
2019

21-
device_properties = driver.active.utils.get_device_properties(torch.npu.current_device())
22-
vectorcore_num = device_properties['num_vectorcore']
20+
21+
vectorcore_num = None
22+
device_properties = None
23+
24+
25+
if HAS_TRITON:
26+
from triton.runtime import driver
27+
device_properties = driver.active.utils.get_device_properties(torch.npu.current_device())
28+
vectorcore_num = device_properties['num_vectorcore']
2329
# Get the number of vector cores; it is used later for tiling.
2430

31+
2532
class AscendRejectionSampler(RejectionSampler, nn.Module):
2633
"""
2734
The implementation strictly follows the algorithm described in

0 commit comments

Comments
 (0)