Skip to content

Commit 9c0ad46

Browse files
[0.11.0][Bugfix] Remove the ZMQ communication setup on the D node (#4916)
In the PD separation scenario, the D node does not perform get operations and therefore does not need to set up ZeroMQ (ZMQ) communication.
---------
Signed-off-by: SlightwindSec <[email protected]>
1 parent ceadc27 commit 9c0ad46

File tree

1 file changed

+5
-3
lines changed

1 file changed

+5
-3
lines changed

vllm_ascend/distributed/mooncake/mooncake_store_connector_v1.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -45,7 +45,7 @@ def __init__(self, vllm_config: VllmConfig, role: KVConnectorRole):
4545
)
4646

4747
assert self.connector_worker is not None
48-
if vllm_config.parallel_config.rank == 0:
48+
if vllm_config.parallel_config.rank == 0 and self.kv_role != "kv_consumer":
4949
self.lookup_server = MooncakeLookupServer(
5050
self.connector_worker, vllm_config, self.use_layerwise)
5151

@@ -160,9 +160,10 @@ def get_zmq_rpc_path_mooncake(
160160
class MooncakeStoreConnectorV1Scheduler:
161161

162162
def __init__(self, vllm_config: "VllmConfig", use_layerwise):
163-
self.client = MooncakeLookupClient(vllm_config)
164163
self.use_layerwise = use_layerwise
165164
self.kv_role = vllm_config.kv_transfer_config.kv_role
165+
self.client = MooncakeLookupClient(
166+
vllm_config) if self.kv_role != "kv_consumer" else None
166167
self.consumer_is_to_load = vllm_config.kv_transfer_config.kv_connector_extra_config.get(
167168
"consumer_is_to_load", False)
168169
self.load_async = vllm_config.kv_transfer_config.kv_connector_extra_config.get(
@@ -207,7 +208,8 @@ def get_num_new_matched_tokens(
207208
else:
208209
token_ids = torch.tensor(request.prompt_token_ids)
209210

210-
num_external_hit_tokens = self.client.lookup(token_ids)
211+
num_external_hit_tokens = self.client.lookup( # type: ignore[union-attr]
212+
token_ids)
211213

212214
if num_external_hit_tokens == request.num_tokens:
213215
num_external_hit_tokens -= 1

0 commit comments

Comments
 (0)