Skip to content

Commit 4feab2c

Browse files
committed
intel review
Signed-off-by: NickLucche <[email protected]>
1 parent dd4a8aa commit 4feab2c

File tree

3 files changed

+3
-5
lines changed

3 files changed

+3
-5
lines changed

tests/out_prefill

Lines changed: 0 additions & 1 deletion
This file was deleted.

tests/v1/kv_connector/unit/test_nixl_connector.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -419,6 +419,7 @@ def _nixl_handshake(
419 419   engine_id=self.REMOTE_ENGINE_ID,
420 420   agent_metadata=FakeNixlWrapper.AGENT_METADATA,
421 421   kv_caches_base_addr=[0],
    422 + device_id=remote_tp_rank,
422 423   num_blocks=1,
423 424   block_lens=remote_block_lens,
424 425   attn_backend_name=self.backend_name,

vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py

Lines changed: 2 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -956,7 +956,8 @@ def _nixl_handshake(
956 956   metadata = decoder.decode(metadata_bytes)
957 957   got_metadata_time = time.perf_counter()
958 958   logger.debug(
959     - "NIXL handshake: get metadata took: %s", got_metadata_time - start_time
    959 + "NIXL handshake: get metadata took: %s",
    960 + got_metadata_time - start_time,
960 961   )
961 962
962 963   # Ensure engine id matches.
@@ -1474,9 +1475,6 @@ def _validate_remote_agent_handshake(
1474 1475   )
1475 1476   remote_block_size = remote_block_len // (self.slot_size_per_layer[0])
1476 1477   else:
1477      - if tp_ratio != 1 and self.device_type == "xpu":
1478      - # XPU uses NHD, hence it does not support splitting on H
1479      - raise ValueError("Heterogeneous TP is not supported on XPU")
1480 1478   # When MLA is not used, this is a list of the same block length
1481 1479   for block_len in nixl_agent_meta.block_lens:
1482 1480   assert block_len == remote_block_len, (

0 commit comments

Comments
 (0)