File tree (Expand file tree / Collapse file tree): 3 files changed, +3 -5 lines changed
vllm/distributed/kv_transfer/kv_connector/v1 (Expand file tree / Collapse file tree): 3 files changed, +3 -5 lines changed
Load Diff: This file was deleted.
Original file line number | Diff line number | Diff line change
@@ -419,6 +419,7 @@ def _nixl_handshake(
419 419   engine_id=self.REMOTE_ENGINE_ID,
420 420   agent_metadata=FakeNixlWrapper.AGENT_METADATA,
421 421   kv_caches_base_addr=[0],
    422 + device_id=remote_tp_rank,
422 423   num_blocks=1,
423 424   block_lens=remote_block_lens,
424 425   attn_backend_name=self.backend_name,
Original file line number | Diff line number | Diff line change
@@ -956,7 +956,8 @@ def _nixl_handshake(
956 956   metadata = decoder.decode(metadata_bytes)
957 957   got_metadata_time = time.perf_counter()
958 958   logger.debug(
959     - "NIXL handshake: get metadata took: %s", got_metadata_time - start_time
    959 + "NIXL handshake: get metadata took: %s",
    960 + got_metadata_time - start_time,
960 961   )
961 962
962 963   # Ensure engine id matches.
@@ -1474,9 +1475,6 @@ def _validate_remote_agent_handshake(
1474 1475   )
1475 1476   remote_block_size = remote_block_len // (self.slot_size_per_layer[0])
1476 1477   else:
1477      - if tp_ratio != 1 and self.device_type == "xpu":
1478      - # XPU uses NHD, hence it does not support splitting on H
1479      - raise ValueError("Heterogeneous TP is not supported on XPU")
1480 1478   # When MLA is not used, this is a list of the same block length
1481 1479   for block_len in nixl_agent_meta.block_lens:
1482 1480   assert block_len == remote_block_len, (
You can’t perform that action at this time.
0 commit comments