66import vllm .envs as envs
77from ray .util .placement_group import PlacementGroup
88from ray .util .scheduling_strategies import PlacementGroupSchedulingStrategy
9- from vllm .distributed .kv_transfer .kv_connector .utils import KVOutputAggregator
109from vllm .multimodal .inputs import MultiModalKwargs
1110from vllm .platforms import current_platform
1211from vllm .ray .ray_env import get_env_vars_to_copy
1312from vllm .sequence import VLLM_TOKEN_ID_ARRAY_TYPE
1413from vllm .utils .network_utils import (get_distributed_init_method , get_ip ,
1514 get_open_port )
15+ from vllm .v1 .core .sched .output import SchedulerOutput
1616from vllm .v1 .executor .ray_distributed_executor import \
1717 RayDistributedExecutor as RayDistributedExecutorV1
1818from vllm .v1 .executor .ray_executor import RayWorkerMetaData
@@ -101,10 +101,10 @@ def _init_executor(self) -> None:
101101
102102 self .pp_locks : Optional [List [asyncio .Lock ]] = None
103103
104+ self .scheduler_output : SchedulerOutput | None = None
105+
104106 # KV connector setup
105107 self .has_connector = self .vllm_config .kv_transfer_config is not None
106- self .kv_output_aggregator = KVOutputAggregator (
107- self .parallel_config .world_size )
108108 if self .has_connector :
109109 ip_port = self .collective_rpc ("get_node_kv_ip_port" )
110110 for item in ip_port :
@@ -229,7 +229,7 @@ def _init_workers_ray(self, placement_group: "PlacementGroup",
229229 for each , ip in zip (worker_metadata , worker_ips ):
230230 each .ip = ip
231231
232- logger .debug ("workers: %s" , worker_metadata )
232+ logger .debug (f"Initialized worker_metadata: { worker_metadata } " )
233233
234234 ip_counts : Dict [str , int ] = {}
235235 for ip in worker_ips :
@@ -256,6 +256,9 @@ def sort_by_driver_then_worker_ip(item: RayWorkerMetaData):
256256 start_rank = 0
257257 for i , item in enumerate (sorted_worker_metadata ):
258258 item .adjusted_rank = i + start_rank
259+ logger .info (
260+ f"Initialized sorted worker_metadata: { sorted_worker_metadata } " )
261+
259262 self .workers = [item .worker for item in sorted_worker_metadata ]
260263 rerank_mapping = {
261264 item .created_rank : item .adjusted_rank
@@ -353,3 +356,8 @@ def sort_by_driver_then_worker_ip(item: RayWorkerMetaData):
353356 assert len (self .pp_tp_workers [pp_rank ]) == tp_rank
354357 assert pp_rank < len (self .pp_tp_workers )
355358 self .pp_tp_workers [pp_rank ].append (self .workers [rank ])
359+
360+ # The Ray executor does not need handshake metadata,
361+ # because the kv_parameters are passed through the proxy server.
def get_kv_connector_handshake_metadata(self) -> None:
    """Return no KV-connector handshake metadata.

    This method gathers nothing and always yields ``None``.

    Returns:
        None, unconditionally.
    """
    return None
0 commit comments