Skip to content

Commit 4d01b64

Browse files
authored
[Bugfix] - Add Trace Headers to Beam Search Path (vllm-project#29100)
Signed-off-by: dsuhinin <suhinin.dmitriy@gmail.com>
1 parent 114b0e2 commit 4d01b64

File tree

3 files changed, with 4 additions and 0 deletions.

3 files changed, with 4 additions and 0 deletions.

vllm/entrypoints/openai/serving_chat.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -319,6 +319,7 @@ async def create_chat_completion(
319 319   request_id=request_id,
320 320   params=sampling_params,
321 321   lora_request=lora_request,
    322 + trace_headers=trace_headers,
322 323   )
323 324   else:
324 325   engine_request, tokenization_kwargs = await self._process_inputs(

vllm/entrypoints/openai/serving_completion.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -216,6 +216,7 @@ async def create_completion(
216 216   request_id=request_id,
217 217   params=sampling_params,
218 218   lora_request=lora_request,
    219 + trace_headers=trace_headers,
219 220   )
220 221   else:
221 222   engine_request, tokenization_kwargs = await self._process_inputs(

vllm/entrypoints/openai/serving_engine.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -343,6 +343,7 @@ async def beam_search(
343 343   request_id: str,
344 344   params: BeamSearchParams,
345 345   lora_request: LoRARequest | None = None,
    346 + trace_headers: Mapping[str, str] | None = None,
346 347   ) -> AsyncGenerator[RequestOutput, None]:
347 348   beam_width = params.beam_width
348 349   max_tokens = params.max_tokens
@@ -437,6 +438,7 @@ async def beam_search(
437 438   beam_search_params,
438 439   request_id_item,
439 440   lora_request=lora_req,
    441 + trace_headers=trace_headers,
440 442   )
441 443   )
442 444   )

0 commit comments

Comments
 (0)