@@ -146,7 +146,7 @@ def compile_non_streaming(
146146 request_args = str (
147147 request .arguments .model_dump () if request .arguments else None
148148 ),
149- response_id = response .get ("id" ), # use vLLM ID if available
149+ response_id = response .get ("id" ), # use vLLM ID if available
150150 text = text ,
151151 input_metrics = input_metrics ,
152152 output_metrics = output_metrics ,
@@ -196,7 +196,7 @@ def compile_streaming(self, request: GenerationRequest) -> GenerationResponse:
196196 request_args = str (
197197 request .arguments .model_dump () if request .arguments else None
198198 ),
199- response_id = self .streaming_response_id , # use vLLM ID if available
199+ response_id = self .streaming_response_id , # use vLLM ID if available
200200 text = text ,
201201 input_metrics = input_metrics ,
202202 output_metrics = output_metrics ,
@@ -312,7 +312,7 @@ def compile_non_streaming(
312312 request_args = str (
313313 request .arguments .model_dump () if request .arguments else None
314314 ),
315- response_id = response .get ("id" ), # use vLLM ID if available
315+ response_id = response .get ("id" ), # use vLLM ID if available
316316 text = text ,
317317 input_metrics = input_metrics ,
318318 output_metrics = output_metrics ,
@@ -362,7 +362,7 @@ def compile_streaming(self, request: GenerationRequest) -> GenerationResponse:
362362 request_args = str (
363363 request .arguments .model_dump () if request .arguments else None
364364 ),
365- response_id = self .streaming_response_id , # use vLLM ID if available
365+ response_id = self .streaming_response_id , # use vLLM ID if available
366366 text = text ,
367367 input_metrics = input_metrics ,
368368 output_metrics = output_metrics ,
@@ -398,7 +398,6 @@ def __init__(self):
398398 self .streaming_usage : dict [str , int | dict [str , int ]] | None = None
399399 self .streaming_response_id : str | None = None
400400
401-
402401 def compile_non_streaming (
403402 self , request : GenerationRequest , response : dict
404403 ) -> GenerationResponse :
@@ -421,7 +420,7 @@ def compile_non_streaming(
421420 request_args = str (
422421 request .arguments .model_dump () if request .arguments else None
423422 ),
424- response_id = response .get ("id" ), # use vLLM ID if available
423+ response_id = response .get ("id" ), # use vLLM ID if available
425424 text = text ,
426425 input_metrics = input_metrics ,
427426 output_metrics = output_metrics ,
0 commit comments