Add vLLM ID to the response

toslali-ibm · markurtz · commit 76c43f3cbf8a · 2025-11-16T11:49:43.000-05:00
Signed-off-by: Mert Toslali <toslali@ibm.com>
diff --git a/src/guidellm/backends/response_handlers.py b/src/guidellm/backends/response_handlers.py
@@ -145,6 +145,7 @@ def compile_non_streaming(
             request_args=str(
                 request.arguments.model_dump() if request.arguments else None
             ),
+            response_id=response.get("id"), # use vLLM ID if available
             text=text,
             input_metrics=input_metrics,
             output_metrics=output_metrics,
diff --git a/src/guidellm/schemas/response.py b/src/guidellm/schemas/response.py
@@ -41,6 +41,10 @@ class GenerationResponse(StandardBaseModel):
     request_id: str = Field(
         description="Unique identifier matching the original GenerationRequest."
     )
+    response_id: str | None = Field(
+        default=None,
+        description="Unique identifier matching the original vLLM Response ID."
+    )
     request_args: str | None = Field(
         description="Arguments passed to the backend for request processing."
     )

Original file line number	Diff line number	Diff line change
`@@ -41,6 +41,10 @@ class GenerationResponse(StandardBaseModel):`
`41`	`41`	`request_id: str = Field(`
`42`	`42`	`description="Unique identifier matching the original GenerationRequest."`
`43`	`43`	`)`
	`44`	`+ response_id: str \| None = Field(`
	`45`	`+ default=None,`
	`46`	`+ description="Unique identifier matching the original vLLM Response ID."`
	`47`	`+ )`
`44`	`48`	`request_args: str \| None = Field(`
`45`	`49`	`description="Arguments passed to the backend for request processing."`
`46`	`50`	`)`