Skip to content

Commit f11083e

Browse files
committed
fix: Fix cost calculation for responses
Signed-off-by: Adam Tao <[email protected]>
1 parent bfaab8a commit f11083e

File tree

1 file changed

+9
-2
lines changed

1 file changed

+9
-2
lines changed

litellm/responses/utils.py

Lines changed: 9 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@
2323
ResponseText,
2424
)
2525
from litellm.types.responses.main import DecodedResponseId
26-
from litellm.types.utils import SpecialEnums, Usage
26+
from litellm.types.utils import PromptTokensDetails, SpecialEnums, Usage
2727

2828

2929
class ResponsesAPIRequestUtils:
@@ -375,8 +375,15 @@ def _transform_response_api_usage_to_chat_usage(
375375
)
376376
prompt_tokens: int = response_api_usage.input_tokens or 0
377377
completion_tokens: int = response_api_usage.output_tokens or 0
378+
prompt_tokens_details: Optional[PromptTokensDetails] = None
379+
if response_api_usage.input_tokens_details:
380+
prompt_tokens_details = PromptTokensDetails(
381+
cached_tokens=response_api_usage.input_tokens_details.cached_tokens,
382+
audio_tokens=response_api_usage.input_tokens_details.audio_tokens,
383+
)
378384
return Usage(
379385
prompt_tokens=prompt_tokens,
380386
completion_tokens=completion_tokens,
381387
total_tokens=prompt_tokens + completion_tokens,
382-
)
388+
prompt_tokens_details=prompt_tokens_details,
389+
)

0 commit comments

Comments
 (0)