-
Notifications
You must be signed in to change notification settings - Fork 10
Expand file tree
/
Copy pathresponse.py
More file actions
128 lines (96 loc) · 3.71 KB
/
response.py
File metadata and controls
128 lines (96 loc) · 3.71 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
"""
LLM response models.
This module contains structured response models for LLM API calls.
"""
from datetime import datetime
from uuid import UUID
from sqlmodel import SQLModel, Field
from typing import Literal, Annotated
from app.models.llm.request import AudioContent, TextContent
class Usage(SQLModel):
    """Token-usage accounting reported for an LLM call (or an aggregate of calls)."""

    input_tokens: int  # tokens consumed by the prompt/input
    output_tokens: int  # tokens generated by the model
    total_tokens: int  # presumably input + output as reported by the provider — confirm
    reasoning_tokens: int | None = None  # reasoning/"thinking" tokens, when the provider reports them
class TextOutput(SQLModel):
    """Text-modality LLM output.

    The literal ``type`` field is the discriminator tag used by the
    ``LLMOutput`` union to select this variant during validation.
    """

    type: Literal["text"] = "text"
    content: TextContent  # text payload model imported from app.models.llm.request
class AudioOutput(SQLModel):
    """Audio-modality LLM output.

    The literal ``type`` field is the discriminator tag used by the
    ``LLMOutput`` union to select this variant during validation.
    """

    type: Literal["audio"] = "audio"
    content: AudioContent  # audio payload model imported from app.models.llm.request
# Type alias for LLM output: a discriminated union over the output modalities.
# Pydantic dispatches on the `type` field ("text" -> TextOutput,
# "audio" -> AudioOutput) when validating, instead of trying each member.
LLMOutput = Annotated[TextOutput | AudioOutput, Field(discriminator="type")]
class LLMResponse(SQLModel):
    """Normalized response format independent of provider."""

    provider_response_id: str = Field(
        ..., description="Unique response ID provided by the LLM provider."
    )
    conversation_id: str | None = Field(
        default=None, description="Conversation or thread ID for context (if any)."
    )
    provider: str = Field(
        ..., description="Name of the LLM provider (e.g., openai, anthropic)."
    )
    model: str = Field(
        ..., description="Model used by the provider (e.g., gpt-4-turbo)."
    )
    # NOTE(review): typed as Optional but declared required (`...`) — callers
    # must always pass `output` explicitly, although None is an accepted value.
    # Confirm this is intentional rather than a missing `default=None`.
    output: LLMOutput | None = Field(
        ...,
        description="Structured output containing text and optional additional data.",
    )
class LLMCallResponse(SQLModel):
    """Top-level response schema for an LLM API call."""

    response: LLMResponse = Field(
        ..., description="Normalized, structured LLM response."
    )
    usage: Usage = Field(..., description="Token usage and cost information.")
    # Optional escape hatch: the provider's payload as-is, for debugging or
    # provider-specific fields not captured by the normalized schema.
    provider_raw_response: dict[str, object] | None = Field(
        default=None,
        description="Unmodified raw response from the LLM provider.",
    )
class LLMChainResponse(SQLModel):
    """Response schema for an LLM chain execution.

    Mirrors the shape of ``LLMCallResponse``, but ``response`` comes from the
    final step only while ``usage`` aggregates the whole chain (per the field
    descriptions below).
    """

    response: LLMResponse = Field(
        ..., description="LLM response from the final step of the chain execution."
    )
    usage: Usage = Field(
        ...,
        description="Aggregate token usage and cost for the entire chain execution.",
    )
    provider_raw_response: dict[str, object] | None = Field(
        default=None,
        description="Raw provider response from the last block (if requested)",
    )
class IntermediateChainResponse(SQLModel):
    """
    Intermediate callback response emitted by the intermediate blocks of an
    LLM chain execution (if configured).

    Uses a flattened structure matching the ``LLMCallResponse`` keys for
    consistency, plus progress fields (``block_index`` / ``total_blocks``)
    and a literal ``type`` tag so consumers can distinguish intermediate
    payloads from final ones.
    """

    type: Literal["intermediate"] = "intermediate"
    block_index: int = Field(..., description="Current block position")
    total_blocks: int = Field(..., description="Total number of blocks in the chain")
    response: LLMResponse = Field(
        ..., description="LLM Response from the current block"
    )
    usage: Usage = Field(
        ..., description="Token usage and cost information from the current block"
    )
    provider_raw_response: dict[str, object] | None = Field(
        default=None,
        description="Unmodified raw response from the LLM provider from the current block",
    )
# Job response models
class LLMJobBasePublic(SQLModel):
    """Base response model for LLM job information."""

    job_id: UUID  # unique identifier of the background job
    status: str  # JobStatus from job.py — kept as plain str here; confirm values match that enum
class LLMJobImmediatePublic(LLMJobBasePublic):
    """Immediate response after creating an LLM job."""

    message: str  # human-readable acknowledgement for the caller
    job_inserted_at: datetime  # when the job row was created
    job_updated_at: datetime  # when the job row was last modified
class LLMJobPublic(LLMJobBasePublic):
    """Full job response with nested LLM response when complete."""

    # Populated only once the job has finished successfully; otherwise None.
    llm_response: LLMCallResponse | None = None
    # Populated when the job failed; otherwise None.
    error_message: str | None = None