pydantic · tarruda · Aug 19, 2025 · Aug 19, 2025 · Aug 19, 2025 · Aug 19, 2025
diff --git a/docs/input.md b/docs/input.md
@@ -102,6 +102,28 @@ print(result.output)
 #> The document discusses...
 ```
 
+## Uploaded files
+
+Use [`UploadedFile`][pydantic_ai.UploadedFile] to reference a file you've already uploaded to the model provider, so its content isn't sent again with the request.
+
+- [`OpenAIChatModel`][pydantic_ai.models.openai.OpenAIChatModel] and [`OpenAIResponsesModel`][pydantic_ai.models.openai.OpenAIResponsesModel] accept an `openai.types.FileObject` or a file ID string returned by the OpenAI Files API.
+- [`GoogleModel`][pydantic_ai.models.google.GoogleModel] accepts a `google.genai.types.File` or a file URI string from the Gemini Files API.
+- Other models currently raise `NotImplementedError` when they receive an `UploadedFile`.
+
+```py {title="uploaded_file_input.py" test="skip" lint="skip"}
+from pydantic_ai import Agent, UploadedFile
+
+agent = Agent(model='openai:gpt-5')
+result = agent.run_sync(
+    [
+        'Give me a short description of this image',
+        UploadedFile(file='file-abc123'),  # file-abc123 is a file ID returned by the provider
+    ]
+)
+print(result.output)
+#> The image is a simple design of a classic yellow smiley face...
+```
+
 ## User-side download vs. direct file URL
 
 As a general rule, when you provide a URL using any of `ImageUrl`, `AudioUrl`, `VideoUrl` or `DocumentUrl`, Pydantic AI downloads the file content and then sends it as part of the API request.

diff --git a/pydantic_ai_slim/pydantic_ai/__init__.py b/pydantic_ai_slim/pydantic_ai/__init__.py
@@ -80,6 +80,7 @@
     ToolCallPartDelta,
     ToolReturn,
     ToolReturnPart,
+    UploadedFile,
     UserContent,
     UserPromptPart,
     VideoFormat,
@@ -182,6 +183,7 @@
     'ToolCallPartDelta',
     'ToolReturn',
     'ToolReturnPart',
+    'UploadedFile',
     'UserContent',
     'UserPromptPart',
     'VideoFormat',

diff --git a/pydantic_ai_slim/pydantic_ai/_otel_messages.py b/pydantic_ai_slim/pydantic_ai/_otel_messages.py
@@ -43,12 +43,20 @@ class BinaryDataPart(TypedDict):
     content: NotRequired[str]
 
 
+class UploadedFilePart(TypedDict):  # otel message part for a file already hosted by the provider
+    type: Literal['uploaded-file']
+    identifier: NotRequired[str]  # filled from `UploadedFile.identifier`
+    file: NotRequired[str]  # provider reference string; only set when `include_content` is enabled
+
+
 class ThinkingPart(TypedDict):
     type: Literal['thinking']
     content: NotRequired[str]
 
 
-MessagePart: TypeAlias = 'TextPart | ToolCallPart | ToolCallResponsePart | MediaUrlPart | BinaryDataPart | ThinkingPart'
+MessagePart: TypeAlias = (
+    'TextPart | ToolCallPart | ToolCallResponsePart | MediaUrlPart | BinaryDataPart | UploadedFilePart | ThinkingPart'
+)
 
 
 Role = Literal['system', 'user', 'assistant']

diff --git a/pydantic_ai_slim/pydantic_ai/messages.py b/pydantic_ai_slim/pydantic_ai/messages.py
@@ -108,6 +108,16 @@ def _multi_modal_content_identifier(identifier: str | bytes) -> str:
     return hashlib.sha1(identifier).hexdigest()[:6]
 
 
+def _uploaded_file_identifier_source(file: Any) -> str:  # reference string used for hashing and otel output
+    if isinstance(file, str):
+        return file  # already a plain reference string (e.g. file ID or URI)
+    for attr in ('id', 'uri', 'name'):  # first string-valued attribute wins, in this order
+        value = getattr(file, attr, None)
+        if isinstance(value, str):
+            return value
+    return repr(file)  # last resort: object exposes no string `id`/`uri`/`name`
+
+
 @dataclass(init=False, repr=False)
 class FileUrl(ABC):
     """Abstract base class for any URL-based file."""
@@ -633,6 +643,59 @@ def __init__(
             raise ValueError('`BinaryImage` must be have a media type that starts with "image/"')  # pragma: no cover
 
 
+@dataclass(init=False, repr=False)
+class UploadedFile:
+    """File uploaded to the LLM provider.
+
+    Supported by [`OpenAIChatModel`][pydantic_ai.models.openai.OpenAIChatModel],
+    [`OpenAIResponsesModel`][pydantic_ai.models.openai.OpenAIResponsesModel], and
+    [`GoogleModel`][pydantic_ai.models.google.GoogleModel].
+
+    - For OpenAI-compatible models, provide an `openai.types.FileObject` or a file ID string returned by the Files API.
+    - For Gemini, provide a `google.genai.types.File` or the file URI string returned by the Files API.
+
+    Other models raise `NotImplementedError` when they receive this part.
+    """
+
+    file: Any
+    """A provider-specific file object, e.g. a file ID or a file URL."""
+
+    _: KW_ONLY
+
+    _identifier: Annotated[str | None, pydantic.Field(alias='identifier', default=None, exclude=True)] = field(
+        compare=False, default=None  # ignored by dataclass equality; the pydantic field is `exclude=True`
+    )
+    """Optional identifier for the uploaded file."""
+
+    kind: Literal['uploaded-file'] = 'uploaded-file'
+    """Type identifier, this is available on all parts as a discriminator."""
+
+    def __init__(
+        self,
+        file: Any,
+        *,
+        identifier: str | None = None,
+        kind: Literal['uploaded-file'] = 'uploaded-file',
+        # Required for inline-snapshot which expects all dataclass `__init__` methods to take all field names as kwargs.
+        _identifier: str | None = None,
+    ):
+        self.file = file
+        self._identifier = identifier or _identifier  # `identifier` wins; None or '' falls back to `_identifier`
+        self.kind = kind
+
+    @pydantic.computed_field
+    @property
+    def identifier(self) -> str:
+        """Identifier for the uploaded file, usually derived from the provider's reference."""
+        identifier = self._identifier
+        if identifier is not None:
+            return identifier  # an explicitly supplied identifier takes precedence
+        # Otherwise derive a short hash from the provider reference (ID/URI/name, else repr of the object).
+        return _multi_modal_content_identifier(_uploaded_file_identifier_source(self.file))
+
+    __repr__ = _utils.dataclasses_no_defaults_repr
+
+
 @dataclass
 class CachePoint:
     """A cache point marker for prompt caching.
@@ -656,7 +719,7 @@ class CachePoint:
     * Anthropic. See https://docs.claude.com/en/docs/build-with-claude/prompt-caching#1-hour-cache-duration for more information."""
 
 
-MultiModalContent = ImageUrl | AudioUrl | DocumentUrl | VideoUrl | BinaryContent
+MultiModalContent = ImageUrl | AudioUrl | DocumentUrl | VideoUrl | BinaryContent | UploadedFile
 UserContent: TypeAlias = str | MultiModalContent | CachePoint
 
 
@@ -774,11 +837,17 @@ def otel_message_parts(self, settings: InstrumentationSettings) -> list[_otel_me
                 if settings.include_content and settings.include_binary_content:
                     converted_part['content'] = base64.b64encode(part.data).decode()
                 parts.append(converted_part)
+            elif isinstance(part, UploadedFile):
+                uploaded_part: _otel_messages.UploadedFilePart = {
+                    'type': 'uploaded-file',
+                    'identifier': part.identifier,
+                }
+                if settings.include_content:
+                    uploaded_part['file'] = _uploaded_file_identifier_source(part.file)
+                parts.append(uploaded_part)
             elif isinstance(part, CachePoint):
                 # CachePoint is a marker, not actual content - skip it for otel
                 pass
-            else:
-                parts.append({'type': part.kind})  # pragma: no cover
         return parts
 
     __repr__ = _utils.dataclasses_no_defaults_repr

diff --git a/pydantic_ai_slim/pydantic_ai/models/bedrock.py b/pydantic_ai_slim/pydantic_ai/models/bedrock.py
@@ -34,6 +34,7 @@
     ThinkingPart,
     ToolCallPart,
     ToolReturnPart,
+    UploadedFile,
     UserPromptPart,
     VideoUrl,
     _utils,
@@ -676,6 +677,8 @@ async def _map_user_prompt(part: UserPromptPart, document_count: Iterator[int])
                         content.append({'video': video})
                 elif isinstance(item, AudioUrl):  # pragma: no cover
                     raise NotImplementedError('Audio is not supported yet.')
+                elif isinstance(item, UploadedFile):
+                    raise NotImplementedError('Uploaded files are not supported yet.')
                 elif isinstance(item, CachePoint):
                     # Bedrock support has not been implemented yet: https://github.com/pydantic/pydantic-ai/issues/3418
                     pass

diff --git a/pydantic_ai_slim/pydantic_ai/models/gemini.py b/pydantic_ai_slim/pydantic_ai/models/gemini.py
@@ -35,6 +35,7 @@
     ThinkingPart,
     ToolCallPart,
     ToolReturnPart,
+    UploadedFile,
     UserPromptPart,
     VideoUrl,
 )
@@ -392,6 +393,8 @@ async def _map_user_prompt(self, part: UserPromptPart) -> list[_GeminiPartUnion]
                     else:  # pragma: lax no cover
                         file_data = _GeminiFileDataPart(file_data={'file_uri': item.url, 'mime_type': item.media_type})
                         content.append(file_data)
+                elif isinstance(item, UploadedFile):
+                    raise NotImplementedError('Uploaded files are not supported for GeminiModel.')
                 elif isinstance(item, CachePoint):
                     # Gemini doesn't support prompt caching via CachePoint
                     pass

diff --git a/pydantic_ai_slim/pydantic_ai/models/google.py b/pydantic_ai_slim/pydantic_ai/models/google.py
@@ -34,6 +34,7 @@
     ThinkingPart,
     ToolCallPart,
     ToolReturnPart,
+    UploadedFile,
     UserPromptPart,
     VideoUrl,
 )
@@ -62,6 +63,7 @@
         CountTokensConfigDict,
         ExecutableCode,
         ExecutableCodeDict,
+        File,
         FileDataDict,
         FinishReason as GoogleFinishReason,
         FunctionCallDict,
@@ -628,13 +630,40 @@ async def _map_user_prompt(self, part: UserPromptPart) -> list[PartDict]:
                     else:
                         file_data_dict: FileDataDict = {'file_uri': item.url, 'mime_type': item.media_type}
                         content.append({'file_data': file_data_dict})  # pragma: lax no cover
+                elif isinstance(item, UploadedFile):
+                    content.append({'file_data': self._map_uploaded_file(item)})
                 elif isinstance(item, CachePoint):
                     # Google Gemini doesn't support prompt caching via CachePoint
                     pass
                 else:
                     assert_never(item)
         return content
 
+    @staticmethod
+    def _map_uploaded_file(item: UploadedFile) -> FileDataDict:
+        """Convert an UploadedFile into the structure expected by Gemini."""
+        file = item.file
+        if isinstance(file, File):  # SDK file object: take URI and metadata from it
+            file_uri = file.uri
+            mime_type = file.mime_type
+            display_name = getattr(file, 'display_name', None)  # NOTE(review): attr may be absent? confirm
+        elif isinstance(file, str):  # bare string is used as the file URI, with no metadata
+            file_uri = file
+            mime_type = None
+            display_name = None
+        else:
+            raise UserError('UploadedFile.file must be a genai.types.File or file URI string')
+
+        if not file_uri:  # rejects both a missing (None) and an empty-string URI
+            raise UserError('UploadedFile.file must include a file URI')
+
+        file_data: FileDataDict = {'file_uri': file_uri}  # `file_uri` is the only key always present
+        if mime_type:  # optional keys are added only when truthy
+            file_data['mime_type'] = mime_type
+        if display_name:
+            file_data['display_name'] = display_name
+        return file_data
+
     def _map_response_schema(self, o: OutputObjectDefinition) -> dict[str, Any]:
         response_schema = o.json_schema.copy()
         if o.name:

diff --git a/pydantic_ai_slim/pydantic_ai/models/huggingface.py b/pydantic_ai_slim/pydantic_ai/models/huggingface.py
@@ -34,6 +34,7 @@
     ThinkingPart,
     ToolCallPart,
     ToolReturnPart,
+    UploadedFile,
     UserPromptPart,
     VideoUrl,
 )
@@ -448,6 +449,8 @@ async def _map_user_prompt(part: UserPromptPart) -> ChatCompletionInputMessage:
                     raise NotImplementedError('DocumentUrl is not supported for Hugging Face')
                 elif isinstance(item, VideoUrl):
                     raise NotImplementedError('VideoUrl is not supported for Hugging Face')
+                elif isinstance(item, UploadedFile):
+                    raise NotImplementedError('Uploaded files are not supported for Hugging Face')
                 elif isinstance(item, CachePoint):
                     # Hugging Face doesn't support prompt caching via CachePoint
                     pass

diff --git a/pydantic_ai_slim/pydantic_ai/models/openai.py b/pydantic_ai_slim/pydantic_ai/models/openai.py
@@ -44,6 +44,7 @@
     ThinkingPart,
     ToolCallPart,
     ToolReturnPart,
+    UploadedFile,
     UserPromptPart,
     VideoUrl,
 )
@@ -56,7 +57,7 @@
 
 try:
     from openai import NOT_GIVEN, APIConnectionError, APIStatusError, AsyncOpenAI, AsyncStream
-    from openai.types import AllModels, chat, responses
+    from openai.types import AllModels, FileObject, chat, responses
     from openai.types.chat import (
         ChatCompletionChunk,
         ChatCompletionContentPartImageParam,
@@ -977,6 +978,9 @@ async def _map_user_prompt(self, part: UserPromptPart) -> chat.ChatCompletionUse
                                 type='file',
                             )
                         )
+                elif isinstance(item, UploadedFile):
+                    file_id = _map_uploaded_file(item, self._provider)
+                    content.append(File(file=FileFile(file_id=file_id), type='file'))
                 elif isinstance(item, VideoUrl):  # pragma: no cover
                     raise NotImplementedError('VideoUrl is not supported for OpenAI')
                 elif isinstance(item, CachePoint):
@@ -1733,8 +1737,7 @@ def _map_json_schema(self, o: OutputObjectDefinition) -> responses.ResponseForma
             response_format_param['strict'] = o.strict
         return response_format_param
 
-    @staticmethod
-    async def _map_user_prompt(part: UserPromptPart) -> responses.EasyInputMessageParam:  # noqa: C901
+    async def _map_user_prompt(self, part: UserPromptPart) -> responses.EasyInputMessageParam:  # noqa: C901
         content: str | list[responses.ResponseInputContentParam]
         if isinstance(part.content, str):
             content = part.content
@@ -1807,6 +1810,9 @@ async def _map_user_prompt(part: UserPromptPart) -> responses.EasyInputMessagePa
                             filename=f'filename.{downloaded_item["data_type"]}',
                         )
                     )
+                elif isinstance(item, UploadedFile):
+                    file_id = _map_uploaded_file(item, self._provider)
+                    content.append(responses.ResponseInputFileParam(file_id=file_id, type='input_file'))
                 elif isinstance(item, VideoUrl):  # pragma: no cover
                     raise NotImplementedError('VideoUrl is not supported for OpenAI.')
                 elif isinstance(item, CachePoint):
@@ -2324,6 +2330,21 @@ def _map_usage(
     )
 
 
+def _map_uploaded_file(uploaded_file: UploadedFile, _provider: Provider[Any]) -> str:  # `_provider` is unused here
+    """Map an UploadedFile to a file ID understood by OpenAI-compatible APIs."""
+    file = uploaded_file.file
+    if isinstance(file, str):  # a string is passed through unchanged as the file ID
+        return file
+    if isinstance(file, FileObject):
+        return file.id
+    # Duck-typed fallback: any other object exposing a string `id` attribute is accepted.
+    file_id = getattr(file, 'id', None)
+    if isinstance(file_id, str):
+        return file_id
+
+    raise UserError('UploadedFile.file must be a file ID string or an object with an `id` attribute')
+
+
 def _map_provider_details(
     choice: chat_completion_chunk.Choice | chat_completion.Choice,
 ) -> dict[str, Any]: