Skip to content

Commit b9842f4

Browse files
committed
WIP - additional tool types and LiteLLM
1 parent 9e7dc7a commit b9842f4

File tree

5 files changed

+1269
-24
lines changed

5 files changed

+1269
-24
lines changed

pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,7 @@ dev = [
5757
"pytest-cov>=6.1.1",
5858
"httpx>=0.28.1",
5959
"pytest-pretty>=1.3.0",
60+
"openai-agents[litellm] >= 0.2.3,<0.3"
6061
]
6162

6263
[tool.poe.tasks]

temporalio/contrib/openai_agents/_invoke_model_activity.py

Lines changed: 4 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121
Tool,
2222
TResponseInputItem,
2323
UserError,
24-
WebSearchTool,
24+
WebSearchTool, ImageGenerationTool, CodeInterpreterTool,
2525
)
2626
from agents.models.multi_provider import MultiProvider
2727
from typing_extensions import Required, TypedDict
@@ -51,7 +51,7 @@ class FunctionToolInput:
5151
strict_json_schema: bool = True
5252

5353

54-
ToolInput = Union[FunctionToolInput, FileSearchTool, WebSearchTool]
54+
ToolInput = Union[FunctionToolInput, FileSearchTool, WebSearchTool, ImageGenerationTool, CodeInterpreterTool]
5555

5656

5757
@dataclass
@@ -143,10 +143,8 @@ async def empty_on_invoke_handoff(
143143
input_input = json.loads(input_json)
144144

145145
def make_tool(tool: ToolInput) -> Tool:
146-
if isinstance(tool, FileSearchTool):
147-
return cast(FileSearchTool, tool)
148-
elif isinstance(tool, WebSearchTool):
149-
return cast(WebSearchTool, tool)
146+
if isinstance(tool, (FileSearchTool, WebSearchTool, ImageGenerationTool, CodeInterpreterTool)):
147+
return cast(Tool, tool)
150148
elif isinstance(tool, FunctionToolInput):
151149
t = cast(FunctionToolInput, tool)
152150
return FunctionTool(

temporalio/contrib/openai_agents/_temporal_model_stub.py

Lines changed: 3 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@
2323
ModelTracing,
2424
Tool,
2525
TResponseInputItem,
26-
WebSearchTool,
26+
WebSearchTool, ImageGenerationTool, CodeInterpreterTool,
2727
)
2828
from agents.items import TResponseStreamEvent
2929
from openai.types.responses.response_prompt_param import ResponsePromptParam
@@ -87,12 +87,8 @@ def get_summary(
8787
return ""
8888

8989
def make_tool_info(tool: Tool) -> ToolInput:
90-
if isinstance(tool, (FileSearchTool, WebSearchTool)):
90+
if isinstance(tool, (FileSearchTool, WebSearchTool, ImageGenerationTool, CodeInterpreterTool)):
9191
return tool
92-
elif isinstance(tool, ComputerTool):
93-
raise NotImplementedError(
94-
"Computer search preview is not supported in Temporal model"
95-
)
9692
elif isinstance(tool, FunctionTool):
9793
return FunctionToolInput(
9894
name=tool.name,
@@ -101,7 +97,7 @@ def make_tool_info(tool: Tool) -> ToolInput:
10197
strict_json_schema=tool.strict_json_schema,
10298
)
10399
else:
104-
raise ValueError(f"Unknown tool type: {tool.name}")
100+
raise ValueError(f"Unsupported tool type: {tool.name}")
105101

106102
tool_infos = [make_tool_info(x) for x in tools]
107103
handoff_infos = [

tests/contrib/openai_agents/test_openai.py

Lines changed: 290 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -29,9 +29,10 @@
2929
handoff,
3030
input_guardrail,
3131
output_guardrail,
32-
trace,
32+
trace, FileSearchTool, ImageGenerationTool, CodeInterpreterTool,
3333
)
3434
from agents.extensions.handoff_prompt import RECOMMENDED_PROMPT_PREFIX
35+
from agents.extensions.models.litellm_provider import LitellmProvider
3536
from agents.items import (
3637
HandoffOutputItem,
3738
ToolCallItem,
@@ -42,10 +43,12 @@
4243
ResponseFunctionToolCall,
4344
ResponseFunctionWebSearch,
4445
ResponseOutputMessage,
45-
ResponseOutputText,
46+
ResponseOutputText, ResponseFileSearchToolCall, ResponseCodeInterpreterToolCall,
4647
)
48+
from openai.types.responses.response_file_search_tool_call import Result
4749
from openai.types.responses.response_function_web_search import ActionSearch
4850
from openai.types.responses.response_prompt_param import ResponsePromptParam
51+
from openai.types.responses.tool_param import ImageGeneration
4952
from pydantic import ConfigDict, Field, TypeAdapter
5053

5154
from temporalio import activity, workflow
@@ -1777,3 +1780,288 @@ async def test_response_serialization():
17771780
response_id="",
17781781
)
17791782
encoded = await pydantic_data_converter.encode([model_response])
1783+
1784+
async def test_lite_llm(client: Client):
1785+
if not os.environ.get("OPENAI_API_KEY"):
1786+
pytest.skip("No openai API key")
1787+
new_config = client.config()
1788+
new_config["plugins"] = [
1789+
openai_agents.OpenAIAgentsPlugin(
1790+
model_params=ModelActivityParameters(
1791+
start_to_close_timeout=timedelta(seconds=30)
1792+
),
1793+
model_provider=LitellmProvider(),
1794+
)
1795+
]
1796+
client = Client(**new_config)
1797+
1798+
async with new_worker(
1799+
client,
1800+
HelloWorldAgent,
1801+
) as worker:
1802+
workflow_handle = await client.start_workflow(
1803+
HelloWorldAgent.run,
1804+
"Tell me about recursion in programming",
1805+
id=f"lite-llm-{uuid.uuid4()}",
1806+
task_queue=worker.task_queue,
1807+
execution_timeout=timedelta(seconds=10),
1808+
)
1809+
await workflow_handle.result()
1810+
1811+
1812+
class FileSearchToolModel(StaticTestModel):
1813+
responses = [
1814+
ModelResponse(
1815+
output=[
1816+
ResponseFileSearchToolCall(
1817+
queries=["side character in the Iliad"],
1818+
type="file_search_call",
1819+
id="id",
1820+
status="completed",
1821+
results=[
1822+
Result(text="Some scene"),
1823+
Result(text="Other scene"),
1824+
]
1825+
),
1826+
ResponseOutputMessage(
1827+
id="",
1828+
content=[
1829+
ResponseOutputText(
1830+
text="Patroclus",
1831+
annotations=[],
1832+
type="output_text",
1833+
)
1834+
],
1835+
role="assistant",
1836+
status="completed",
1837+
type="message",
1838+
)
1839+
],
1840+
usage=Usage(),
1841+
response_id=None,
1842+
),
1843+
]
1844+
1845+
@workflow.defn
1846+
class FileSearchToolWorkflow:
1847+
@workflow.run
1848+
async def run(self, question: str) -> str:
1849+
agent = Agent[str](
1850+
name="File Search Workflow",
1851+
instructions="You are a librarian. You should use your tools to source all your information.",
1852+
tools=[
1853+
FileSearchTool(
1854+
max_num_results=3,
1855+
vector_store_ids=["vs_687fd7f5e69c8191a2740f06bc9a159d"],
1856+
include_search_results=True,
1857+
)
1858+
],
1859+
)
1860+
result = await Runner.run(
1861+
starting_agent=agent, input=question
1862+
)
1863+
1864+
# A file search was performed
1865+
assert any(isinstance(item, ToolCallItem) and isinstance(item.raw_item, ResponseFileSearchToolCall) for item in result.new_items)
1866+
return result.final_output
1867+
1868+
@pytest.mark.parametrize("use_local_model", [True, False])
1869+
async def test_file_search_tool(client: Client, use_local_model):
1870+
if not use_local_model and not os.environ.get("OPENAI_API_KEY"):
1871+
pytest.skip("No openai API key")
1872+
1873+
new_config = client.config()
1874+
new_config["plugins"] = [
1875+
openai_agents.OpenAIAgentsPlugin(
1876+
model_params=ModelActivityParameters(
1877+
start_to_close_timeout=timedelta(seconds=30)
1878+
),
1879+
model_provider=TestModelProvider(FileSearchToolModel())
1880+
if use_local_model
1881+
else None,
1882+
)
1883+
]
1884+
client = Client(**new_config)
1885+
1886+
async with new_worker(
1887+
client,
1888+
FileSearchToolWorkflow,
1889+
) as worker:
1890+
workflow_handle = await client.start_workflow(
1891+
FileSearchToolWorkflow.run,
1892+
"Tell me about a side character in the Iliad.",
1893+
id=f"file-search-tool-{uuid.uuid4()}",
1894+
task_queue=worker.task_queue,
1895+
execution_timeout=timedelta(seconds=30),
1896+
)
1897+
result = await workflow_handle.result()
1898+
if use_local_model:
1899+
assert result == "Patroclus"
1900+
1901+
1902+
class ImageGenerationModel(StaticTestModel):
1903+
responses = [
1904+
ModelResponse(
1905+
output=[
1906+
ResponseFileSearchToolCall(
1907+
queries=["side character in the Iliad"],
1908+
type="file_search_call",
1909+
id="id",
1910+
status="completed",
1911+
results=[
1912+
Result(text="Some scene"),
1913+
Result(text="Other scene"),
1914+
]
1915+
),
1916+
ResponseOutputMessage(
1917+
id="",
1918+
content=[
1919+
ResponseOutputText(
1920+
text="Patroclus",
1921+
annotations=[],
1922+
type="output_text",
1923+
)
1924+
],
1925+
role="assistant",
1926+
status="completed",
1927+
type="message",
1928+
)
1929+
],
1930+
usage=Usage(),
1931+
response_id=None,
1932+
),
1933+
]
1934+
1935+
@workflow.defn
1936+
class ImageGenerationWorkflow:
1937+
@workflow.run
1938+
async def run(self, question: str) -> str:
1939+
agent = Agent[str](
1940+
name="Image Generation Workflow",
1941+
instructions="You are a helpful agent.",
1942+
tools=[
1943+
ImageGenerationTool(
1944+
tool_config={"type": "image_generation", "quality": "low"},
1945+
)
1946+
],
1947+
)
1948+
result = await Runner.run(
1949+
starting_agent=agent, input=question
1950+
)
1951+
1952+
return result.final_output
1953+
1954+
@pytest.mark.parametrize("use_local_model", [True, False])
1955+
async def test_image_generation_tool(client: Client, use_local_model):
1956+
if not use_local_model and not os.environ.get("OPENAI_API_KEY"):
1957+
pytest.skip("No openai API key")
1958+
1959+
new_config = client.config()
1960+
new_config["plugins"] = [
1961+
openai_agents.OpenAIAgentsPlugin(
1962+
model_params=ModelActivityParameters(
1963+
start_to_close_timeout=timedelta(seconds=30)
1964+
),
1965+
model_provider=TestModelProvider(ImageGenerationModel())
1966+
if use_local_model
1967+
else None,
1968+
)
1969+
]
1970+
client = Client(**new_config)
1971+
1972+
async with new_worker(
1973+
client,
1974+
ImageGenerationWorkflow,
1975+
) as worker:
1976+
workflow_handle = await client.start_workflow(
1977+
ImageGenerationWorkflow.run,
1978+
"Create an image of a frog eating a pizza, comic book style.",
1979+
id=f"image-generation-tool-{uuid.uuid4()}",
1980+
task_queue=worker.task_queue,
1981+
execution_timeout=timedelta(seconds=30),
1982+
)
1983+
result = await workflow_handle.result()
1984+
1985+
1986+
class CodeInterpreterModel(StaticTestModel):
1987+
responses = [
1988+
ModelResponse(
1989+
output=[
1990+
ResponseCodeInterpreterToolCall(
1991+
container_id="",
1992+
code="some code",
1993+
type="code_interpreter_call",
1994+
id="id",
1995+
status="completed",
1996+
),
1997+
ResponseOutputMessage(
1998+
id="",
1999+
content=[
2000+
ResponseOutputText(
2001+
text="Over 9000",
2002+
annotations=[],
2003+
type="output_text",
2004+
)
2005+
],
2006+
role="assistant",
2007+
status="completed",
2008+
type="message",
2009+
)
2010+
],
2011+
usage=Usage(),
2012+
response_id=None,
2013+
),
2014+
]
2015+
2016+
@workflow.defn
2017+
class CodeInterpreterWorkflow:
2018+
@workflow.run
2019+
async def run(self, question: str) -> str:
2020+
agent = Agent[str](
2021+
name="Code Interpreter Workflow",
2022+
instructions="You are a helpful agent.",
2023+
tools=[
2024+
CodeInterpreterTool(
2025+
tool_config={"type": "code_interpreter", "container": {"type": "auto"}},
2026+
)
2027+
],
2028+
)
2029+
result = await Runner.run(
2030+
starting_agent=agent, input=question
2031+
)
2032+
2033+
assert any(isinstance(item, ToolCallItem) and isinstance(item.raw_item, ResponseCodeInterpreterToolCall) for item in result.new_items)
2034+
return result.final_output
2035+
2036+
@pytest.mark.parametrize("use_local_model", [True, False])
2037+
async def test_code_interpreter_tool(client: Client, use_local_model):
2038+
if not use_local_model and not os.environ.get("OPENAI_API_KEY"):
2039+
pytest.skip("No openai API key")
2040+
2041+
new_config = client.config()
2042+
new_config["plugins"] = [
2043+
openai_agents.OpenAIAgentsPlugin(
2044+
model_params=ModelActivityParameters(
2045+
start_to_close_timeout=timedelta(seconds=30)
2046+
),
2047+
model_provider=TestModelProvider(CodeInterpreterModel())
2048+
if use_local_model
2049+
else None,
2050+
)
2051+
]
2052+
client = Client(**new_config)
2053+
2054+
async with new_worker(
2055+
client,
2056+
CodeInterpreterWorkflow,
2057+
) as worker:
2058+
workflow_handle = await client.start_workflow(
2059+
CodeInterpreterWorkflow.run,
2060+
"What is the square root of 273 * 312821 plus 1782?",
2061+
id=f"code-interpreter-tool-{uuid.uuid4()}",
2062+
task_queue=worker.task_queue,
2063+
execution_timeout=timedelta(seconds=30),
2064+
)
2065+
result = await workflow_handle.result()
2066+
if use_local_model:
2067+
assert result == "Over 9000"

0 commit comments

Comments
 (0)