From d372eec2abdd66a893060474289e81548994b070 Mon Sep 17 00:00:00 2001
From: Abozar
Date: Sun, 5 Oct 2025 18:23:06 +0200
Subject: [PATCH] Add Azure OpenAI support and configuration options

Introduces Azure OpenAI as a supported provider, including new
configuration fields for endpoint, deployment name, and API version.
Updates the model configuration logic and token limits to handle Azure
OpenAI models, adds detection for Azure OpenAI web search calls, and
bumps the version to 0.0.17.
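
With these fields in place, a run can target Azure by prefixing the
model name with "azure_openai:" and passing the new values through the
runtime configuration. A minimal sketch, assuming AZURE_OPENAI_API_KEY
is set in the environment, that the standard RunnableConfig
"configurable" mapping read by Configuration.from_runnable_config is
used, and with placeholder endpoint/deployment values:

    config = {"configurable": {
        "research_model": "azure_openai:gpt-4o",
        "azure_endpoint": "https://your-resource.openai.azure.com/",
        "deployment_name": "gpt-4o",
        "api_version": "2024-02-15-preview",
    }}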
"max_tokens", "api_key", "azure_endpoint", "deployment_name", "api_version"), ) async def clarify_with_user(state: AgentState, config: RunnableConfig) -> Command[Literal["write_research_brief", "__end__"]]: @@ -78,12 +80,12 @@ async def clarify_with_user(state: AgentState, config: RunnableConfig) -> Comman # Step 2: Prepare the model for structured clarification analysis messages = state["messages"] - model_config = { - "model": configurable.research_model, - "max_tokens": configurable.research_model_max_tokens, - "api_key": get_api_key_for_model(configurable.research_model, config), - "tags": ["langsmith:nostream"] - } + model_config = get_model_config( + configurable.research_model, + configurable.research_model_max_tokens, + config, + configurable + ) # Configure model with structured output and retry logic clarification_model = ( @@ -131,12 +133,12 @@ async def write_research_brief(state: AgentState, config: RunnableConfig) -> Com """ # Step 1: Set up the research model for structured output configurable = Configuration.from_runnable_config(config) - research_model_config = { - "model": configurable.research_model, - "max_tokens": configurable.research_model_max_tokens, - "api_key": get_api_key_for_model(configurable.research_model, config), - "tags": ["langsmith:nostream"] - } + research_model_config = get_model_config( + configurable.research_model, + configurable.research_model_max_tokens, + config, + configurable + ) # Configure model for structured research question generation research_model = ( @@ -191,12 +193,12 @@ async def supervisor(state: SupervisorState, config: RunnableConfig) -> Command[ """ # Step 1: Configure the supervisor model with available tools configurable = Configuration.from_runnable_config(config) - research_model_config = { - "model": configurable.research_model, - "max_tokens": configurable.research_model_max_tokens, - "api_key": get_api_key_for_model(configurable.research_model, config), - "tags": ["langsmith:nostream"] - } + research_model_config = get_model_config( + configurable.research_model, + configurable.research_model_max_tokens, + config, + configurable + ) # Available tools: research delegation, completion signaling, and strategic thinking lead_researcher_tools = [ConductResearch, ResearchComplete, think_tool] @@ -389,12 +391,12 @@ async def researcher(state: ResearcherState, config: RunnableConfig) -> Command[ ) # Step 2: Configure the researcher model with tools - research_model_config = { - "model": configurable.research_model, - "max_tokens": configurable.research_model_max_tokens, - "api_key": get_api_key_for_model(configurable.research_model, config), - "tags": ["langsmith:nostream"] - } + research_model_config = get_model_config( + configurable.research_model, + configurable.research_model_max_tokens, + config, + configurable + ) # Prepare system prompt with MCP context if available researcher_prompt = research_system_prompt.format( @@ -457,6 +459,7 @@ async def researcher_tools(state: ResearcherState, config: RunnableConfig) -> Co has_tool_calls = bool(most_recent_message.tool_calls) has_native_search = ( openai_websearch_called(most_recent_message) or + azure_openai_websearch_called(most_recent_message) or anthropic_websearch_called(most_recent_message) ) @@ -524,12 +527,13 @@ async def compress_research(state: ResearcherState, config: RunnableConfig): """ # Step 1: Configure the compression model configurable = Configuration.from_runnable_config(config) - synthesizer_model = configurable_model.with_config({ - "model": 
diff --git a/src/open_deep_research/utils.py b/src/open_deep_research/utils.py
index 82ce304e2..4f1b2e8d8 100644
--- a/src/open_deep_research/utils.py
+++ b/src/open_deep_research/utils.py
@@ -82,13 +82,13 @@ async def tavily_search(
     max_char_to_include = configurable.max_content_length
 
     # Initialize summarization model with retry logic
-    model_api_key = get_api_key_for_model(configurable.summarization_model, config)
-    summarization_model = init_chat_model(
-        model=configurable.summarization_model,
-        max_tokens=configurable.summarization_model_max_tokens,
-        api_key=model_api_key,
-        tags=["langsmith:nostream"]
-    ).with_structured_output(Summary).with_retry(
+    summarization_model_config = get_model_config(
+        configurable.summarization_model,
+        configurable.summarization_model_max_tokens,
+        config,
+        configurable
+    )
+    summarization_model = init_chat_model(**summarization_model_config).with_structured_output(Summary).with_retry(
         stop_after_attempt=configurable.max_structured_output_retries
     )
 
@@ -657,6 +657,28 @@ def openai_websearch_called(response):
     return False
 
 
+def azure_openai_websearch_called(response):
+    """Detect if Azure OpenAI's web search functionality was used in the response.
+
+    Args:
+        response: The response object from Azure OpenAI's API
+
+    Returns:
+        True if web search was called, False otherwise
+    """
+    # Azure OpenAI uses the same web search mechanism as OpenAI
+    # Check for tool outputs in the response metadata
+    tool_outputs = response.additional_kwargs.get("tool_outputs")
+    if not tool_outputs:
+        return False
+
+    # Look for web search calls in the tool outputs
+    for tool_output in tool_outputs:
+        if tool_output.get("type") == "web_search_call":
+            return True
+
+    return False
+
 
 ##########################
 # Token Limit Exceeded Utils
@@ -797,6 +819,17 @@ def _check_gemini_token_limit(exception: Exception, error_str: str) -> bool:
     "openai:o3-pro": 200000,
     "openai:o1": 200000,
     "openai:o1-pro": 200000,
+    "azure_openai:gpt-4.1-mini": 1047576,
+    "azure_openai:gpt-4.1-nano": 1047576,
+    "azure_openai:gpt-4.1": 1047576,
+    "azure_openai:gpt-4o-mini": 128000,
+    "azure_openai:gpt-4o": 128000,
+    "azure_openai:o4-mini": 200000,
+    "azure_openai:o3-mini": 200000,
+    "azure_openai:o3": 200000,
+    "azure_openai:o3-pro": 200000,
+    "azure_openai:o1": 200000,
+    "azure_openai:o1-pro": 200000,
     "anthropic:claude-opus-4": 200000,
     "anthropic:claude-sonnet-4": 200000,
     "anthropic:claude-3-7-sonnet": 200000,
@@ -899,6 +932,8 @@ def get_api_key_for_model(model_name: str, config: RunnableConfig):
             return None
         if model_name.startswith("openai:"):
             return api_keys.get("OPENAI_API_KEY")
+        elif model_name.startswith("azure_openai:"):
+            return api_keys.get("AZURE_OPENAI_API_KEY")
         elif model_name.startswith("anthropic:"):
             return api_keys.get("ANTHROPIC_API_KEY")
         elif model_name.startswith("google"):
@@ -907,6 +942,8 @@
     else:
         if model_name.startswith("openai:"):
             return os.getenv("OPENAI_API_KEY")
+        elif model_name.startswith("azure_openai:"):
+            return os.getenv("AZURE_OPENAI_API_KEY")
         elif model_name.startswith("anthropic:"):
             return os.getenv("ANTHROPIC_API_KEY")
         elif model_name.startswith("google"):
@@ -923,3 +960,33 @@ def get_tavily_api_key(config: RunnableConfig):
         return api_keys.get("TAVILY_API_KEY")
     else:
         return os.getenv("TAVILY_API_KEY")
+
+def get_model_config(model_name: str, max_tokens: int, config: RunnableConfig, configurable: "Configuration") -> dict:
+    """Get properly configured model parameters based on model type.
+
+    Args:
+        model_name: The model identifier (e.g., "azure_openai:gpt-4", "openai:gpt-4")
+        max_tokens: Maximum tokens for the model
+        config: Runtime configuration
+        configurable: Configuration object with Azure settings
+
+    Returns:
+        Dictionary with properly configured model parameters
+    """
+    model_config = {
+        "model": model_name,
+        "max_tokens": max_tokens,
+        "api_key": get_api_key_for_model(model_name, config),
+        "tags": ["langsmith:nostream"]
+    }
+
+    # Only add Azure-specific parameters for Azure OpenAI models
+    if model_name.startswith("azure_openai:"):
+        if configurable.azure_endpoint:
+            model_config["azure_endpoint"] = configurable.azure_endpoint
+        if configurable.deployment_name:
+            model_config["deployment_name"] = configurable.deployment_name
+        if configurable.api_version:
+            model_config["api_version"] = configurable.api_version
+
+    return model_config
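
A usage sketch for the new helper (not part of the diff above; the
model name, endpoint, and deployment are illustrative, the remaining
Configuration fields are assumed to have defaults, and an empty
RunnableConfig is assumed to fall back to environment variables for
the API key, per get_api_key_for_model):

    from open_deep_research.configuration import Configuration
    from open_deep_research.utils import get_model_config

    configurable = Configuration(
        azure_endpoint="https://your-resource.openai.azure.com/",
        deployment_name="gpt-4o",
        api_version="2024-02-15-preview",
    )

    # Azure-prefixed models pick up the endpoint/deployment/version kwargs
    azure_cfg = get_model_config("azure_openai:gpt-4o", 10000, {}, configurable)
    assert azure_cfg["deployment_name"] == "gpt-4o"

    # Non-Azure models keep only the original four keys
    openai_cfg = get_model_config("openai:gpt-4o", 10000, {}, configurable)
    assert "azure_endpoint" not in openai_cfg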