From a49a19e7840ceacc6c113cb81c2e7618426ded03 Mon Sep 17 00:00:00 2001
From: Krrish Dholakia <krrishdholakia@gmail.com>
Date: Sat, 4 Oct 2025 18:14:32 -0700
Subject: [PATCH 1/4] fix(mcp/): re-raise exception from server to client

allows user to debug why mcp server is not working as expected

Related to https://github.com/BerriAI/litellm/pull/15180
---
 litellm/experimental_mcp_client/client.py     |  5 +--
 .../mcp_server/mcp_server_manager.py          | 34 +++++++--------
 .../proxy/_experimental/mcp_server/server.py  | 43 ++++++++++---------
 litellm/proxy/_new_secret_config.yaml         | 22 +++-------
 4 files changed, 48 insertions(+), 56 deletions(-)

diff --git a/litellm/experimental_mcp_client/client.py b/litellm/experimental_mcp_client/client.py
index 225349b4e8a8..b7db917cba64 100644
--- a/litellm/experimental_mcp_client/client.py
+++ b/litellm/experimental_mcp_client/client.py
@@ -235,10 +235,9 @@ async def list_tools(self) -> List[MCPTool]:
             await self.disconnect()
             raise
         except Exception as e:
-            verbose_logger.warning(f"MCP client list_tools failed: {str(e)}")
+            verbose_logger.debug(f"MCP client list_tools failed: {str(e)}")
             await self.disconnect()
-            # Return empty list instead of raising to allow graceful degradation
-            return []
+            raise e
 
     async def call_tool(
         self, call_tool_request_params: MCPCallToolRequestParams
diff --git a/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py b/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
index 2c46f9561db1..bfe7a3e4679b 100644
--- a/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
+++ b/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
@@ -490,10 +490,10 @@ async def _get_tools_from_server(
             return prefixed_or_original_tools
 
         except Exception as e:
-            verbose_logger.warning(
+            verbose_logger.debug(
                 f"Failed to get tools from server {server.name}: {str(e)}"
             )
-            return []
+            raise e
         finally:
             if client:
                 try:
@@ -522,14 +522,14 @@ async def _list_tools_task():
                 tools = await client.list_tools()
                 verbose_logger.debug(f"Tools from {server_name}: {tools}")
                 return tools
-            except asyncio.CancelledError:
-                verbose_logger.warning(f"Client operation cancelled for {server_name}")
-                return []
+            except asyncio.CancelledError as e:
+                verbose_logger.debug(f"Client operation cancelled for {server_name}")
+                raise e
             except Exception as e:
-                verbose_logger.warning(
+                verbose_logger.debug(
                     f"Client operation failed for {server_name}: {str(e)}"
                 )
-                return []
+                raise e
             finally:
                 try:
                     await client.disconnect()
@@ -538,22 +538,22 @@ async def _list_tools_task():
 
         try:
             return await asyncio.wait_for(_list_tools_task(), timeout=30.0)
-        except asyncio.TimeoutError:
-            verbose_logger.warning(f"Timeout while listing tools from {server_name}")
-            return []
-        except asyncio.CancelledError:
-            verbose_logger.warning(
+        except asyncio.TimeoutError as e:
+            verbose_logger.debug(f"Timeout while listing tools from {server_name}")
+            raise e
+        except asyncio.CancelledError as e:
+            verbose_logger.debug(
                 f"Task cancelled while listing tools from {server_name}"
             )
-            return []
+            raise e
         except ConnectionError as e:
-            verbose_logger.warning(
+            verbose_logger.debug(
                 f"Connection error while listing tools from {server_name}: {str(e)}"
             )
-            return []
+            raise e
         except Exception as e:
-            verbose_logger.warning(f"Error listing tools from {server_name}: {str(e)}")
-            return []
+            verbose_logger.debug(f"Error listing tools from {server_name}: {str(e)}")
+            raise e
 
     def _create_prefixed_tools(
         self, tools: List[MCPTool], server: MCPServer, add_prefix: bool = True
diff --git a/litellm/proxy/_experimental/mcp_server/server.py b/litellm/proxy/_experimental/mcp_server/server.py
index 3e7c291810a5..75c04ebe947c 100644
--- a/litellm/proxy/_experimental/mcp_server/server.py
+++ b/litellm/proxy/_experimental/mcp_server/server.py
@@ -206,10 +206,8 @@ async def list_tools() -> List[MCPTool]:
             )
             return tools
         except Exception as e:
-            verbose_logger.exception(f"Error in list_tools endpoint: {str(e)}")
-            # Return empty list instead of failing completely
-            # This prevents the HTTP stream from failing and allows the client to get a response
-            return []
+            verbose_logger.debug(f"Error in list_tools endpoint: {str(e)}")
+            raise e
 
     @server.call_tool()
     async def mcp_server_tool_call(
@@ -364,25 +362,25 @@ async def _get_allowed_mcp_servers_from_mcp_server_names(
     def _tool_name_matches(tool_name: str, filter_list: List[str]) -> bool:
         """
         Check if a tool name matches any name in the filter list.
-        
+
         Checks both the full tool name and unprefixed version (without server prefix).
         This allows users to configure simple tool names regardless of prefixing.
-        
+
         Args:
             tool_name: The tool name to check (may be prefixed like "server-tool_name")
             filter_list: List of tool names to match against
-            
+
         Returns:
             True if the tool name (prefixed or unprefixed) is in the filter list
         """
         from litellm.proxy._experimental.mcp_server.utils import (
             get_server_name_prefix_tool_mcp,
         )
-        
+
         # Check if the full name is in the list
         if tool_name in filter_list:
             return True
-            
+
         # Check if the unprefixed name is in the list
         unprefixed_name, _ = get_server_name_prefix_tool_mcp(tool_name)
         return unprefixed_name in filter_list
@@ -393,34 +391,36 @@ def filter_tools_by_allowed_tools(
     ) -> List[MCPTool]:
         """
         Filter tools by allowed/disallowed tools configuration.
-        
+
         If allowed_tools is set, only tools in that list are returned.
         If disallowed_tools is set, tools in that list are excluded.
         Tool names are matched with and without server prefixes for flexibility.
-        
+
         Args:
             tools: List of tools to filter
             mcp_server: Server configuration with allowed_tools/disallowed_tools
-            
+
         Returns:
             Filtered list of tools
         """
         tools_to_return = tools
-        
+
         # Filter by allowed_tools (whitelist)
         if mcp_server.allowed_tools:
             tools_to_return = [
-                tool for tool in tools 
+                tool
+                for tool in tools
                 if _tool_name_matches(tool.name, mcp_server.allowed_tools)
             ]
-                    
+
         # Filter by disallowed_tools (blacklist)
         if mcp_server.disallowed_tools:
             tools_to_return = [
-                tool for tool in tools_to_return
+                tool
+                for tool in tools_to_return
                 if not _tool_name_matches(tool.name, mcp_server.disallowed_tools)
             ]
-            
+
         return tools_to_return
 
     async def _get_tools_from_mcp_servers(
@@ -497,18 +497,19 @@ async def _get_tools_from_mcp_servers(
                     extra_headers=extra_headers,
                     add_prefix=add_prefix,
                 )
-                
+
                 filtered_tools = filter_tools_by_allowed_tools(tools, server)
                 all_tools.extend(filtered_tools)
-                
+
                 verbose_logger.debug(
                     f"Successfully fetched {len(tools)} tools from server {server.name}, {len(filtered_tools)} after filtering"
                 )
             except Exception as e:
-                verbose_logger.exception(
+                verbose_logger.debug(
                     f"Error getting tools from server {server.name}: {str(e)}"
                 )
                 # Continue with other servers instead of failing completely
+                raise e
 
         verbose_logger.info(
             f"Successfully fetched {len(all_tools)} tools total from all MCP servers"
@@ -556,7 +557,7 @@ async def _list_mcp_tools(
                 f"Error getting tools from managed MCP servers: {str(e)}"
             )
             # Continue with empty managed tools list instead of failing completely
-
+            raise e
         # Get tools from local registry
         local_tools = []
         try:
diff --git a/litellm/proxy/_new_secret_config.yaml b/litellm/proxy/_new_secret_config.yaml
index b7b30d36f996..50d36fee0480 100644
--- a/litellm/proxy/_new_secret_config.yaml
+++ b/litellm/proxy/_new_secret_config.yaml
@@ -16,18 +16,10 @@ model_list:
       api_base: "https://webhook.site/2f385e05-00aa-402b-86d1-efc9261471a5"
       api_key: dummy
 
-# mcp_servers:
-#   github_mcp:
-#     url: "https://api.githubcopilot.com/mcp"
-#     auth_type: oauth2
-#     authorization_url: https://github.com/login/oauth/authorize
-#     token_url: https://github.com/login/oauth/access_token
-#     client_id: os.environ/GITHUB_OAUTH_CLIENT_ID
-#     client_secret: os.environ/GITHUB_OAUTH_CLIENT_SECRET
-#     scopes: ["public_repo", "user:email"]
-#     allowed_tools: ["list_tools"]
-#     # disallowed_tools: ["repo_delete"]
-
-litellm_settings:
-  callbacks: ["prometheus"]
-  custom_prometheus_metadata_labels: ["metadata.initiative", "metadata.business-unit"]
\ No newline at end of file
+mcp_servers:
+  local_fake_mcp:
+    url: "http://127.0.0.1:8001/mcp"
+    transport: "http"
+    description: "My custom MCP server"
+    auth_type: "api_key"
+    auth_value: "abc123"
\ No newline at end of file

From 3700e5d760e1bc44e77c1290dfc0dd7464791df2 Mon Sep 17 00:00:00 2001
From: Krrish Dholakia <krrishdholakia@gmail.com>
Date: Sat, 4 Oct 2025 18:34:47 -0700
Subject: [PATCH 2/4] feat(mcp_server_manager.py): add `static_header` support
 for MCP's

Allow admin to configure static custom headers to send on each mcp request to a backend server

Closes LIT-1186
---
 .../_experimental/mcp_server/mcp_server_manager.py    | 11 +++++++++++
 litellm/proxy/_new_secret_config.yaml                 |  3 ++-
 litellm/types/mcp_server/mcp_server_manager.py        |  5 ++++-
 3 files changed, 17 insertions(+), 2 deletions(-)

diff --git a/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py b/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
index bfe7a3e4679b..e228b3d6b05a 100644
--- a/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
+++ b/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
@@ -216,6 +216,7 @@ def load_servers_from_config(
                 allowed_tools=server_config.get("allowed_tools", None),
                 disallowed_tools=server_config.get("disallowed_tools", None),
                 access_groups=server_config.get("access_groups", None),
+                static_headers=server_config.get("static_headers", None),
             )
             self.config_mcp_servers[server_id] = new_server
         verbose_logger.debug(
@@ -475,6 +476,11 @@ async def _get_tools_from_server(
         client = None
 
         try:
+            if server.static_headers:
+                if extra_headers is None:
+                    extra_headers = {}
+                extra_headers.update(server.static_headers)
+
             client = self._create_mcp_client(
                 server=server,
                 mcp_auth_header=mcp_auth_header,
@@ -770,6 +776,11 @@ async def call_tool(
                 if header in raw_headers:
                     extra_headers[header] = raw_headers[header]
 
+        if mcp_server.static_headers:
+            if extra_headers is None:
+                extra_headers = {}
+            extra_headers.update(mcp_server.static_headers)
+
         client = self._create_mcp_client(
             server=mcp_server,
             mcp_auth_header=server_auth_header,
diff --git a/litellm/proxy/_new_secret_config.yaml b/litellm/proxy/_new_secret_config.yaml
index 50d36fee0480..7de2eaa43aa1 100644
--- a/litellm/proxy/_new_secret_config.yaml
+++ b/litellm/proxy/_new_secret_config.yaml
@@ -22,4 +22,5 @@ mcp_servers:
     transport: "http"
     description: "My custom MCP server"
     auth_type: "api_key"
-    auth_value: "abc123"
\ No newline at end of file
+    auth_value: "abc123"
+    static_headers: {"X-API-Key": "abc123"}
diff --git a/litellm/types/mcp_server/mcp_server_manager.py b/litellm/types/mcp_server/mcp_server_manager.py
index 3e0c2b20e393..5ad1fd6f244e 100644
--- a/litellm/types/mcp_server/mcp_server_manager.py
+++ b/litellm/types/mcp_server/mcp_server_manager.py
@@ -21,7 +21,7 @@ class MCPServer(BaseModel):
     authentication_token: Optional[str] = None
     mcp_info: Optional[MCPInfo] = None
     extra_headers: Optional[List[str]] = (
-        None  # allow admin to specify which headers to forward to the MCP server
+        None  # allow admin to specify which headers to forward from client to the MCP server
     )
     allowed_tools: Optional[List[str]] = None
     disallowed_tools: Optional[List[str]] = None
@@ -36,4 +36,7 @@ class MCPServer(BaseModel):
     args: Optional[List[str]] = None
     env: Optional[Dict[str, str]] = None
     access_groups: Optional[List[str]] = None
+    static_headers: Optional[Dict[str, str]] = (
+        None  # static headers to forward to the MCP server
+    )
     model_config = ConfigDict(arbitrary_types_allowed=True)

From 52d03a0211502d9a5f5e5ce43bd17a16a5841e2f Mon Sep 17 00:00:00 2001
From: Krrish Dholakia <krrishdholakia@gmail.com>
Date: Sat, 4 Oct 2025 19:01:07 -0700
Subject: [PATCH 3/4] docs(mcp.md): add docs

---
 docs/my-website/docs/mcp.md | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)

diff --git a/docs/my-website/docs/mcp.md b/docs/my-website/docs/mcp.md
index 50bd5aefa768..4cbaef42522a 100644
--- a/docs/my-website/docs/mcp.md
+++ b/docs/my-website/docs/mcp.md
@@ -182,6 +182,25 @@ mcp_servers:
     extra_headers: ["custom_key", "x-custom-header"]  # These headers will be forwarded from client
 ```
 
+### Static Headers
+
+Sometimes your MCP server needs specific headers on every request. Maybe it's an API key, maybe it's a custom header the server expects. Instead of configuring auth, you can just set them directly.
+
+```yaml title="config.yaml" showLineNumbers
+mcp_servers:
+  my_mcp_server:
+    url: "https://my-mcp-server.com/mcp"
+    static_headers:
+      X-API-Key: "abc123"
+      X-Custom-Header: "some-value"
+```
+
+These headers get sent with every request to the server. That's it.
+
+**When to use this:**
+- Your server needs custom headers that don't fit the standard auth patterns
+- You want full control over exactly what headers are sent
+- You're debugging and need to quickly add headers without changing auth configuration
 
 ### MCP Aliases
 

From 12726b0c336fafa3280e8d9e4b0df519a290e56c Mon Sep 17 00:00:00 2001
From: Krrish Dholakia <krrishdholakia@gmail.com>
Date: Mon, 6 Oct 2025 20:15:06 -0700
Subject: [PATCH 4/4] refactor(mcp_server_manager.py): refactor to maintain 50
 LOC requirement

---
 .../mcp_server/mcp_server_manager.py          | 35 ++++++++++++++-----
 1 file changed, 27 insertions(+), 8 deletions(-)

diff --git a/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py b/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
index 56030c9618de..7903e0c05762 100644
--- a/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
+++ b/litellm/proxy/_experimental/mcp_server/mcp_server_manager.py
@@ -775,14 +775,7 @@ async def call_tool(
             raise ValueError(f"Tool {name} not found")
 
         # Validate that the server from prefix matches the actual server (if prefix was used)
-        if server_name_from_prefix:
-            expected_prefix = get_server_prefix(mcp_server)
-            if normalize_server_name(server_name_from_prefix) != normalize_server_name(
-                expected_prefix
-            ):
-                raise ValueError(
-                    f"Tool {name} server prefix mismatch: expected {expected_prefix}, got {server_name_from_prefix}"
-                )
+        self._validate_server_prefix_match(name, server_name_from_prefix, mcp_server)
 
         #########################################################
         # Pre MCP Tool Call Hook
@@ -956,6 +949,32 @@ def _get_mcp_server_from_tool_name(self, tool_name: str) -> Optional[MCPServer]:
 
         return None
 
+    def _validate_server_prefix_match(
+        self,
+        tool_name: str,
+        server_name_from_prefix: Optional[str],
+        mcp_server: MCPServer,
+    ) -> None:
+        """
+        Validate that the server prefix from the tool name matches the actual server.
+
+        Args:
+            tool_name: Original tool name provided
+            server_name_from_prefix: Server name extracted from tool name prefix (if any)
+            mcp_server: The MCP server that was found for this tool
+
+        Raises:
+            ValueError: If the server prefix doesn't match the expected server
+        """
+        if server_name_from_prefix:
+            expected_prefix = get_server_prefix(mcp_server)
+            if normalize_server_name(server_name_from_prefix) != normalize_server_name(
+                expected_prefix
+            ):
+                raise ValueError(
+                    f"Tool {tool_name} server prefix mismatch: expected {expected_prefix}, got {server_name_from_prefix}"
+                )
+
     async def _add_mcp_servers_from_db_to_in_memory_registry(self):
         from litellm.proxy._experimental.mcp_server.db import get_all_mcp_servers
         from litellm.proxy.management_endpoints.mcp_management_endpoints import (