stacklok
diff --git a/‎cmd/thv/app/run_flags.go
Lines changed: 10 additions & 0 deletions b/‎cmd/thv/app/run_flags.go
Lines changed: 10 additions & 0 deletions
diff --git a/‎docs/cli/thv_run.md
Lines changed: 1 addition & 0 deletions b/‎docs/cli/thv_run.md
Lines changed: 1 addition & 0 deletions
diff --git a/‎pkg/mcp/tool_filter.go
Lines changed: 328 additions & 0 deletions b/‎pkg/mcp/tool_filter.go
Lines changed: 328 additions & 0 deletions
@@ -67,6 +67,9 @@ type RunFlags struct {
 
 	// Execution mode
 	Foreground bool
+
+	// Tools filter
+	ToolsFilter []string
 }
 
 // AddRunFlags adds all the run flags to a command
@@ -146,6 +149,12 @@ func AddRunFlags(cmd *cobra.Command, config *RunFlags) {
 		"Isolate the container network from the host (default: false)")
 	cmd.Flags().StringArrayVarP(&config.Labels, "label", "l", []string{}, "Set labels on the container (format: key=value)")
 	cmd.Flags().BoolVarP(&config.Foreground, "foreground", "f", false, "Run in foreground mode (block until container exits)")
+	cmd.Flags().StringArrayVar(
+		&config.ToolsFilter,
+		"tools",
+		nil,
+		"Filter MCP server tools (comma-separated list of tool names)",
+	)
 }
 
 // BuildRunnerConfig creates a runner.RunConfig from the configuration
@@ -252,6 +261,7 @@ func BuildRunnerConfig(
 		envVarValidator,
 		types.ProxyMode(runConfig.ProxyMode),
 		runConfig.Group,
+		runConfig.ToolsFilter,
 	)
 }
 
 
@@ -0,0 +1,328 @@
+package mcp
+
+import (
+	"bytes"
+	"encoding/json"
+	"errors"
+	"fmt"
+	"io"
+	"net/http"
+	"strings"
+
+	"github.com/stacklok/toolhive/pkg/logger"
+	"github.com/stacklok/toolhive/pkg/transport/types"
+)
+
+// Sentinel errors used by the tool filtering middleware.
+var (
+	// errToolNameNotFound reports that a tool entry or a tool call carries no
+	// string "name" value.
+	errToolNameNotFound = errors.New("tool name not found")
+	// errToolNotInFilter reports that the requested tool is not part of the
+	// configured filter.
+	errToolNotInFilter = errors.New("tool not in filter")
+	// errBug wraps failures that are not expected to happen in practice.
+	errBug = errors.New("there's a bug")
+)
+
+// NewToolFilterMiddleware creates an HTTP middleware that rewrites tools list
+// responses so that only the tools named in filterTools are returned to the
+// client.
+//
+// The response body is inspected either as a plain JSON payload or as an SSE
+// stream. In the SSE case the middleware looks for data lines shaped like:
+//
+//	event: message
+//	data: {"jsonrpc":"2.0","id":X,"result":{"tools":[...]}}
+//
+// When such a message is found, every tool whose name is not in filterTools is
+// removed from the list before the message is forwarded.
+//
+// An error is returned when filterTools is nil or empty.
+//
+// This middleware is designed to be used ONLY when tool filtering is enabled,
+// and expects the list of tools to be "correct" (i.e. not empty and not
+// containing nonexisting tools).
+func NewToolFilterMiddleware(filterTools []string) (types.Middleware, error) {
+	if len(filterTools) == 0 {
+		return nil, fmt.Errorf("tools list for filtering is empty")
+	}
+
+	// Build a set once so that per-response lookups do not scan the slice.
+	toolsMap := make(map[string]struct{}, len(filterTools))
+	for _, tool := range filterTools {
+		toolsMap[tool] = struct{}{}
+	}
+
+	return func(next http.Handler) http.Handler {
+		return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+			// NOTE: this middleware only checks the response body, whose
+			// format at this point is not yet known and might be either a
+			// JSON payload or an SSE stream.
+			//
+			// The way this is implemented is that we wrap the response writer
+			// in order to buffer the response body. Once Flush() is called, we
+			// process the buffer according to its content type and possibly
+			// modify it before returning it to the client.
+			//
+			// NOTE(review): buffered bytes are only forwarded when the next
+			// handler calls Flush(); confirm that every handler wrapped by
+			// this middleware does so.
+			rw := &toolFilterWriter{
+				ResponseWriter: w,
+				filterTools:    toolsMap,
+			}
+
+			// Call the next handler
+			next.ServeHTTP(rw, r)
+		})
+	}, nil
+}
+
+// NewToolCallFilterMiddleware creates an HTTP middleware that parses tool call
+// requests and rejects calls to tools that are not in the filter list.
+//
+// The middleware looks for JSON-RPC messages with:
+//   - method: tools/call
+//   - params: {"name": "tool_name"}
+//
+// Both a single JSON-RPC message and a JSON-RPC batch (a JSON array of
+// messages) are inspected; a batch is rejected as a whole as soon as one of
+// its calls targets a tool outside the filter. Anything that is not a tool
+// call is passed through untouched.
+//
+// An error is returned when filterTools is nil or empty.
+//
+// This middleware is designed to be used ONLY when tool filtering is enabled,
+// and expects the list of tools to be "correct" (i.e. not empty and not
+// containing nonexisting tools).
+func NewToolCallFilterMiddleware(filterTools []string) (types.Middleware, error) {
+	if len(filterTools) == 0 {
+		return nil, fmt.Errorf("tools list for filtering is empty")
+	}
+
+	// Build a set once so that per-request lookups do not scan the slice.
+	toolsMap := make(map[string]struct{}, len(filterTools))
+	for _, tool := range filterTools {
+		toolsMap[tool] = struct{}{}
+	}
+
+	return func(next http.Handler) http.Handler {
+		return http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
+			// Read the request body
+			bodyBytes, err := io.ReadAll(r.Body)
+			if err != nil {
+				// If we can't read the body, let the next handler deal with it
+				next.ServeHTTP(w, r)
+				return
+			}
+
+			// Restore the request body for downstream handlers
+			r.Body = io.NopCloser(bytes.NewBuffer(bodyBytes))
+
+			// Try to parse the request as one or more tool call requests. For
+			// each of them, check if the tool is in the filter. Messages that
+			// are not tool call requests are just passed through.
+			for _, request := range parseToolCallRequests(bodyBytes) {
+				if request.Params == nil || request.Method != "tools/call" {
+					continue
+				}
+
+				err := processToolCallRequest(toolsMap, request)
+
+				// NOTE: ideally, trying to call a tool that was filtered out by config
+				// should be equivalent to calling a nonexisting tool; in such cases and
+				// when the SSE transport is used, the behaviour of the official Python
+				// SDK is to return a 202 Accepted to THIS call and return a success
+				// message in the SSE stream saying that the tool does not exist.
+				//
+				// It basically fails successfully.
+				//
+				// Unfortunately, implementing this behaviour is not trivial and requires
+				// session management, as the SSE stream is managed by the proxy in an
+				// entirely different thread of execution. As a consequence, the best
+				// thing we can do that is still compliant with the spec is to return a
+				// 400 Bad Request to the client.
+				if errors.Is(err, errToolNotInFilter) {
+					w.WriteHeader(http.StatusBadRequest)
+					return
+				}
+				if err != nil {
+					// Any other failure (e.g. a call without a tool name) is
+					// left for the downstream handler to reject.
+					logger.Errorf("Error processing tool call of a filtered tool: %v", err)
+				}
+			}
+
+			next.ServeHTTP(w, r)
+		})
+	}, nil
+}
+
+// parseToolCallRequests decodes body as either a single JSON-RPC message or a
+// JSON-RPC batch. It returns nil when the body cannot be decoded, so that the
+// caller forwards it unchanged.
+func parseToolCallRequests(body []byte) []toolCallRequest {
+	trimmed := bytes.TrimSpace(body)
+	if len(trimmed) > 0 && trimmed[0] == '[' {
+		var batch []toolCallRequest
+		if err := json.Unmarshal(trimmed, &batch); err != nil {
+			return nil
+		}
+		return batch
+	}
+
+	var single toolCallRequest
+	if err := json.Unmarshal(trimmed, &single); err != nil {
+		return nil
+	}
+	return []toolCallRequest{single}
+}
+
+// toolFilterWriter wraps http.ResponseWriter to buffer the response body so
+// that it can be processed (as JSON or as an SSE stream) before it is written
+// to the client.
+//
+// buffer accumulates the bytes handed to Write until Flush is called, and
+// filterTools is the set of tool names passed to processBuffer on Flush.
+type toolFilterWriter struct {
+	http.ResponseWriter
+	buffer      []byte
+	filterTools map[string]struct{}
+}
+
+// WriteHeader forwards the status code to the wrapped ResponseWriter.
+//
+// The body may be rewritten by Flush, so a Content-Length announced by the
+// upstream handler can no longer be trusted: it is removed here and the
+// server is left to frame the response itself.
+func (rw *toolFilterWriter) WriteHeader(statusCode int) {
+	rw.ResponseWriter.Header().Del("Content-Length")
+	rw.ResponseWriter.WriteHeader(statusCode)
+}
+
+// Write appends data to the internal buffer and reports it as fully written.
+// Nothing is handed to the wrapped ResponseWriter here; that happens in Flush.
+func (rw *toolFilterWriter) Write(data []byte) (int, error) {
+	accepted := len(data)
+	rw.buffer = append(rw.buffer, data...)
+	return accepted, nil
+}
+
+// Flush processes the buffered data, writes the result to the underlying
+// ResponseWriter and then flushes it, if it supports flushing.
+//
+// When the response carries no Content-Type the buffer is forwarded
+// unchanged. Otherwise it is handed to processBuffer and whatever that
+// produced is forwarded; processing errors are logged, not returned.
+// In both cases the buffer is emptied afterwards so that the same bytes are
+// never written twice.
+func (rw *toolFilterWriter) Flush() {
+	if len(rw.buffer) > 0 {
+		// Only the media type matters; drop parameters such as charset and
+		// normalise spacing and case before comparing.
+		mimeType, _, _ := strings.Cut(rw.ResponseWriter.Header().Get("Content-Type"), ";")
+		mimeType = strings.ToLower(strings.TrimSpace(mimeType))
+
+		out := rw.buffer
+		if mimeType != "" {
+			var b bytes.Buffer
+			if err := processBuffer(rw.filterTools, rw.buffer, mimeType, &b); err != nil {
+				logger.Errorf("Error flushing response: %v", err)
+			}
+			out = b.Bytes()
+		}
+
+		if _, err := rw.ResponseWriter.Write(out); err != nil {
+			logger.Errorf("Error writing buffer: %v", err)
+		}
+		rw.buffer = rw.buffer[:0] // Reset buffer
+	}
+
+	if flusher, ok := rw.ResponseWriter.(http.Flusher); ok {
+		flusher.Flush()
+	}
+}
+
+// toolsListResponse is the subset of a JSON-RPC response needed to recognise
+// and rewrite a tools list. Result.Tools is nil when the message carries no
+// "tools" member, which is how callers tell other messages apart.
+type toolsListResponse struct {
+	JSONRPC string          `json:"jsonrpc"`
+	ID      any             `json:"id"`
+	Result  toolsListResult `json:"result"`
+}
+
+// toolsListResult is the "result" object of a tools list response. Members
+// other than "tools" (for example "nextCursor") are kept verbatim so that
+// re-encoding a filtered response does not drop them.
+type toolsListResult struct {
+	Tools *[]map[string]any
+	extra map[string]json.RawMessage
+}
+
+// UnmarshalJSON decodes the "tools" member into Tools and stores every other
+// member untouched.
+func (r *toolsListResult) UnmarshalJSON(data []byte) error {
+	var members map[string]json.RawMessage
+	if err := json.Unmarshal(data, &members); err != nil {
+		return err
+	}
+
+	r.Tools = nil
+	r.extra = nil
+	if raw, ok := members["tools"]; ok {
+		if err := json.Unmarshal(raw, &r.Tools); err != nil {
+			return err
+		}
+		delete(members, "tools")
+	}
+	if len(members) > 0 {
+		r.extra = members
+	}
+	return nil
+}
+
+// MarshalJSON encodes Tools under "tools" next to the members preserved by
+// UnmarshalJSON.
+func (r toolsListResult) MarshalJSON() ([]byte, error) {
+	members := make(map[string]any, len(r.extra)+1)
+	for key, raw := range r.extra {
+		members[key] = raw
+	}
+	members["tools"] = r.Tools
+	return json.Marshal(members)
+}
+
+// toolCallRequest is the subset of a JSON-RPC request needed to recognise a
+// tool call. Params is a pointer so that a message without a "params" member
+// (Params == nil) can be told apart from one with an empty object.
+type toolCallRequest struct {
+	JSONRPC string          `json:"jsonrpc"`
+	ID      any             `json:"id"`
+	Method  string          `json:"method"`
+	Params  *map[string]any `json:"params,omitempty"`
+}
+
+// processBuffer writes buffer to w, filtering any tools list it contains
+// according to filterTools. How the buffer is interpreted depends on mimeType:
+//
+//   - application/json: the buffer is treated as one JSON document. A tools
+//     list response is re-encoded with only the allowed tools; any other
+//     payload is forwarded unchanged.
+//   - text/event-stream: the buffer is handed to processSSEEvents.
+//
+// Any other MIME type yields an error and nothing is written. An empty buffer
+// is a no-op.
+//
+// NOTE(review): a JSON document split across several flushes cannot be parsed
+// here and is forwarded as-is; confirm upstream responses arrive in one piece.
+func processBuffer(filterTools map[string]struct{}, buffer []byte, mimeType string, w io.Writer) error {
+	if len(buffer) == 0 {
+		return nil
+	}
+
+	switch mimeType {
+	case "application/json":
+		var resp toolsListResponse
+		if err := json.Unmarshal(buffer, &resp); err == nil && resp.Result.Tools != nil {
+			return processToolsListResponse(filterTools, resp, w)
+		}
+
+		// Not a tools list (or not decodable): there is nothing to filter,
+		// so the payload must reach the client untouched.
+		if _, err := w.Write(buffer); err != nil {
+			return fmt.Errorf("%w: %v", errBug, err)
+		}
+		return nil
+	case "text/event-stream":
+		return processSSEEvents(filterTools, buffer, w)
+	default:
+		// NOTE: Content-Type header is mandatory in the spec, and as of the
+		// time of this writing, the only allowed content types are
+		// * application/json, and
+		// * text/event-stream
+		//
+		// As a result, we should never get here and it is safe to return an
+		// error.
+		return fmt.Errorf("unsupported mime type: %s", mimeType)
+	}
+}
+
+// processSSEEvents copies an SSE buffer to w line by line, replacing every
+// "data:" line that holds a tools list response with a filtered version of it.
+//
+// The line separator is detected from the buffer ("\r\n", "\n" or "\r", in
+// that order of preference); a buffer without any separator is rejected.
+// All other lines, including the blank lines that delimit events, are written
+// back exactly as received so that event boundaries are preserved.
+//
+//nolint:gocyclo
+func processSSEEvents(filterTools map[string]struct{}, buffer []byte, w io.Writer) error {
+	var linesep []byte
+	switch {
+	case bytes.Contains(buffer, []byte("\r\n")):
+		linesep = []byte("\r\n")
+	case bytes.Contains(buffer, []byte("\n")):
+		linesep = []byte("\n")
+	case bytes.Contains(buffer, []byte("\r")):
+		linesep = []byte("\r")
+	default:
+		return fmt.Errorf("unsupported separator: %s", string(buffer))
+	}
+
+	emit := func(p []byte) error {
+		if _, err := w.Write(p); err != nil {
+			return fmt.Errorf("%w: %v", errBug, err)
+		}
+		return nil
+	}
+
+	for i, line := range bytes.Split(buffer, linesep) {
+		// Re-insert exactly the separators that Split removed.
+		if i > 0 {
+			if err := emit(linesep); err != nil {
+				return err
+			}
+		}
+
+		if data, ok := bytes.CutPrefix(line, []byte("data:")); ok {
+			var resp toolsListResponse
+			if err := json.Unmarshal(data, &resp); err == nil && resp.Result.Tools != nil {
+				var encoded bytes.Buffer
+				if err := processToolsListResponse(filterTools, resp, &encoded); err != nil {
+					return err
+				}
+
+				// The encoder terminates its output with a newline; the
+				// line ending is written by this loop instead, and the
+				// field name stripped above has to be put back.
+				if err := emit([]byte("data: ")); err != nil {
+					return err
+				}
+				if err := emit(bytes.TrimRight(encoded.Bytes(), "\r\n")); err != nil {
+					return err
+				}
+				continue
+			}
+		}
+
+		if err := emit(line); err != nil {
+			return err
+		}
+	}
+
+	return nil
+}
+
+// processToolsListResponse keeps only the tools whose name is in filterTools
+// and JSON-encodes the resulting response to w.
+//
+// errToolNameNotFound is returned, and nothing is written, as soon as a tool
+// entry has no string "name". Encoding failures are wrapped in errBug.
+func processToolsListResponse(filterTools map[string]struct{}, toolsListResponse toolsListResponse, w io.Writer) error {
+	upstream := *toolsListResponse.Result.Tools
+
+	// Must stay a non-nil slice so that an empty result is encoded as [].
+	kept := []map[string]any{}
+	for i := range upstream {
+		name, isString := upstream[i]["name"].(string)
+		if !isString {
+			return errToolNameNotFound
+		}
+		if !isToolInFilter(filterTools, name) {
+			continue
+		}
+		kept = append(kept, upstream[i])
+	}
+	toolsListResponse.Result.Tools = &kept
+
+	encodeErr := json.NewEncoder(w).Encode(toolsListResponse)
+	if encodeErr != nil {
+		return fmt.Errorf("%w: %v", errBug, encodeErr)
+	}
+	return nil
+}
+
+// processToolCallRequest decides whether a tool call may go through.
+//
+// It returns nil when the called tool is in filterTools, errToolNotInFilter
+// when it is not, and errToolNameNotFound when the params carry no string
+// "name". The request's Params must be non-nil.
+func processToolCallRequest(filterTools map[string]struct{}, toolCallRequest toolCallRequest) error {
+	params := *toolCallRequest.Params
+	name, isString := params["name"].(string)
+
+	switch {
+	case !isString:
+		return errToolNameNotFound
+	case isToolInFilter(filterTools, name):
+		return nil
+	default:
+		return errToolNotInFilter
+	}
+}
+
+// isToolInFilter reports whether toolName is a key of the filterTools set.
+func isToolInFilter(filterTools map[string]struct{}, toolName string) bool {
+	if _, present := filterTools[toolName]; present {
+		return true
+	}
+	return false
+}