
Commit ba79bfa

controller: removes openAIPrefix config (envoyproxy#1063)
**Description**

The configurability for "/v1" was introduced in envoyproxy#1020. However, it is an unnecessary configuration that no one has asked for at the moment, given that we keep the rootPrefix for the separation concern between AIGatewayRoutes and HTTPRoutes. This partially reverts envoyproxy#1020 and removes the config so that we have a simpler configuration overall. We can revisit this if anyone asks for it later; if so, that will be the time to think about a Gateway-level CRD.

**Related Issues/PRs (if applicable)**

Follow-up on envoyproxy#1020

---------

Signed-off-by: Takeshi Yoneda <[email protected]>
1 parent f0eeed8 commit ba79bfa

File tree: 9 files changed, +67 -99 lines changed

cmd/controller/main.go

Lines changed: 0 additions & 8 deletions

@@ -44,7 +44,6 @@ type flags struct {
 	caBundleName               string
 	metricsRequestHeaderLabels string
 	rootPrefix                 string
-	openAIPrefix               string
 	extProcExtraEnvVars        string
 }

@@ -123,11 +122,6 @@ func parseAndValidateFlags(args []string) (flags, error) {
 		"/",
 		`The root prefix for all supported endpoints. Default is "/"`,
 	)
-	openAIPrefix := fs.String(
-		"openAIPrefix",
-		"/v1",
-		`The prefix for OpenAI endpoints following *after* the root prefix. Default is "/v1".`,
-	)
 	extProcExtraEnvVars := fs.String(
 		"extProcExtraEnvVars",
 		"",
@@ -185,7 +179,6 @@ func parseAndValidateFlags(args []string) (flags, error) {
 		caBundleName:               *caBundleName,
 		metricsRequestHeaderLabels: *metricsRequestHeaderLabels,
 		rootPrefix:                 *rootPrefix,
-		openAIPrefix:               *openAIPrefix,
 		extProcExtraEnvVars:        *extProcExtraEnvVars,
 	}, nil
 }
@@ -261,7 +254,6 @@ func main() {
 		UDSPath:                    extProcUDSPath,
 		MetricsRequestHeaderLabels: flags.metricsRequestHeaderLabels,
 		RootPrefix:                 flags.rootPrefix,
-		OpenAIPrefix:               flags.openAIPrefix,
 		ExtProcExtraEnvVars:        flags.extProcExtraEnvVars,
 	}); err != nil {
 		setupLog.Error(err, "failed to start controller")
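For orientation, here is a minimal, self-contained sketch of the flag-parsing pattern that remains after this change. The flag name, default value, and help text come from the diff; the FlagSet name, the trimmed flags struct, and the main function are illustrative assumptions, not the repository code.

```go
package main

import (
	"flag"
	"fmt"
	"os"
)

// flags holds only the prefix-related configuration that survives this change.
// openAIPrefix has been removed; rootPrefix is the single knob left.
type flags struct {
	rootPrefix string
}

// parseFlags mirrors the fs.String(...) pattern shown in the diff above.
func parseFlags(args []string) (flags, error) {
	fs := flag.NewFlagSet("controller", flag.ContinueOnError)
	rootPrefix := fs.String(
		"rootPrefix",
		"/",
		`The root prefix for all supported endpoints. Default is "/"`,
	)
	if err := fs.Parse(args); err != nil {
		return flags{}, err
	}
	return flags{rootPrefix: *rootPrefix}, nil
}

func main() {
	f, err := parseFlags(os.Args[1:])
	if err != nil {
		fmt.Fprintln(os.Stderr, err)
		os.Exit(1)
	}
	fmt.Println("rootPrefix:", f.rootPrefix)
}
```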

cmd/extproc/mainlib/main.go

Lines changed: 10 additions & 19 deletions

@@ -45,10 +45,8 @@ type extProcFlags struct {
 	metricsPort                int    // HTTP port for the metrics server.
 	healthPort                 int    // HTTP port for the health check server.
 	metricsRequestHeaderLabels string // comma-separated key-value pairs for mapping HTTP request headers to Prometheus metric labels.
-	// openAIPrefix is the OpenAI API prefix to be used for the external processor.
-	openAIPrefix string
-	// anthropicPrefix is the Anthropic API prefix to be used for the external processor.
-	anthropicPrefix string
+	// rootPrefix is the root prefix for all the processors.
+	rootPrefix string
 }

 // parseAndValidateFlags parses and validates the flags passed to the external processor.
@@ -82,17 +80,10 @@ func parseAndValidateFlags(args []string) (extProcFlags, error) {
 		"",
 		"Comma-separated key-value pairs for mapping HTTP request headers to Prometheus metric labels. Format: x-team-id:team_id,x-user-id:user_id.",
 	)
-	fs.StringVar(&flags.openAIPrefix,
-		"openAIPrefix",
-		"/v1",
-		"OpenAI endpoint prefix to be used for the external processor. This is used to route requests to the correct handler. "+
-			"Defaults to /v1, which is the standard OpenAI API prefix.",
-	)
-	fs.StringVar(&flags.anthropicPrefix,
-		"anthropicPrefix",
-		"/anthropic/v1",
-		"Anthropic endpoint prefix to be used for the external processor. This is used to route requests to the correct handler. "+
-			"Defaults to /anthropic/v1, which provides clear separation from OpenAI endpoints.",
+	fs.StringVar(&flags.rootPrefix,
+		"rootPrefix",
+		"/",
+		"The root path prefix for all the processors.",
 	)

 	if err := fs.Parse(args); err != nil {
@@ -180,10 +171,10 @@ func Main(ctx context.Context, args []string, stderr io.Writer) (err error) {
 	if err != nil {
 		return fmt.Errorf("failed to create external processor server: %w", err)
 	}
-	server.Register(path.Join(flags.openAIPrefix, "/chat/completions"), extproc.ChatCompletionProcessorFactory(chatCompletionMetrics))
-	server.Register(path.Join(flags.openAIPrefix, "/embeddings"), extproc.EmbeddingsProcessorFactory(embeddingsMetrics))
-	server.Register(path.Join(flags.openAIPrefix, "/models"), extproc.NewModelsProcessor)
-	server.Register(path.Join(flags.anthropicPrefix, "/messages"), extproc.MessagesProcessorFactory(chatCompletionMetrics))
+	server.Register(path.Join(flags.rootPrefix, "/v1/chat/completions"), extproc.ChatCompletionProcessorFactory(chatCompletionMetrics))
+	server.Register(path.Join(flags.rootPrefix, "/v1/embeddings"), extproc.EmbeddingsProcessorFactory(embeddingsMetrics))
+	server.Register(path.Join(flags.rootPrefix, "/v1/models"), extproc.NewModelsProcessor)
+	server.Register(path.Join(flags.rootPrefix, "/anthropic/v1/messages"), extproc.MessagesProcessorFactory(chatCompletionMetrics))

 	if err := extproc.StartConfigWatcher(ctx, flags.configPath, server, l, time.Second*5); err != nil {
 		return fmt.Errorf("failed to start config watcher: %w", err)

cmd/extproc/mainlib/main_test.go

Lines changed: 46 additions & 45 deletions

@@ -33,76 +33,76 @@ import (
 func Test_parseAndValidateFlags(t *testing.T) {
 	t.Run("ok extProcFlags", func(t *testing.T) {
 		for _, tc := range []struct {
-			name         string
-			args         []string
-			configPath   string
-			addr         string
-			openAIPRefix string
-			logLevel     slog.Level
+			name       string
+			args       []string
+			configPath string
+			addr       string
+			rootPrefix string
+			logLevel   slog.Level
 		}{
 			{
-				name:         "minimal extProcFlags",
-				args:         []string{"-configPath", "/path/to/config.yaml"},
-				configPath:   "/path/to/config.yaml",
-				addr:         ":1063",
-				openAIPRefix: "/v1",
-				logLevel:     slog.LevelInfo,
+				name:       "minimal extProcFlags",
+				args:       []string{"-configPath", "/path/to/config.yaml"},
+				configPath: "/path/to/config.yaml",
+				addr:       ":1063",
+				rootPrefix: "/",
+				logLevel:   slog.LevelInfo,
 			},
 			{
-				name:         "custom addr",
-				args:         []string{"-configPath", "/path/to/config.yaml", "-extProcAddr", "unix:///tmp/ext_proc.sock"},
-				configPath:   "/path/to/config.yaml",
-				addr:         "unix:///tmp/ext_proc.sock",
-				openAIPRefix: "/v1",
-				logLevel:     slog.LevelInfo,
+				name:       "custom addr",
+				args:       []string{"-configPath", "/path/to/config.yaml", "-extProcAddr", "unix:///tmp/ext_proc.sock"},
+				configPath: "/path/to/config.yaml",
+				addr:       "unix:///tmp/ext_proc.sock",
+				rootPrefix: "/",
+				logLevel:   slog.LevelInfo,
 			},
 			{
-				name:         "log level debug",
-				args:         []string{"-configPath", "/path/to/config.yaml", "-logLevel", "debug"},
-				configPath:   "/path/to/config.yaml",
-				addr:         ":1063",
-				openAIPRefix: "/v1",
-				logLevel:     slog.LevelDebug,
+				name:       "log level debug",
+				args:       []string{"-configPath", "/path/to/config.yaml", "-logLevel", "debug"},
+				configPath: "/path/to/config.yaml",
+				addr:       ":1063",
+				rootPrefix: "/",
+				logLevel:   slog.LevelDebug,
 			},
 			{
-				name:         "log level warn",
-				args:         []string{"-configPath", "/path/to/config.yaml", "-logLevel", "warn"},
-				configPath:   "/path/to/config.yaml",
-				addr:         ":1063",
-				openAIPRefix: "/v1",
-				logLevel:     slog.LevelWarn,
+				name:       "log level warn",
+				args:       []string{"-configPath", "/path/to/config.yaml", "-logLevel", "warn"},
+				configPath: "/path/to/config.yaml",
+				addr:       ":1063",
+				rootPrefix: "/",
+				logLevel:   slog.LevelWarn,
 			},
 			{
-				name:         "log level error",
-				args:         []string{"-configPath", "/path/to/config.yaml", "-logLevel", "error"},
-				configPath:   "/path/to/config.yaml",
-				addr:         ":1063",
-				openAIPRefix: "/v1",
-				logLevel:     slog.LevelError,
+				name:       "log level error",
+				args:       []string{"-configPath", "/path/to/config.yaml", "-logLevel", "error"},
+				configPath: "/path/to/config.yaml",
+				addr:       ":1063",
+				rootPrefix: "/",
+				logLevel:   slog.LevelError,
 			},
 			{
 				name: "all extProcFlags",
 				args: []string{
 					"-configPath", "/path/to/config.yaml",
 					"-extProcAddr", "unix:///tmp/ext_proc.sock",
 					"-logLevel", "debug",
-					"-openAIPrefix", "/foo/bar/v1",
+					"-rootPrefix", "/foo/bar/",
 				},
-				configPath:   "/path/to/config.yaml",
-				addr:         "unix:///tmp/ext_proc.sock",
-				openAIPRefix: "/foo/bar/v1",
-				logLevel:     slog.LevelDebug,
+				configPath: "/path/to/config.yaml",
+				addr:       "unix:///tmp/ext_proc.sock",
+				rootPrefix: "/foo/bar/",
+				logLevel:   slog.LevelDebug,
 			},
 			{
 				name: "with header mapping",
 				args: []string{
 					"-configPath", "/path/to/config.yaml",
 					"-metricsRequestHeaderLabels", "x-team-id:team_id,x-user-id:user_id",
 				},
-				configPath:   "/path/to/config.yaml",
-				openAIPRefix: "/v1",
-				addr:         ":1063",
-				logLevel:     slog.LevelInfo,
+				configPath: "/path/to/config.yaml",
+				rootPrefix: "/",
+				addr:       ":1063",
+				logLevel:   slog.LevelInfo,
 			},
 		} {
 			t.Run(tc.name, func(t *testing.T) {
@@ -111,6 +111,7 @@ func Test_parseAndValidateFlags(t *testing.T) {
 				assert.Equal(t, tc.configPath, flags.configPath)
 				assert.Equal(t, tc.addr, flags.extProcAddr)
 				assert.Equal(t, tc.logLevel, flags.logLevel)
+				assert.Equal(t, tc.rootPrefix, flags.rootPrefix)
 			})
 		}
 	})

internal/controller/controller.go

Lines changed: 1 addition & 4 deletions

@@ -8,7 +8,6 @@ package controller
 import (
 	"context"
 	"fmt"
-	"path"

 	egv1a1 "github.com/envoyproxy/gateway/api/v1alpha1"
 	"github.com/go-logr/logr"
@@ -74,8 +73,6 @@ type Options struct {
 	MetricsRequestHeaderLabels string
 	// RootPrefix is the root prefix for all the routes handled by the AI Gateway.
 	RootPrefix string
-	// OpenAIEndpointsPrefix is the prefix for OpenAI endpoints that follow after the root prefix.
-	OpenAIPrefix string
 	// ExtProcExtraEnvVars is the semicolon-separated key=value pairs for extra environment variables in extProc container.
 	ExtProcExtraEnvVars string
 }
@@ -186,7 +183,7 @@ func StartControllers(ctx context.Context, mgr manager.Manager, config *rest.Con
 		options.ExtProcLogLevel,
 		options.UDSPath,
 		options.MetricsRequestHeaderLabels,
-		path.Join(options.RootPrefix, options.OpenAIPrefix),
+		options.RootPrefix,
 		options.ExtProcExtraEnvVars,
 	))
 	mgr.GetWebhookServer().Register("/mutate", &webhook.Admission{Handler: h})

internal/controller/gateway_mutator.go

Lines changed: 4 additions & 4 deletions

@@ -37,13 +37,13 @@ type gatewayMutator struct {
 	extProcLogLevel            string
 	udsPath                    string
 	metricsRequestHeaderLabels string
-	openAIPrefix               string
+	rootPrefix                 string
 	extProcExtraEnvVars        []corev1.EnvVar
 }

 func newGatewayMutator(c client.Client, kube kubernetes.Interface, logger logr.Logger,
 	extProcImage string, extProcImagePullPolicy corev1.PullPolicy, extProcLogLevel,
-	udsPath, metricsRequestHeaderLabels, openAIPrefix, extProcExtraEnvVars string,
+	udsPath, metricsRequestHeaderLabels, rootPrefix, extProcExtraEnvVars string,
 ) *gatewayMutator {
 	var parsedEnvVars []corev1.EnvVar
 	if extProcExtraEnvVars != "" {
@@ -63,7 +63,7 @@ func newGatewayMutator(c client.Client, kube kubernetes.Interface, logger logr.L
 		logger:                     logger,
 		udsPath:                    udsPath,
 		metricsRequestHeaderLabels: metricsRequestHeaderLabels,
-		openAIPrefix:               openAIPrefix,
+		rootPrefix:                 rootPrefix,
 		extProcExtraEnvVars:        parsedEnvVars,
 	}
 }
@@ -95,7 +95,7 @@ func (g *gatewayMutator) buildExtProcArgs(filterConfigFullPath string, extProcMe
 		"-extProcAddr", "unix://" + g.udsPath,
 		"-metricsPort", fmt.Sprintf("%d", extProcMetricsPort),
 		"-healthPort", fmt.Sprintf("%d", extProcHealthPort),
-		"-openAIPrefix", g.openAIPrefix,
+		"-rootPrefix", g.rootPrefix,
 	}

 	// Add metrics header label mapping if configured.
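A simplified sketch of the argument-assembly pattern this mutator uses, with a free-standing function standing in for the real gatewayMutator method; the flag names mirror the diff, while the function signature and the sample values are hypothetical.

```go
package main

import "fmt"

// buildExtProcArgs assembles the CLI arguments passed to the extproc container.
// After this change, -rootPrefix is the only prefix-related flag that is set.
func buildExtProcArgs(udsPath, rootPrefix string, metricsPort, healthPort int) []string {
	return []string{
		"-extProcAddr", "unix://" + udsPath,
		"-metricsPort", fmt.Sprintf("%d", metricsPort),
		"-healthPort", fmt.Sprintf("%d", healthPort),
		"-rootPrefix", rootPrefix,
	}
}

func main() {
	// Sample values for illustration only.
	args := buildExtProcArgs("/var/run/extproc.sock", "/", 9190, 8081)
	fmt.Println(args)
}
```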

internal/extproc/server.go

Lines changed: 1 addition & 0 deletions

@@ -102,6 +102,7 @@ func (s *Server) LoadConfig(ctx context.Context, config *filterapi.Config) error

 // Register a new processor for the given request path.
 func (s *Server) Register(path string, newProcessor ProcessorFactory) {
+	s.logger.Info("Registering processor", slog.String("path", path))
 	s.processorFactories[path] = newProcessor
 }

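For readers unfamiliar with the extproc server, a much-simplified sketch of what Register does: it keeps a path-keyed map of processor factories and now logs each registration. The lowercase types below are stand-ins, not the repository's Server or ProcessorFactory definitions.

```go
package main

import (
	"fmt"
	"log/slog"
)

// processorFactory stands in for the real ProcessorFactory type; here it just
// returns a label so the example stays self-contained.
type processorFactory func() string

// server keeps a path-keyed registry of processor factories, mirroring the
// structure suggested by the diff.
type server struct {
	logger             *slog.Logger
	processorFactories map[string]processorFactory
}

// Register maps a request path to the factory that handles it, logging the
// registration the way the added line in the diff does.
func (s *server) Register(path string, newProcessor processorFactory) {
	s.logger.Info("Registering processor", slog.String("path", path))
	s.processorFactories[path] = newProcessor
}

func main() {
	s := &server{logger: slog.Default(), processorFactories: map[string]processorFactory{}}
	s.Register("/v1/chat/completions", func() string { return "chat-completions" })
	s.Register("/v1/models", func() string { return "models" })
	fmt.Println(s.processorFactories["/v1/models"]())
}
```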

manifests/charts/ai-gateway-helm/templates/deployment.yaml

Lines changed: 0 additions & 1 deletion

@@ -59,7 +59,6 @@ spec:
             - --enableLeaderElection=true
             {{- end }}
             - --rootPrefix={{ .Values.endpointConfig.rootPrefix }}
-            - --openAIPrefix={{ .Values.endpointConfig.openAIPrefix }}
          livenessProbe:
            grpc:
              port: 1063

manifests/charts/ai-gateway-helm/values.yaml

Lines changed: 5 additions & 13 deletions

@@ -6,22 +6,14 @@
 # Default values for ai-gateway-helm.

 # Global configuration for the endpoints supported by the AI Gateway.
-#
-# By default, the AI Gateway will assume that the downstream client's OpenAI SDK will talk to the Gateway using the base_url
-# set to "http://<gateway-hostname>/v1" which has the default "/v1" prefix in the base_url.
-#
-# By using this configuration, you can change the prefix for the OpenAI endpoints as well as the future non-OpenAI endpoints.
-# For example, when you can configure the rootPrefix to "/ai" and the openAIPrefix to "/openai/v1" which will result in the
-# OpenAI endpoints being served at "http://<gateway-hostname>/ai/openai/v1". This *will* become useful when you add support for
-# other input schemas like Anthropic, Google Gemini, etc. and you want to serve them under a different prefix to avoid conflicts.
-# Follow the issues https://github.com/envoyproxy/ai-gateway/issues/847 as well as https://github.com/envoyproxy/ai-gateway/issues/948 for detail.
 endpointConfig:
   # The prefix for all the routes served by the AI Gateway. Defaulting to "/". All the generated routes will have this prefix.
+  #
+  # With the default "/", the AI Gateway will assume that the downstream client's OpenAI SDK will talk to the Gateway using the base_url
+  # set to "http://<gateway-hostname>/v1" which has the default "/v1" prefix in the base_url.
+  #
+  # This can be used for providing a separation between AIGatewayRoutes and normal HTTPRoutes when the top level "/v1/" is not desired.
   rootPrefix: "/"
-  # The prefix for the OpenAI endpoints. Defaulting to "/v1". This comes **after** the rootPrefix. E.g. if the rootPrefix is "/ai" and the openAIPrefix is "/v1",
-  # the OpenAI endpoints will be served at "/ai/v1" which requires the base_url set to "http://<gateway-hostname>/ai/v1".
-  openAIPrefix: "/v1"
-  # TODO: addr more input schemas. E.g. Anthropic https://github.com/envoyproxy/ai-gateway/issues/847

 extProc:
   image:
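To illustrate the base_url comment above, a hedged Go sketch of how a client URL is composed under the default rootPrefix of "/"; the gateway hostname is a placeholder, not a value from the chart.

```go
package main

import (
	"fmt"
	"net/url"
	"path"
)

func main() {
	// Hypothetical gateway hostname; replace with your Gateway's address.
	base := &url.URL{Scheme: "http", Host: "ai-gateway.example.com"}

	// With rootPrefix "/", the OpenAI-compatible base_url is "http://<gateway-hostname>/v1".
	rootPrefix := "/"
	base.Path = path.Join(rootPrefix, "/v1")
	fmt.Println("base_url:", base.String())

	// Chat completions live under the base_url.
	endpoint := *base
	endpoint.Path = path.Join(base.Path, "/chat/completions")
	fmt.Println("chat completions endpoint:", endpoint.String())
}
```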

site/docs/capabilities/llm-integrations/supported-endpoints.md

Lines changed: 0 additions & 5 deletions

@@ -10,11 +10,6 @@ The Envoy AI Gateway provides OpenAI-compatible API endpoints for routing and ma

 The Envoy AI Gateway acts as a proxy that accepts OpenAI-compatible requests and routes them to various AI providers. While it maintains compatibility with the OpenAI API specification, it currently supports a subset of the full OpenAI API.

-:::tip
-`/v1` prefix on OpenAI API endpoints is configurable via Envoy AI Gateway installation options. The default is `/v1` unless specified otherwise.
-Please refer to the `endpointConfig` option in the [helm values file](https://github.com/envoyproxy/ai-gateway/blob/main/manifests/charts/ai-gateway-helm/values.yaml) for details.
-:::
-
 ## Supported Endpoints

 ### Chat Completions
