Configure the tool_choice to use a specific tool

MondayCha · MondayCha · commit 149a0f40a596 · 2025-10-28T00:00:08.000+08:00
Signed-off-by: MondayCha <mondaycha@outlook.com>
diff --git a/pkg/common/tools_utils.go b/pkg/common/tools_utils.go
@@ -21,6 +21,7 @@ import (
 	"fmt"
 
 	openaiserverapi "github.com/llm-d/llm-d-inference-sim/pkg/openai-server-api"
+	"github.com/openai/openai-go/v3/packages/param"
 	"github.com/santhosh-tekuri/jsonschema/v5"
 )
 
@@ -52,24 +53,88 @@ var fakeStringArguments = []string{
 	`lifetime`,
 }
 
-// CreateToolCalls creates and returns response payload based on this request
-// (tool calls or nothing in case we randomly choose not to generate calls),
-// and the number of generated completion token sand the finish reason
-func CreateToolCalls(tools []openaiserverapi.Tool, toolChoice string, config *Configuration) ([]openaiserverapi.ToolCall, int, error) {
-	// This function is called if tool choice is either 'required' or 'auto'.
-	// In case of 'required' at least one tool call has to be created, and we randomly choose
-	// the number of calls starting from one. Otherwise, we start from 0, and in case we randomly
-	// choose the number of calls to be 0, response text will be generated instead of a tool call.
+// IsToolChoiceNone reports whether tool_choice was sent as the string "none".
+func IsToolChoiceNone(toolChoice openaiserverapi.ToolChoice) bool {
+	// With the string option omitted there is nothing to compare against.
+	if param.IsOmitted(toolChoice.OfAuto) {
+		return false
+	}
+	return toolChoice.OfAuto.Or("") == ToolChoiceNone
+}
+
+// CreateToolCalls creates and returns tool calls based on the request's tool
+// definitions and tool_choice parameter.
+// The tool_choice parameter controls how the model responds to function calls:
+//   - "none": The model does not call any tools. This case should be handled
+//     before calling this function.
+//   - "auto": The model can choose to either generate a message or call one or
+//     more tools. This is the default behavior.
+//   - "required": The model must call one or more tools.
+//   - Specific function: A specific tool can be forced by providing an object
+//     like `{"type": "function", "function": {"name": "my_function"}}`. The
+//     model will be constrained to call that exact tool.
+//
+// This function returns the generated tool calls, the number of completion
+// tokens used, and an error if one occurs (e.g., if a specified tool is not found).
+func CreateToolCalls(
+	tools []openaiserverapi.Tool,
+	toolChoice openaiserverapi.ToolChoice,
+	config *Configuration,
+) ([]openaiserverapi.ToolCall, int, error) {
+	// If a specific function is required.
+	if functionChoice := toolChoice.GetFunction(); functionChoice != nil {
+		requiredFuncName := functionChoice.Name
+		var targetTool *openaiserverapi.Tool
+
+		// Find the specified tool in the list of available tools.
+		for i, tool := range tools {
+			if tool.Function.Name == requiredFuncName {
+				targetTool = &tools[i]
+				break
+			}
+		}
+
+		if targetTool == nil {
+			return nil, 0, fmt.Errorf("tool with name '%s' requested in tool_choice but not found in the tools list", requiredFuncName)
+		}
+
+		// Generate arguments for the specific tool.
+		args, err := generateToolArguments(*targetTool, config)
+		if err != nil {
+			return nil, 0, err
+		}
+		argsJson, err := json.Marshal(args)
+		if err != nil {
+			return nil, 0, err
+		}
+
+		call := openaiserverapi.ToolCall{
+			Function: openaiserverapi.FunctionCall{
+				Arguments:          string(argsJson),
+				TokenizedArguments: Tokenize(string(argsJson)),
+				Name:               &targetTool.Function.Name,
+			},
+			ID:    "chatcmpl-tool-" + RandomNumericString(10),
+			Type:  "function",
+			Index: 0,
+		}
+		calls := []openaiserverapi.ToolCall{call}
+		return calls, CountTokensForToolCalls(calls), nil
+	}
+
+	// Tool choice is 'auto' or 'required'.
+	// In 'required' mode, at least one tool call must be created.
+	// In 'auto' mode, the number of calls can be zero, leading to a text response instead.
 	min := 0
-	if toolChoice == ToolChoiceRequired {
+	if !param.IsOmitted(toolChoice.OfAuto) && toolChoice.OfAuto.Or("") == ToolChoiceRequired {
 		min = 1
 	}
 	numberOfCalls := RandomInt(min, len(tools))
 	if numberOfCalls == 0 {
 		return nil, 0, nil
 	}
 
-	calls := make([]openaiserverapi.ToolCall, 0)
+	calls := make([]openaiserverapi.ToolCall, 0, numberOfCalls)
 	for i := range numberOfCalls {
 		// Randomly choose which tools to call. We may call the same tool more than once.
 		index := RandomInt(0, len(tools)-1)
diff --git a/pkg/llm-d-inference-sim/tools_test.go b/pkg/llm-d-inference-sim/tools_test.go
@@ -499,6 +499,59 @@ var _ = Describe("Simulator for request with tools", func() {
 		Entry(nil, common.ModeRandom),
 	)
 
+	DescribeTable("no streaming, a specific tool",
+		func(mode string, specificTool string) {
+			ctx := context.TODO()
+			client, err := startServer(ctx, mode)
+			Expect(err).NotTo(HaveOccurred())
+
+			openaiclient, params := getOpenAIClientAndChatParams(client, model, userMessage, false)
+			params.ToolChoice = openai.ToolChoiceOptionFunctionToolChoice(openai.ChatCompletionNamedToolChoiceFunctionParam{
+				Name: specificTool,
+			})
+			params.Tools = tools
+
+			resp, err := openaiclient.Chat.Completions.New(ctx, params)
+			Expect(err).NotTo(HaveOccurred())
+			Expect(resp.Choices).ShouldNot(BeEmpty())
+			Expect(string(resp.Object)).To(Equal(chatCompletionObject))
+
+			Expect(resp.Usage.PromptTokens).To(Equal(userMsgTokens))
+			Expect(resp.Usage.CompletionTokens).To(BeNumerically(">", 0))
+			Expect(resp.Usage.TotalTokens).To(Equal(resp.Usage.PromptTokens + resp.Usage.CompletionTokens))
+
+			content := resp.Choices[0].Message.Content
+			Expect(content).Should(BeEmpty())
+
+			toolCalls := resp.Choices[0].Message.ToolCalls
+			Expect(toolCalls).ToNot(BeEmpty())
+			for _, tc := range toolCalls {
+				Expect(tc.Function.Name).To(Equal(specificTool))
+				Expect(tc.ID).NotTo(BeEmpty())
+				Expect(tc.Type).To(Equal("function"))
+				args := make(map[string]string)
+				err := json.Unmarshal([]byte(tc.Function.Arguments), &args)
+				Expect(err).NotTo(HaveOccurred())
+
+				if tc.Function.Name == "get_weather" {
+					Expect(tc.Function.Arguments).To(ContainSubstring("location"))
+				} else {
+					Expect(tc.Function.Arguments).To(ContainSubstring("city"))
+					Expect(tc.Function.Arguments).To(ContainSubstring("unit"))
+					Expect(args["unit"]).To(Or(Equal("C"), Equal("F")))
+				}
+			}
+		},
+		func(mode string, specificTool string) string {
+			return "mode: " + mode + ", specificTool: " + specificTool
+		},
+		// Each tool is listed twice: tool_choice pins the tool, but its arguments are chosen randomly
+		Entry(nil, common.ModeRandom, "get_weather"),
+		Entry(nil, common.ModeRandom, "get_temperature"),
+		Entry(nil, common.ModeRandom, "get_weather"),
+		Entry(nil, common.ModeRandom, "get_temperature"),
+	)
+
 	DescribeTable("check validator",
 		func(mode string) {
 			ctx := context.TODO()
diff --git a/pkg/llm-d-inference-sim/worker.go b/pkg/llm-d-inference-sim/worker.go
@@ -88,7 +88,7 @@ func (s *VllmSimulator) processRequest(reqCtx *openaiserverapi.CompletionReqCtx)
 	var toolCalls []openaiserverapi.ToolCall
 	var completionTokens int
 	if reqCtx.IsChatCompletion &&
-		req.GetToolChoice() != common.ToolChoiceNone &&
+		!common.IsToolChoiceNone(req.GetToolChoice()) &&
 		req.GetTools() != nil {
 		toolCalls, completionTokens, err =
 			common.CreateToolCalls(req.GetTools(), req.GetToolChoice(), s.config)
diff --git a/pkg/openai-server-api/request.go b/pkg/openai-server-api/request.go
@@ -46,10 +46,10 @@ type CompletionRequest interface {
 	SetNumberOfCachedPromptTokens(cachedPromptTokens int)
 	// GetPrompt returns the prompt
 	GetPrompt() string
-	// GetTools() returns tools to use (in chat completion)
+	// GetTools returns tools to use (in chat completion)
 	GetTools() []Tool
-	// GetToolChoice() returns tool choice (in chat completion)
-	GetToolChoice() string
+	// GetToolChoice returns tool choice (in chat completion)
+	GetToolChoice() ToolChoice
 	// GetMaxCompletionTokens returns the maximum completion tokens requested
 	GetMaxCompletionTokens() *int64
 	// GetIgnoreEOS returns true if the end-of-sequence tokens will be ignored
@@ -184,12 +184,13 @@ type ChatCompletionRequest struct {
 	// Tools is a list of tools the model may call.
 	Tools []Tool `json:"tools,omitempty"`
 
-	// ToolChoice controls which (if any) tool is called by the model,
-	// possible values: none, auto, required.
-	// Sending an object with a specific tool, is currently not supported.
-	ToolChoice string `json:"tool_choice,omitempty"`
+	// ToolChoice controls which (if any) tool is called by the model.
+	// It can be a string ("none", "auto", "required") or an object specifying the function.
+	ToolChoice ToolChoice `json:"tool_choice,omitzero"`
 }
 
+var _ CompletionRequest = (*ChatCompletionRequest)(nil)
+
 // function defines a tool
 type function struct {
 	// Name is the function's name
@@ -221,7 +222,7 @@ func (c *ChatCompletionRequest) GetTools() []Tool {
 	return c.Tools
 }
 
-func (c *ChatCompletionRequest) GetToolChoice() string {
+func (c *ChatCompletionRequest) GetToolChoice() ToolChoice {
 	return c.ToolChoice
 }
 
@@ -286,6 +287,8 @@ type TextCompletionRequest struct {
 	MaxTokens *int64 `json:"max_tokens"`
 }
 
+var _ CompletionRequest = (*TextCompletionRequest)(nil)
+
 func (t *TextCompletionRequest) GetPrompt() string {
 	return t.Prompt
 }
@@ -294,8 +297,8 @@ func (c *TextCompletionRequest) GetTools() []Tool {
 	return nil
 }
 
-func (c *TextCompletionRequest) GetToolChoice() string {
-	return ""
+func (c *TextCompletionRequest) GetToolChoice() ToolChoice {
+	return ToolChoice{}
 }
 
 func (c *TextCompletionRequest) GetMaxCompletionTokens() *int64 {
diff --git a/pkg/openai-server-api/tool_choice.go b/pkg/openai-server-api/tool_choice.go
@@ -0,0 +1,94 @@
+/*
+Copyright 2025 The llm-d-inference-sim Authors.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+*/
+
+// Contains structures and functions related to requests for all supported APIs
+package openaiserverapi
+
+import (
+	"encoding/json"
+	"fmt"
+
+	"github.com/openai/openai-go/v3"
+	"github.com/openai/openai-go/v3/packages/param"
+)
+
+// ToolChoice wraps openai.ChatCompletionToolChoiceOptionUnionParam so that the
+// tool_choice request field can carry its own JSON (un)marshalling methods;
+// the embedded union's fields are reachable directly on ToolChoice.
+type ToolChoice struct {
+	openai.ChatCompletionToolChoiceOptionUnionParam
+}
+
+// MarshalJSON serializes the tool choice by delegating to the MarshalJSON
+// method of the embedded ChatCompletionToolChoiceOptionUnionParam, so the
+// wrapper produces the same JSON as the union type itself.
+func (t ToolChoice) MarshalJSON() ([]byte, error) {
+	return t.ChatCompletionToolChoiceOptionUnionParam.MarshalJSON()
+}
+
+// UnmarshalJSON decodes a tool_choice value into the matching field of the
+// embedded union type. A JSON string ("auto", "none", "required") is stored
+// in OfAuto; a JSON object is dispatched on its 'type' discriminator field.
+// A JSON null (or empty input) is a no-op that leaves t unchanged.
+func (t *ToolChoice) UnmarshalJSON(data []byte) error {
+	// encoding/json hands a literal null to custom unmarshalers; treat it as
+	// "not present". The length check also guards the data[0] access below.
+	if len(data) == 0 || string(data) == "null" {
+		return nil
+	}
+
+	// A simple string (e.g., "auto", "none", "required") goes into OfAuto.
+	if data[0] == '"' {
+		var strValue string
+		if err := json.Unmarshal(data, &strValue); err != nil {
+			return err
+		}
+		t.OfAuto = param.NewOpt(strValue)
+		return nil
+	}
+
+	// Otherwise decode only the 'type' field first to pick the union variant.
+	var typeDetector struct {
+		Type string `json:"type"`
+	}
+	if err := json.Unmarshal(data, &typeDetector); err != nil {
+		return fmt.Errorf("failed to detect type for ToolChoice: %w", err)
+	}
+
+	switch typeDetector.Type {
+	case "function":
+		var functionChoice openai.ChatCompletionNamedToolChoiceParam
+		if err := functionChoice.UnmarshalJSON(data); err != nil {
+			return err
+		}
+		t.OfFunctionToolChoice = &functionChoice
+	case "custom":
+		var customChoice openai.ChatCompletionNamedToolChoiceCustomParam
+		if err := customChoice.UnmarshalJSON(data); err != nil {
+			return err
+		}
+		t.OfCustomToolChoice = &customChoice
+	case "allowed_tools":
+		var allowedToolsChoice openai.ChatCompletionAllowedToolChoiceParam
+		if err := allowedToolsChoice.UnmarshalJSON(data); err != nil {
+			return err
+		}
+		t.OfAllowedTools = &allowedToolsChoice
+	default:
+		return fmt.Errorf("unknown ToolChoice type: %s", typeDetector.Type)
+	}
+	return nil
+}