- rename LLMRequestData to LLMRequestBody

vMaroon · vMaroon · commit 2f8d62789478 · 2025-09-11T23:15:43.000+03:00
- rename LLMRequest.Data to LLMRequest.Body
- test refactoring after rebase

Signed-off-by: Maroon Ayoub <maroon.ayoub@ibm.com>
diff --git a/pkg/epp/requestcontrol/director.go b/pkg/epp/requestcontrol/director.go
@@ -103,7 +103,7 @@ func (d *Director) HandleRequest(ctx context.Context, reqCtx *handlers.RequestCo
 	}
 	reqCtx.Request.Body["model"] = reqCtx.TargetModelName
 
-	requestData, err := requtil.ExtractRequestData(reqCtx.Request.Body)
+	requestBody, err := requtil.ExtractRequestBody(reqCtx.Request.Body)
 	if err != nil {
 		return reqCtx, errutil.Error{Code: errutil.BadRequest, Msg: fmt.Errorf("failed to extract request data: %w", err).Error()}
 	}
@@ -125,7 +125,7 @@ func (d *Director) HandleRequest(ctx context.Context, reqCtx *handlers.RequestCo
 	reqCtx.SchedulingRequest = &schedulingtypes.LLMRequest{
 		RequestId:   reqCtx.Request.Headers[requtil.RequestIdHeaderKey],
 		TargetModel: reqCtx.TargetModelName,
-		Data:        requestData,
+		Body:        requestBody,
 		Headers:     reqCtx.Request.Headers,
 	}
 
diff --git a/pkg/epp/scheduling/framework/plugins/multi/prefix/plugin.go b/pkg/epp/scheduling/framework/plugins/multi/prefix/plugin.go
@@ -261,7 +261,7 @@ func (p *Plugin) matchLongestPrefix(ctx context.Context, hashes []BlockHash) map
 // For block i, hash(i) = hash(block i content, hash(i-1)).
 func hashPrompt(ctx context.Context, request *types.LLMRequest, cacheBlockSize int, maxPrefixBlocks int) []BlockHash {
 	loggerDebug := log.FromContext(ctx).V(logutil.DEBUG)
-	if request == nil || request.Data == nil {
+	if request == nil || request.Body == nil {
 		loggerDebug.Info("Request or request data is nil, skipping hashing")
 		return nil
 	}
@@ -305,10 +305,10 @@ func toBytes(i BlockHash) []byte {
 }
 
 func getUserInputBytes(request *types.LLMRequest) ([]byte, error) {
-	if request.Data.Completions != nil { // assumed to be valid if not nil
-		return []byte(request.Data.Completions.Prompt), nil
+	if request.Body.Completions != nil { // assumed to be valid if not nil
+		return []byte(request.Body.Completions.Prompt), nil
 	}
 
 	// must be chat-completions request at this point, return bytes of entire messages
-	return json.Marshal(request.Data.ChatCompletions.Messages)
+	return json.Marshal(request.Body.ChatCompletions.Messages)
 }
diff --git a/pkg/epp/scheduling/framework/plugins/multi/prefix/plugin_test.go b/pkg/epp/scheduling/framework/plugins/multi/prefix/plugin_test.go
@@ -49,7 +49,7 @@ func TestPrefixPluginCompletion(t *testing.T) {
 	req1 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			Completions: &types.CompletionsRequest{
 				Prompt: "aaaaaa",
 			},
@@ -81,7 +81,7 @@ func TestPrefixPluginCompletion(t *testing.T) {
 	req2 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model2",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			Completions: &types.CompletionsRequest{
 				Prompt: "bbbbbb",
 			},
@@ -112,7 +112,7 @@ func TestPrefixPluginCompletion(t *testing.T) {
 	req3 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			Completions: &types.CompletionsRequest{
 				Prompt: "aaaabbbb",
 			},
@@ -142,7 +142,7 @@ func TestPrefixPluginCompletion(t *testing.T) {
 	req4 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model-new",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			Completions: &types.CompletionsRequest{
 				Prompt: "aaaabbbb",
 			},
@@ -172,7 +172,7 @@ func TestPrefixPluginCompletion(t *testing.T) {
 	req5 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			Completions: &types.CompletionsRequest{
 				Prompt: "aaaabbbbcccc",
 			},
@@ -214,7 +214,7 @@ func TestPrefixPluginChatCompletions(t *testing.T) {
 	req1 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			ChatCompletions: &types.ChatCompletionsRequest{
 				Messages: []types.Message{
 					{Role: "user", Content: "hello world"},
@@ -223,8 +223,8 @@ func TestPrefixPluginChatCompletions(t *testing.T) {
 			},
 		},
 	}
-	scores := plugin.Score(context.Background(), nil, req1, pods)
-	state, err := plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req1.RequestId, PrefixCachePluginType)
+	scores := plugin.Score(context.Background(), types.NewCycleState(), req1, pods)
+	state, err := plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req1.RequestId, plugins.StateKey(plugin.TypedName().String()))
 	assert.NoError(t, err)
 	t.Logf("Chat completions - Hashes %+v, cached servers: %+v", state.PrefixHashes, state.PrefixCacheServers)
 	// Should have some hashes for the JSON-encoded messages
@@ -249,7 +249,7 @@ func TestPrefixPluginChatCompletionsGrowth(t *testing.T) {
 	req1 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			ChatCompletions: &types.ChatCompletionsRequest{
 				Messages: []types.Message{
 					{Role: "system", Content: "You are a helpful assistant"},
@@ -258,8 +258,8 @@ func TestPrefixPluginChatCompletionsGrowth(t *testing.T) {
 			},
 		},
 	}
-	scores := plugin.Score(context.Background(), nil, req1, pods)
-	state, err := plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req1.RequestId, PrefixCachePluginType)
+	scores := plugin.Score(context.Background(), types.NewCycleState(), req1, pods)
+	state, err := plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req1.RequestId, plugins.StateKey(plugin.TypedName().String()))
 	assert.NoError(t, err)
 	t.Logf("Initial conversation - Hashes %+v, cached servers: %+v", len(state.PrefixHashes), state.PrefixCacheServers)
 	initialHashCount := len(state.PrefixHashes)
@@ -281,7 +281,7 @@ func TestPrefixPluginChatCompletionsGrowth(t *testing.T) {
 	req2 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			ChatCompletions: &types.ChatCompletionsRequest{
 				Messages: []types.Message{
 					{Role: "system", Content: "You are a helpful assistant"},
@@ -292,8 +292,8 @@ func TestPrefixPluginChatCompletionsGrowth(t *testing.T) {
 			},
 		},
 	}
-	scores = plugin.Score(context.Background(), nil, req2, pods)
-	state, err = plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req2.RequestId, PrefixCachePluginType)
+	scores = plugin.Score(context.Background(), types.NewCycleState(), req2, pods)
+	state, err = plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req2.RequestId, plugins.StateKey(plugin.TypedName().String()))
 	assert.NoError(t, err)
 	t.Logf("Extended conversation - Hashes %+v, cached servers: %+v", len(state.PrefixHashes), state.PrefixCacheServers)
 	extendedHashCount := len(state.PrefixHashes)
@@ -313,7 +313,7 @@ func TestPrefixPluginChatCompletionsGrowth(t *testing.T) {
 	req3 := &types.LLMRequest{
 		RequestId:   uuid.NewString(),
 		TargetModel: "test-model1",
-		Data: &types.LLMRequestData{
+		Body: &types.LLMRequestBody{
 			ChatCompletions: &types.ChatCompletionsRequest{
 				Messages: []types.Message{
 					{Role: "system", Content: "You are a helpful assistant"},
@@ -326,8 +326,8 @@ func TestPrefixPluginChatCompletionsGrowth(t *testing.T) {
 			},
 		},
 	}
-	scores = plugin.Score(context.Background(), nil, req3, pods)
-	state, err = plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req3.RequestId, PrefixCachePluginType)
+	scores = plugin.Score(context.Background(), types.NewCycleState(), req3, pods)
+	state, err = plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req3.RequestId, plugins.StateKey(plugin.TypedName().String()))
 	assert.NoError(t, err)
 	t.Logf("Long conversation - Hashes %+v, cached servers: %+v", len(state.PrefixHashes), state.PrefixCacheServers)
 	longHashCount := len(state.PrefixHashes)
@@ -375,7 +375,7 @@ func BenchmarkPrefixPluginStress(b *testing.B) {
 		req := &types.LLMRequest{
 			RequestId:   uuid.NewString(),
 			TargetModel: "model-stress",
-			Data: &types.LLMRequestData{
+			Body: &types.LLMRequestBody{
 				Completions: &types.CompletionsRequest{
 					Prompt: prompt,
 				},
@@ -396,7 +396,7 @@ func BenchmarkPrefixPluginStress(b *testing.B) {
 		// Second cycle: validate internal state
 		state, err := plugins.ReadPluginStateKey[*SchedulingContextState](plugin.pluginState, req.RequestId, plugins.StateKey(plugin.TypedName().String()))
 		assert.NoError(b, err)
-		expectedHashes := int(math.Min(float64(maxPrefixBlocks), float64(len(req.Data.Completions.Prompt)/blockSize)))
+		expectedHashes := int(math.Min(float64(maxPrefixBlocks), float64(len(req.Body.Completions.Prompt)/blockSize)))
 		assert.Equal(b, expectedHashes, len(state.PrefixHashes), "number of hashes is incorrect")
 	}
 }
@@ -464,7 +464,7 @@ func BenchmarkPrefixPluginChatCompletionsStress(b *testing.B) {
 			req := &types.LLMRequest{
 				RequestId:   uuid.NewString(),
 				TargetModel: "chat-model-stress",
-				Data: &types.LLMRequestData{
+				Body: &types.LLMRequestBody{
 					ChatCompletions: &types.ChatCompletionsRequest{
 						Messages: messages,
 					},
diff --git a/pkg/epp/scheduling/types/types.go b/pkg/epp/scheduling/types/types.go
@@ -32,7 +32,7 @@ type LLMRequest struct {
 	// TargetModel is the final target model after traffic split.
 	TargetModel string
 	// Data contains the request-body fields that we parse out as user input.
-	Data *LLMRequestData
+	Body *LLMRequestBody
 	// Headers is a map of the request headers.
 	Headers map[string]string
 }
@@ -42,14 +42,14 @@ func (r *LLMRequest) String() string {
 		return nilString
 	}
 
-	return fmt.Sprintf("RequestID: %s, TargetModel: %s, RequestData: %s, Headers: %v",
-		r.RequestId, r.TargetModel, r.Data, r.Headers)
+	return fmt.Sprintf("RequestID: %s, TargetModel: %s, Body: %s, Headers: %v",
+		r.RequestId, r.TargetModel, r.Body, r.Headers)
 }
 
-// LLMRequestData contains the request-body fields that we parse out as user input,
+// LLMRequestBody contains the request-body fields that we parse out as user input,
 // to be used in forming scheduling decisions.
-// An LLMRequestData must contain exactly one of CompletionsRequest or ChatCompletionsRequest.
-type LLMRequestData struct {
+// An LLMRequestBody must contain exactly one of CompletionsRequest or ChatCompletionsRequest.
+type LLMRequestBody struct {
 	// CompletionsRequest is the representation of the OpenAI /v1/completions request body.
 	Completions *CompletionsRequest `json:"completions,omitempty"`
 	// ChatCompletionsRequest is the representation of the OpenAI /v1/chat_completions request body.
diff --git a/pkg/epp/util/request/body.go b/pkg/epp/util/request/body.go
@@ -23,18 +23,18 @@ import (
 	errutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/error"
 )
 
-// ExtractRequestData extracts the LLMRequestData from the given request body map.
-func ExtractRequestData(body map[string]any) (*types.LLMRequestData, error) {
+// ExtractRequestBody extracts the LLMRequestBody from the given request body map.
+func ExtractRequestBody(rawBody map[string]any) (*types.LLMRequestBody, error) {
 	// Convert map back to JSON bytes
-	jsonBytes, err := json.Marshal(body)
+	jsonBytes, err := json.Marshal(rawBody)
 	if err != nil {
 		return nil, errutil.Error{Code: errutil.BadRequest, Msg: "invalid request body"}
 	}
 
 	// Try completions request first
 	var completions types.CompletionsRequest
 	if err = json.Unmarshal(jsonBytes, &completions); err == nil && completions.Prompt != "" {
-		return &types.LLMRequestData{Completions: &completions}, nil
+		return &types.LLMRequestBody{Completions: &completions}, nil
 	}
 
 	// Try chat completions
@@ -47,7 +47,7 @@ func ExtractRequestData(body map[string]any) (*types.LLMRequestData, error) {
 		return nil, errutil.Error{Code: errutil.BadRequest, Msg: "invalid chat-completions request: " + err.Error()}
 	}
 
-	return &types.LLMRequestData{ChatCompletions: &chatCompletions}, nil
+	return &types.LLMRequestBody{ChatCompletions: &chatCompletions}, nil
 }
 
 func validateChatCompletionsMessages(messages []types.Message) error {
diff --git a/pkg/epp/util/request/body_test.go b/pkg/epp/util/request/body_test.go
@@ -27,7 +27,7 @@ func TestExtractRequestData(t *testing.T) {
 	tests := []struct {
 		name    string
 		body    map[string]any
-		want    *types.LLMRequestData
+		want    *types.LLMRequestBody
 		wantErr bool
 	}{
 		{
@@ -36,7 +36,7 @@ func TestExtractRequestData(t *testing.T) {
 				"model":  "test",
 				"prompt": "test prompt",
 			},
-			want: &types.LLMRequestData{
+			want: &types.LLMRequestBody{
 				Completions: &types.CompletionsRequest{
 					Prompt: "test prompt",
 				},
@@ -55,7 +55,7 @@ func TestExtractRequestData(t *testing.T) {
 					},
 				},
 			},
-			want: &types.LLMRequestData{
+			want: &types.LLMRequestBody{
 				ChatCompletions: &types.ChatCompletionsRequest{
 					Messages: []types.Message{
 						{Role: "system", Content: "this is a system message"},
@@ -79,7 +79,7 @@ func TestExtractRequestData(t *testing.T) {
 				"add_generation_prompt":        true,
 				"chat_template_kwargs":         map[string]any{"key": "value"},
 			},
-			want: &types.LLMRequestData{
+			want: &types.LLMRequestBody{
 				ChatCompletions: &types.ChatCompletionsRequest{
 					Messages:                  []types.Message{{Role: "user", Content: "hello"}},
 					Tools:                     []any{map[string]any{"type": "function"}},
@@ -229,17 +229,17 @@ func TestExtractRequestData(t *testing.T) {
 
 	for _, tt := range tests {
 		t.Run(tt.name, func(t *testing.T) {
-			got, err := ExtractRequestData(tt.body)
+			got, err := ExtractRequestBody(tt.body)
 			if (err != nil) != tt.wantErr {
-				t.Errorf("ExtractRequestData() error = %v, wantErr %v", err, tt.wantErr)
+				t.Errorf("ExtractRequestBody() error = %v, wantErr %v", err, tt.wantErr)
 				return
 			}
 			if tt.wantErr {
 				return
 			}
 
 			if diff := cmp.Diff(tt.want, got); diff != "" {
-				t.Errorf("ExtractRequestData() mismatch (-want +got):\n%s", diff)
+				t.Errorf("ExtractRequestBody() mismatch (-want +got):\n%s", diff)
 			}
 		})
 	}
@@ -254,7 +254,7 @@ func BenchmarkExtractRequestData_Completions(b *testing.B) {
 
 	b.ResetTimer()
 	for i := 0; i < b.N; i++ {
-		_, err := ExtractRequestData(body)
+		_, err := ExtractRequestBody(body)
 		if err != nil {
 			b.Fatal(err)
 		}
@@ -271,7 +271,7 @@ func BenchmarkExtractRequestData_ChatCompletions(b *testing.B) {
 
 	b.ResetTimer()
 	for i := 0; i < b.N; i++ {
-		_, err := ExtractRequestData(body)
+		_, err := ExtractRequestBody(body)
 		if err != nil {
 			b.Fatal(err)
 		}
@@ -295,7 +295,7 @@ func BenchmarkExtractRequestData_ChatCompletionsWithOptionals(b *testing.B) {
 
 	b.ResetTimer()
 	for i := 0; i < b.N; i++ {
-		_, err := ExtractRequestData(body)
+		_, err := ExtractRequestBody(body)
 		if err != nil {
 			b.Fatal(err)
 		}

Original file line number	Diff line number	Diff line change
`@@ -103,7 +103,7 @@ func (d *Director) HandleRequest(ctx context.Context, reqCtx *handlers.RequestCo`
`103`	`103`	`}`
`104`	`104`	`reqCtx.Request.Body["model"] = reqCtx.TargetModelName`
`105`	`105`
`106`		`- requestData, err := requtil.ExtractRequestData(reqCtx.Request.Body)`
	`106`	`+ requestBody, err := requtil.ExtractRequestBody(reqCtx.Request.Body)`
`107`	`107`	`if err != nil {`
`108`	`108`	`return reqCtx, errutil.Error{Code: errutil.BadRequest, Msg: fmt.Errorf("failed to extract request data: %w", err).Error()}`
`109`	`109`	`}`
`@@ -125,7 +125,7 @@ func (d *Director) HandleRequest(ctx context.Context, reqCtx *handlers.RequestCo`
`125`	`125`	`reqCtx.SchedulingRequest = &schedulingtypes.LLMRequest{`
`126`	`126`	`RequestId: reqCtx.Request.Headers[requtil.RequestIdHeaderKey],`
`127`	`127`	`TargetModel: reqCtx.TargetModelName,`
`128`		`- Data: requestData,`
	`128`	`+ Body: requestBody,`
`129`	`129`	`Headers: reqCtx.Request.Headers,`
`130`	`130`	`}`
`131`	`131`
Original file line number	Diff line number	Diff line change
`@@ -261,7 +261,7 @@ func (p *Plugin) matchLongestPrefix(ctx context.Context, hashes []BlockHash) map`
`261`	`261`	`// For block i, hash(i) = hash(block i content, hash(i-1)).`
`262`	`262`	`func hashPrompt(ctx context.Context, request *types.LLMRequest, cacheBlockSize int, maxPrefixBlocks int) []BlockHash {`
`263`	`263`	`loggerDebug := log.FromContext(ctx).V(logutil.DEBUG)`
`264`		`- if request == nil \|\| request.Data == nil {`
	`264`	`+ if request == nil \|\| request.Body == nil {`
`265`	`265`	`loggerDebug.Info("Request or request data is nil, skipping hashing")`
`266`	`266`	`return nil`
`267`	`267`	`}`
`@@ -305,10 +305,10 @@ func toBytes(i BlockHash) []byte {`
`305`	`305`	`}`
`306`	`306`
`307`	`307`	`func getUserInputBytes(request *types.LLMRequest) ([]byte, error) {`
`308`		`- if request.Data.Completions != nil { // assumed to be valid if not nil`
`309`		`- return []byte(request.Data.Completions.Prompt), nil`
	`308`	`+ if request.Body.Completions != nil { // assumed to be valid if not nil`
	`309`	`+ return []byte(request.Body.Completions.Prompt), nil`
`310`	`310`	`}`
`311`	`311`
`312`	`312`	`// must be chat-completions request at this point, return bytes of entire messages`
`313`		`- return json.Marshal(request.Data.ChatCompletions.Messages)`
	`313`	`+ return json.Marshal(request.Body.ChatCompletions.Messages)`
`314`	`314`	`}`
Original file line number	Diff line number	Diff line change
`@@ -23,18 +23,18 @@ import (`
`23`	`23`	`errutil "sigs.k8s.io/gateway-api-inference-extension/pkg/epp/util/error"`
`24`	`24`	`)`
`25`	`25`
`26`		`-// ExtractRequestData extracts the LLMRequestData from the given request body map.`
`27`		`-func ExtractRequestData(body map[string]any) (*types.LLMRequestData, error) {`
	`26`	`+// ExtractRequestBody extracts the LLMRequestBody from the given request body map.`
	`27`	`+func ExtractRequestBody(rawBody map[string]any) (*types.LLMRequestBody, error) {`
`28`	`28`	`// Convert map back to JSON bytes`
`29`		`- jsonBytes, err := json.Marshal(body)`
	`29`	`+ jsonBytes, err := json.Marshal(rawBody)`
`30`	`30`	`if err != nil {`
`31`	`31`	`return nil, errutil.Error{Code: errutil.BadRequest, Msg: "invalid request body"}`
`32`	`32`	`}`
`33`	`33`
`34`	`34`	`// Try completions request first`
`35`	`35`	`var completions types.CompletionsRequest`
`36`	`36`	`if err = json.Unmarshal(jsonBytes, &completions); err == nil && completions.Prompt != "" {`
`37`		`- return &types.LLMRequestData{Completions: &completions}, nil`
	`37`	`+ return &types.LLMRequestBody{Completions: &completions}, nil`
`38`	`38`	`}`
`39`	`39`
`40`	`40`	`// Try chat completions`
`@@ -47,7 +47,7 @@ func ExtractRequestData(body map[string]any) (*types.LLMRequestData, error) {`
`47`	`47`	`return nil, errutil.Error{Code: errutil.BadRequest, Msg: "invalid chat-completions request: " + err.Error()}`
`48`	`48`	`}`
`49`	`49`
`50`		`- return &types.LLMRequestData{ChatCompletions: &chatCompletions}, nil`
	`50`	`+ return &types.LLMRequestBody{ChatCompletions: &chatCompletions}, nil`
`51`	`51`	`}`
`52`	`52`
`53`	`53`	`func validateChatCompletionsMessages(messages []types.Message) error {`