update

Xunzhuo · Xunzhuo · commit be45bc2be131 · 2025-11-15T15:13:16.000+08:00
Signed-off-by: bitliu <bitliu@tencent.com>
diff --git a/e2e/pkg/framework/runner.go b/e2e/pkg/framework/runner.go
@@ -209,19 +209,29 @@ func (r *Runner) buildAndLoadImages(ctx context.Context) error {
 func (r *Runner) runTests(ctx context.Context, kubeClient *kubernetes.Clientset) ([]TestResult, error) {
 	r.log("Running tests")
 
+	// Debug: List all registered test cases
+	if r.opts.Verbose {
+		r.log("All registered test cases:")
+		for _, tc := range testcases.List() {
+			r.log("  - %s: %s", tc.Name, tc.Description)
+		}
+	}
+
 	// Get test cases to run
 	var testCasesToRun []testcases.TestCase
 	var err error
 
 	if len(r.opts.TestCases) > 0 {
 		// Run specific test cases
+		r.log("Requested test cases: %v", r.opts.TestCases)
 		testCasesToRun, err = testcases.ListByNames(r.opts.TestCases...)
 		if err != nil {
 			return nil, err
 		}
 	} else {
 		// Run all test cases for the profile
 		profileTestCases := r.profile.GetTestCases()
+		r.log("Profile test cases: %v", profileTestCases)
 		testCasesToRun, err = testcases.ListByNames(profileTestCases...)
 		if err != nil {
 			return nil, err
diff --git a/e2e/pkg/testcases/registry.go b/e2e/pkg/testcases/registry.go
@@ -105,28 +105,6 @@ func List() []TestCase {
 	return cases
 }
 
-// ListByTags returns test cases matching any of the given tags
-func ListByTags(tags ...string) []TestCase {
-	mu.RLock()
-	defer mu.RUnlock()
-
-	tagSet := make(map[string]bool)
-	for _, tag := range tags {
-		tagSet[tag] = true
-	}
-
-	cases := make([]TestCase, 0)
-	for _, tc := range registry {
-		for _, tag := range tc.Tags {
-			if tagSet[tag] {
-				cases = append(cases, tc)
-				break
-			}
-		}
-	}
-	return cases
-}
-
 // ListByNames returns test cases matching the given names
 func ListByNames(names ...string) ([]TestCase, error) {
 	mu.RLock()
diff --git a/e2e/profiles/ai-gateway/profile.go b/e2e/profiles/ai-gateway/profile.go
@@ -108,8 +108,9 @@ func (p *Profile) Teardown(ctx context.Context, opts *framework.TeardownOptions)
 func (p *Profile) GetTestCases() []string {
 	return []string{
 		"chat-completions-request",
+		"chat-completions-stress-request",
 		"domain-classify",
-		"cache",
+		"semantic-cache",
 		"pii-detection",
 		"jailbreak-detection",
 	}
@@ -154,7 +155,7 @@ func (p *Profile) deploySemanticRouter(ctx context.Context, deployer *helm.Deplo
 	return deployer.WaitForDeployment(ctx, "vllm-semantic-router-system", "semantic-router", 10*time.Minute)
 }
 
-func (p *Profile) deployEnvoyGateway(ctx context.Context, deployer *helm.Deployer, opts *framework.SetupOptions) error {
+func (p *Profile) deployEnvoyGateway(ctx context.Context, deployer *helm.Deployer, _ *framework.SetupOptions) error {
 	installOpts := helm.InstallOptions{
 		ReleaseName: "eg",
 		Chart:       "oci://docker.io/envoyproxy/gateway-helm",
@@ -172,7 +173,7 @@ func (p *Profile) deployEnvoyGateway(ctx context.Context, deployer *helm.Deploye
 	return deployer.WaitForDeployment(ctx, "envoy-gateway-system", "envoy-gateway", 5*time.Minute)
 }
 
-func (p *Profile) deployEnvoyAIGateway(ctx context.Context, deployer *helm.Deployer, opts *framework.SetupOptions) error {
+func (p *Profile) deployEnvoyAIGateway(ctx context.Context, deployer *helm.Deployer, _ *framework.SetupOptions) error {
 	// Install AI Gateway CRDs
 	crdOpts := helm.InstallOptions{
 		ReleaseName: "aieg-crd",
diff --git a/e2e/testcases/cache.go b/e2e/testcases/cache.go
@@ -16,9 +16,9 @@ import (
 )
 
 func init() {
-	pkgtestcases.Register("cache", pkgtestcases.TestCase{
+	pkgtestcases.Register("semantic-cache", pkgtestcases.TestCase{
 		Description: "Test semantic cache hit rate with similar questions",
-		Tags:        []string{"ai-gateway", "cache", "performance"},
+		Tags:        []string{"ai-gateway", "semantic-cache", "performance"},
 		Fn:          testCache,
 	})
 }
@@ -169,8 +169,6 @@ func sendChatRequest(ctx context.Context, question, localPort string, verbose bo
 		"messages": []map[string]string{
 			{"role": "user", "content": question},
 		},
-		"max_tokens": 100,
-		"stream":     false,
 	}
 
 	jsonData, err := json.Marshal(requestBody)
diff --git a/e2e/testcases/chat_completions_request.go b/e2e/testcases/chat_completions_request.go
@@ -9,13 +9,12 @@ import (
 	"net/http"
 	"time"
 
-	"github.com/vllm-project/semantic-router/e2e/pkg/testcases"
 	pkgtestcases "github.com/vllm-project/semantic-router/e2e/pkg/testcases"
 	"k8s.io/client-go/kubernetes"
 )
 
 func init() {
-	testcases.Register("chat-completions-request", testcases.TestCase{
+	pkgtestcases.Register("chat-completions-request", pkgtestcases.TestCase{
 		Description: "Send a chat completions request and verify 200 OK response",
 		Tags:        []string{"llm", "functional"},
 		Fn:          testChatCompletionsRequest,
diff --git a/e2e/testcases/stress_test.go b/e2e/testcases/stress_test.go
@@ -0,0 +1,194 @@
+package testcases
+
+import (
+	"bytes"
+	"context"
+	"encoding/json"
+	"fmt"
+	"io"
+	"net/http"
+	"strings"
+	"time"
+
+	pkgtestcases "github.com/vllm-project/semantic-router/e2e/pkg/testcases"
+	"k8s.io/client-go/kubernetes"
+)
+
+// init registers the sequential stress test with the test-case registry under
+// the name "chat-completions-stress-request".
+//
+// NOTE(review): this diff adds the file as stress_test.go. The go tool only
+// compiles files whose names end in _test.go when running `go test`, so this
+// registration will not execute in a regular build of the package — confirm
+// that the file name is intended.
+func init() {
+	stressCase := pkgtestcases.TestCase{
+		Description: "Send 1000 sequential requests and measure success rate",
+		Tags:        []string{"llm", "stress", "reliability"},
+		Fn:          testStressTest,
+	}
+	pkgtestcases.Register("chat-completions-stress-request", stressCase)
+}
+
+// StressTestResult tracks the result of a single request sent by
+// sendSingleRequest.
+type StressTestResult struct {
+	// RequestID is the identifier the caller passed in; testStressTest uses
+	// the 1-based loop counter.
+	RequestID    int
+	// Success is true only when the response status was 200 OK and the body
+	// was read without error.
+	Success      bool
+	// StatusCode is the HTTP status of the response. It stays 0 when no
+	// response was obtained (marshal, request creation or send failure).
+	StatusCode   int
+	// Duration is the time elapsed between the start of sendSingleRequest and
+	// the point at which the outcome was decided.
+	Duration     time.Duration
+	// ErrorMessage describes why the request failed; it is empty on success.
+	ErrorMessage string
+}
+
+// testStressTest sends totalRequests chat-completion requests one after
+// another through the connection set up by setupServiceConnection and reports
+// the observed success rate.
+//
+// Parameters:
+//   - ctx: bounds the whole run; the loop stops as soon as ctx is done.
+//   - client: Kubernetes clientset handed to setupServiceConnection.
+//   - opts: test options; Verbose enables progress output and SetDetails, when
+//     non-nil, receives the aggregated statistics.
+//
+// It returns an error when the service connection cannot be set up or when
+// ctx is cancelled before all requests were sent. Individual request failures
+// are only counted and reported; they do not fail the test.
+//
+// NOTE(review): a run with a 0% success rate still returns nil — confirm
+// whether a minimum success threshold should be enforced.
+func testStressTest(ctx context.Context, client *kubernetes.Clientset, opts pkgtestcases.TestCaseOptions) error {
+	if opts.Verbose {
+		fmt.Println("[Test] Starting stress test: 1000 sequential requests")
+	}
+
+	// Setup service connection and get local port
+	localPort, stopPortForward, err := setupServiceConnection(ctx, client, opts)
+	if err != nil {
+		return err
+	}
+	defer stopPortForward() // Ensure port forwarding is stopped when test completes
+
+	const totalRequests = 1000
+	// The final length is known up front, so allocate the backing array once.
+	results := make([]StressTestResult, 0, totalRequests)
+	successCount := 0
+	totalDuration := time.Duration(0)
+
+	// Send the requests sequentially
+	for i := 1; i <= totalRequests; i++ {
+		// Once the context is done every further request would fail
+		// immediately and distort the statistics, so stop and surface the
+		// cancellation to the caller instead.
+		if err := ctx.Err(); err != nil {
+			return fmt.Errorf("stress test interrupted after %d/%d requests: %w", i-1, totalRequests, err)
+		}
+
+		result := sendSingleRequest(ctx, i, localPort, opts.Verbose)
+		results = append(results, result)
+
+		if result.Success {
+			successCount++
+		}
+		totalDuration += result.Duration
+
+		// Print progress every 100 requests
+		if opts.Verbose && i%100 == 0 {
+			currentSuccessRate := float64(successCount) / float64(i) * 100
+			fmt.Printf("[Test] Progress: %d/%d requests completed (%.2f%% success rate)\n",
+				i, totalRequests, currentSuccessRate)
+		}
+	}
+
+	// Calculate statistics
+	successRate := float64(successCount) / float64(totalRequests) * 100
+	failureCount := totalRequests - successCount
+	avgDuration := totalDuration / time.Duration(totalRequests)
+
+	// Set details for reporting
+	if opts.SetDetails != nil {
+		opts.SetDetails(map[string]interface{}{
+			"total_requests":  totalRequests,
+			"successful":      successCount,
+			"failed":          failureCount,
+			"success_rate":    fmt.Sprintf("%.2f%%", successRate),
+			"avg_duration_ms": avgDuration.Milliseconds(),
+		})
+	}
+
+	// Print summary (always, independent of opts.Verbose)
+	printStressTestResults(results, totalRequests, successCount, successRate, avgDuration)
+
+	if opts.Verbose {
+		fmt.Printf("[Test] Stress test completed: %d/%d successful (%.2f%% success rate)\n",
+			successCount, totalRequests, successRate)
+	}
+
+	return nil
+}
+
+// sendSingleRequest posts one chat-completion request to the given local port
+// and returns the outcome as a StressTestResult.
+//
+// The request counts as successful only when the response status is 200 OK
+// and the body was read without error. Duration covers everything from
+// building the payload up to reading the response body (or up to the point of
+// failure). The verbose parameter is currently unused.
+func sendSingleRequest(ctx context.Context, requestID int, localPort string, verbose bool) StressTestResult {
+	outcome := StressTestResult{RequestID: requestID}
+	began := time.Now()
+
+	// fail records the error text and the elapsed time, then hands back the
+	// outcome so every error path can return in a single statement.
+	fail := func(msg string) StressTestResult {
+		outcome.ErrorMessage = msg
+		outcome.Duration = time.Since(began)
+		return outcome
+	}
+
+	// Build the JSON payload: a single user message addressed to model "MoM".
+	userMessage := map[string]string{
+		"role":    "user",
+		"content": fmt.Sprintf("Request #%d: What is 2+2?", requestID),
+	}
+	payload, err := json.Marshal(map[string]interface{}{
+		"model":    "MoM",
+		"messages": []map[string]string{userMessage},
+	})
+	if err != nil {
+		return fail(fmt.Sprintf("marshal error: %v", err))
+	}
+
+	endpoint := fmt.Sprintf("http://localhost:%s/v1/chat/completions", localPort)
+	req, err := http.NewRequestWithContext(ctx, http.MethodPost, endpoint, bytes.NewBuffer(payload))
+	if err != nil {
+		return fail(fmt.Sprintf("create request error: %v", err))
+	}
+	req.Header.Set("Content-Type", "application/json")
+
+	httpClient := &http.Client{Timeout: 30 * time.Second}
+	resp, err := httpClient.Do(req)
+	if err != nil {
+		return fail(fmt.Sprintf("send request error: %v", err))
+	}
+	defer resp.Body.Close()
+
+	// From here on a response exists, so its status is part of every outcome.
+	outcome.StatusCode = resp.StatusCode
+
+	body, err := io.ReadAll(resp.Body)
+	if err != nil {
+		return fail(fmt.Sprintf("read response error: %v", err))
+	}
+	outcome.Duration = time.Since(began)
+
+	if resp.StatusCode != http.StatusOK {
+		outcome.ErrorMessage = fmt.Sprintf("status %d: %s", resp.StatusCode, string(body))
+		return outcome
+	}
+
+	outcome.Success = true
+	return outcome
+}
+
+func printStressTestResults(results []StressTestResult, totalRequests, successCount int, successRate float64, avgDuration time.Duration) {
+	separator := strings.Repeat("=", 80)
+	fmt.Println("\n" + separator)
+	fmt.Println("Stress Test Results")
+	fmt.Println(separator)
+	fmt.Printf("Total Requests:    %d\n", totalRequests)
+	fmt.Printf("Successful:        %d\n", successCount)
+	fmt.Printf("Failed:            %d\n", totalRequests-successCount)
+	fmt.Printf("Success Rate:      %.2f%%\n", successRate)
+	fmt.Printf("Average Duration:  %v\n", avgDuration)
+	fmt.Println(separator)
+
+	// Show first 10 failures if any
+	failureCount := 0
+	fmt.Println("\nFirst 10 Failures (if any):")
+	for _, result := range results {
+		if !result.Success && failureCount < 10 {
+			failureCount++
+			fmt.Printf("  Request #%d: %s (duration: %v)\n",
+				result.RequestID, result.ErrorMessage, result.Duration)
+		}
+		if failureCount >= 10 {
+			break
+		}
+	}
+
+	if failureCount == 0 {
+		fmt.Println("  No failures! 🎉")
+	}
+	fmt.Println()
+}

Original file line number	Diff line number	Diff line change
`@@ -16,9 +16,9 @@ import (`
`16`	`16`	`)`
`17`	`17`
`18`	`18`	`func init() {`
`19`		`- pkgtestcases.Register("cache", pkgtestcases.TestCase{`
	`19`	`+ pkgtestcases.Register("semantic-cache", pkgtestcases.TestCase{`
`20`	`20`	`Description: "Test semantic cache hit rate with similar questions",`
`21`		`- Tags: []string{"ai-gateway", "cache", "performance"},`
	`21`	`+ Tags: []string{"ai-gateway", "semantic-cache", "performance"},`
`22`	`22`	`Fn: testCache,`
`23`	`23`	`})`
`24`	`24`	`}`
`@@ -169,8 +169,6 @@ func sendChatRequest(ctx context.Context, question, localPort string, verbose bo`
`169`	`169`	`"messages": []map[string]string{`
`170`	`170`	`{"role": "user", "content": question},`
`171`	`171`	`},`
`172`		`- "max_tokens": 100,`
`173`		`- "stream": false,`
`174`	`172`	`}`
`175`	`173`
`176`	`174`	`jsonData, err := json.Marshal(requestBody)`