fuzzystrmatch: fix out of bounds in LevenshteinLessEqual

rafiss · rafiss · commit 188150c3f1e0 · 2025-08-25T14:48:42.000-04:00
This fixes an out-of-bounds bug that was added when this function was introduced in 7a538b3: stopColumn is now clamped so that it is never negative. No release note is needed since this bug was never released. Release note: None
diff --git a/pkg/util/fuzzystrmatch/leven.go b/pkg/util/fuzzystrmatch/leven.go
@@ -123,6 +123,9 @@ func LevenshteinLessEqualDistanceWithCost(
 				bestColumn = -netInserts
 			}
 			stopColumn = bestColumn + (slackDist / (insCost + delCost)) + 1
+			if stopColumn < 0 {
+				stopColumn = 0
+			}
 			if stopColumn > lenS {
 				stopColumn = lenS + 1
 			}
diff --git a/pkg/util/fuzzystrmatch/leven_test.go b/pkg/util/fuzzystrmatch/leven_test.go
@@ -5,7 +5,10 @@
 
 package fuzzystrmatch
 
-import "testing"
+import (
+	"math"
+	"testing"
+)
 
 func TestLevenshteinDistance(t *testing.T) {
 	tt := []struct {
@@ -482,3 +485,33 @@ func TestLevenshteinLessEqualDistanceWithCost(t *testing.T) {
 		}
 	}
 }
+
+func TestLevenshtein_ExtremeValues(t *testing.T) {
+	// Test all combinations of extreme and boundary values (math.MinInt64,
+	// math.MaxInt64, 0, 1, -1, and a few large arbitrary integers) for the
+	// integer arguments, ensuring the functions do not panic.
+	extremeValues := []int{math.MinInt64, math.MaxInt64, 0, 1, -1, -6503603920424974249, -3160545599026710833, 3234088755759361354}
+	testStrings := []string{"ab", "bc", "", "test"}
+
+	for _, source := range testStrings {
+		for _, target := range testStrings {
+			for _, insCost := range extremeValues {
+				for _, delCost := range extremeValues {
+					for _, subCost := range extremeValues {
+						for _, maxDist := range extremeValues {
+							// Call both functions and ensure they don't panic. We don't check
+							// the exact results since extreme values may cause integer
+							// overflow, but we ensure no panic occurs.
+							_ = LevenshteinLessEqualDistanceWithCost(
+								source, target, insCost, delCost, subCost, maxDist,
+							)
+							_ = LevenshteinDistanceWithCost(
+								source, target, insCost, delCost, subCost,
+							)
+						}
+					}
+				}
+			}
+		}
+	}
+}

Original file line number	Diff line number	Diff line change
`@@ -123,6 +123,9 @@ func LevenshteinLessEqualDistanceWithCost(`
`123`	`123`	`bestColumn = -netInserts`
`124`	`124`	`}`
`125`	`125`	`stopColumn = bestColumn + (slackDist / (insCost + delCost)) + 1`
	`126`	`+ if stopColumn < 0 {`
	`127`	`+ stopColumn = 0`
	`128`	`+ }`
`126`	`129`	`if stopColumn > lenS {`
`127`	`130`	`stopColumn = lenS + 1`
`128`	`131`	`}`