test: update tests to support ARM architecture

ilopezluna · ilopezluna · commit 2c9f3d2dfc09 · 2025-09-29T14:10:41.000+02:00
diff --git a/.gitignore b/.gitignore
@@ -4,6 +4,8 @@ model-runner
 model-runner.sock
 # Default MODELS_PATH in Makefile
 models-store/
+# Default MODELS_PATH in mdltool
+model-store/
 # Directory where we store the updated llama.cpp
 updated-inference/
 vendor/
diff --git a/pkg/inference/backends/llamacpp/llamacpp_config_test.go b/pkg/inference/backends/llamacpp/llamacpp_config_test.go
@@ -72,6 +72,13 @@ func TestGetArgs(t *testing.T) {
 	modelPath := "/path/to/model"
 	socket := "unix:///tmp/socket"
 
+	// Build base expected args based on architecture
+	baseArgs := []string{"--jinja", "-ngl", "999", "--metrics"}
+	if runtime.GOARCH == "arm64" {
+		nThreads := min(2, runtime.NumCPU()/2)
+		baseArgs = append(baseArgs, "--threads", strconv.Itoa(nThreads))
+	}
+
 	tests := []struct {
 		name     string
 		bundle   types.ModelBundle
@@ -85,30 +92,24 @@ func TestGetArgs(t *testing.T) {
 			bundle: &fakeBundle{
 				ggufPath: modelPath,
 			},
-			expected: []string{
-				"--jinja",
-				"-ngl", "999",
-				"--metrics",
+			expected: append(append([]string{}, baseArgs...),
 				"--model", modelPath,
 				"--host", socket,
 				"--ctx-size", "4096",
-			},
+			),
 		},
 		{
 			name: "embedding mode",
 			mode: inference.BackendModeEmbedding,
 			bundle: &fakeBundle{
 				ggufPath: modelPath,
 			},
-			expected: []string{
-				"--jinja",
-				"-ngl", "999",
-				"--metrics",
+			expected: append(append([]string{}, baseArgs...),
 				"--model", modelPath,
 				"--host", socket,
 				"--embeddings",
 				"--ctx-size", "4096",
-			},
+			),
 		},
 		{
 			name: "context size from backend config",
@@ -119,15 +120,12 @@ func TestGetArgs(t *testing.T) {
 			config: &inference.BackendConfiguration{
 				ContextSize: 1234,
 			},
-			expected: []string{
-				"--jinja",
-				"-ngl", "999",
-				"--metrics",
+			expected: append(append([]string{}, baseArgs...),
 				"--model", modelPath,
 				"--host", socket,
 				"--embeddings",
 				"--ctx-size", "1234", // should add this flag
-			},
+			),
 		},
 		{
 			name: "context size from model config",
@@ -141,15 +139,12 @@ func TestGetArgs(t *testing.T) {
 			config: &inference.BackendConfiguration{
 				ContextSize: 1234,
 			},
-			expected: []string{
-				"--jinja",
-				"-ngl", "999",
-				"--metrics",
+			expected: append(append([]string{}, baseArgs...),
 				"--model", modelPath,
 				"--host", socket,
 				"--embeddings",
 				"--ctx-size", "2096", // model config takes precedence
-			},
+			),
 		},
 		{
 			name: "chat template from model artifact",
@@ -158,15 +153,12 @@ func TestGetArgs(t *testing.T) {
 				ggufPath:     modelPath,
 				templatePath: "/path/to/bundle/template.jinja",
 			},
-			expected: []string{
-				"--jinja",
-				"-ngl", "999",
-				"--metrics",
+			expected: append(append([]string{}, baseArgs...),
 				"--model", modelPath,
 				"--host", socket,
 				"--chat-template-file", "/path/to/bundle/template.jinja",
 				"--ctx-size", "4096",
-			},
+			),
 		},
 		{
 			name: "raw flags from backend config",
@@ -177,16 +169,13 @@ func TestGetArgs(t *testing.T) {
 			config: &inference.BackendConfiguration{
 				RuntimeFlags: []string{"--some", "flag"},
 			},
-			expected: []string{
-				"--jinja",
-				"-ngl", "999",
-				"--metrics",
+			expected: append(append([]string{}, baseArgs...),
 				"--model", modelPath,
 				"--host", socket,
 				"--embeddings",
 				"--ctx-size", "4096",
 				"--some", "flag", // model config takes precedence
-			},
+			),
 		},
 	}