trustyai-explainability
diff --git a/api/lmes/v1alpha1/lmevaljob_types.go b/api/lmes/v1alpha1/lmevaljob_types.go
Lines changed: 18 additions & 9 deletions
diff --git a/config/crd/bases/trustyai.opendatahub.io_lmevaljobs.yaml b/config/crd/bases/trustyai.opendatahub.io_lmevaljobs.yaml
Lines changed: 18 additions & 0 deletions
diff --git a/controllers/lmes/driver/driver.go b/controllers/lmes/driver/driver.go
Lines changed: 16 additions & 11 deletions
diff --git a/controllers/lmes/driver/driver_test.go b/controllers/lmes/driver/driver_test.go
Lines changed: 15 additions & 20 deletions
@@ -61,13 +61,16 @@ const (
 )
 
+// Arg is a single name/value argument pair. Both fields are constrained by
+// CRD validation patterns to a conservative character set.
 type Arg struct {
-	Name  string `json:"name"`
+	// Name is the argument's key. It must be non-empty and may contain only
+	// ASCII letters, digits, '.', '_' and '-'.
+	// +kubebuilder:validation:Pattern=`^[a-zA-Z0-9._-]+$`
+	Name string `json:"name"`
+	// Value is the argument's value. It may be empty and may contain only
+	// ASCII letters, digits, '.', '_', '/', ':', '-' and spaces.
+	// +kubebuilder:validation:Pattern=`^[a-zA-Z0-9._/:\- ]*$`
 	Value string `json:"value,omitempty"`
 }
 
 type Card struct {
 	// Unitxt card's ID
 	// +optional
+	// +kubebuilder:validation:Pattern=`^[a-zA-Z0-9._-]+$`
 	Name string `json:"name,omitempty"`
 	// A JSON string for a custom unitxt card which contains the custom dataset.
 	// Use the documentation here: https://www.unitxt.ai/en/latest/docs/adding_dataset.html#adding-to-the-catalog
@@ -212,6 +215,7 @@ type TaskRecipe struct {
 // GitSource specifies the git location of external tasks
 type GitSource struct {
 	// URL specifies the git repository URL
+	// +kubebuilder:validation:Pattern=`^https://[a-zA-Z0-9._/-]+$`
 	URL string `json:"url,omitempty"`
 	// Branch specifies the git branch to use
 	// +optional
@@ -221,6 +225,7 @@ type GitSource struct {
 	Commit *string `json:"commit,omitempty"`
 	// Path specifies the path to the task file
 	// +optional
+	// +kubebuilder:validation:Pattern=`^[a-zA-Z0-9._/-]*$`
 	Path string `json:"path,omitempty"`
 }
 
@@ -238,6 +243,7 @@ type CustomTasks struct {
 
 type TaskList struct {
 	// TaskNames from lm-eval's task list and/or from custom tasks if CustomTasks is defined
+	// +kubebuilder:validation:items:Pattern=`^[a-zA-Z0-9._-]+$`
 	TaskNames []string `json:"taskNames,omitempty"`
 	// Task Recipes specifically for Unitxt
 	TaskRecipes []TaskRecipe `json:"taskRecipes,omitempty"`
@@ -446,14 +452,15 @@ func (p *LMEvalPodSpec) GetSideCards() []corev1.Container {
 }
 
+// OfflineS3Spec holds the S3 settings of an offline-mode job. The access key
+// ID, secret access key, bucket, region and endpoint are not given inline:
+// each is a SecretKeySelector, i.e. a reference to a key of a Secret. Path is
+// a plain string. VerifySSL and CABundle are optional (pointer fields tagged
+// omitempty).
 type OfflineS3Spec struct {
-	AccessKeyIdRef     corev1.SecretKeySelector  `json:"accessKeyId"`
-	SecretAccessKeyRef corev1.SecretKeySelector  `json:"secretAccessKey"`
-	Bucket             corev1.SecretKeySelector  `json:"bucket"`
-	Path               string                    `json:"path"`
-	Region             corev1.SecretKeySelector  `json:"region"`
-	Endpoint           corev1.SecretKeySelector  `json:"endpoint"`
-	VerifySSL          *bool                     `json:"verifySSL,omitempty"`
-	CABundle           *corev1.SecretKeySelector `json:"caBundle,omitempty"`
+	AccessKeyIdRef     corev1.SecretKeySelector `json:"accessKeyId"`
+	SecretAccessKeyRef corev1.SecretKeySelector `json:"secretAccessKey"`
+	Bucket             corev1.SecretKeySelector `json:"bucket"`
+	// Path may contain only ASCII letters, digits, '.', '_', '/' and '-';
+	// the pattern also admits the empty string.
+	// +kubebuilder:validation:Pattern=`^[a-zA-Z0-9._/-]*$`
+	Path      string                    `json:"path"`
+	Region    corev1.SecretKeySelector  `json:"region"`
+	Endpoint  corev1.SecretKeySelector  `json:"endpoint"`
+	VerifySSL *bool                     `json:"verifySSL,omitempty"`
+	CABundle  *corev1.SecretKeySelector `json:"caBundle,omitempty"`
 }
 
 // OfflineStorageSpec defines the storage configuration for LMEvalJob's offline mode
@@ -493,6 +500,7 @@ type LMEvalJobSpec struct {
 	// Important: Run "make" to regenerate code after modifying this file
 
 	// Model name
+	// +kubebuilder:validation:Enum=hf;openai-completions;openai-chat-completions;local-completions;local-chat-completions;watsonx_llm;textsynth
 	Model string `json:"model"`
 	// Args for the model
 	// +optional
@@ -506,6 +514,7 @@ type LMEvalJobSpec struct {
 	// the number of documents to evaluate to the first X documents (if an integer)
 	// per task or first X% of documents per task
 	// +optional
+	// +kubebuilder:validation:Pattern=`^(\d+\.?\d*|\d*\.\d+)$`
 	Limit string `json:"limit,omitempty"`
 	// Map to `--gen_kwargs` parameter for the underlying library.
 	// +optional
 
@@ -75,8 +75,10 @@ spec:
                 items:
                   properties:
                     name:
+                      pattern: ^[a-zA-Z0-9._-]+$
                       type: string
                     value:
+                      pattern: ^[a-zA-Z0-9._/:\- ]*$
                       type: string
                   required:
                   - name
@@ -87,6 +89,7 @@ spec:
                   Accepts an integer, or a float between 0.0 and 1.0 . If passed, will limit
                   the number of documents to evaluate to the first X documents (if an integer)
                   per task or first X% of documents per task
+                pattern: ^(\d+\.?\d*|\d*\.\d+)$
                 type: string
               logSamples:
                 description: |-
@@ -95,14 +98,24 @@ spec:
                 type: boolean
               model:
                 description: Model name
+                enum:
+                - hf
+                - openai-completions
+                - openai-chat-completions
+                - local-completions
+                - local-chat-completions
+                - watsonx_llm
+                - textsynth
                 type: string
               modelArgs:
                 description: Args for the model
                 items:
                   properties:
                     name:
+                      pattern: ^[a-zA-Z0-9._-]+$
                       type: string
                     value:
+                      pattern: ^[a-zA-Z0-9._/:\- ]*$
                       type: string
                   required:
                   - name
@@ -204,6 +217,7 @@ spec:
                             type: object
                             x-kubernetes-map-type: atomic
                           path:
+                            pattern: ^[a-zA-Z0-9._/-]*$
                             type: string
                           region:
                             description: SecretKeySelector selects a key of a Secret.
@@ -4828,9 +4842,11 @@ spec:
                                 type: string
                               path:
                                 description: Path specifies the path to the task file
+                                pattern: ^[a-zA-Z0-9._/-]*$
                                 type: string
                               url:
                                 description: URL specifies the git repository URL
+                                pattern: ^https://[a-zA-Z0-9._/-]+$
                                 type: string
                             type: object
                         type: object
@@ -4839,6 +4855,7 @@ spec:
                     description: TaskNames from lm-eval's task list and/or from custom
                       tasks if CustomTasks is defined
                     items:
+                      pattern: ^[a-zA-Z0-9._-]+$
                       type: string
                     type: array
                   taskRecipes:
@@ -4860,6 +4877,7 @@ spec:
                               type: string
                             name:
                               description: Unitxt card's ID
+                              pattern: ^[a-zA-Z0-9._-]+$
                               type: string
                           type: object
                         demosPoolSize:
 
@@ -218,7 +218,7 @@ func (d *driverImpl) detectDevice() error {
 		return fmt.Errorf("failed to find the matched output")
 	}
 
-	patchDevice(d.Option.Args, matches[1] == "True")
+	d.Option.Args = patchDevice(d.Option.Args, matches[1] == "True")
 
 	return nil
 }
@@ -241,21 +241,21 @@ func (d *driverImpl) downloadS3Assets() error {
 	return nil
 }
 
-func patchDevice(args []string, hasCuda bool) {
-	var device = "cpu"
+// patchDevice returns args with a `--device` option appended: "cuda" when
+// hasCuda is true, "cpu" otherwise. If args already selects a device, either
+// as a separate `--device` token or in the single-token `--device=<value>`
+// form, args is returned unchanged so an explicit choice is never overridden.
+//
+// The flag and its value are appended as two separate elements, so args is
+// expected to be a tokenized argument list rather than one shell command
+// string. NOTE(review): confirm every producer of Option.Args builds it that
+// way; a flag appended after a single command string would not reach lm_eval.
+//
+// As with append, the result may share its backing array with args; callers
+// must use the returned slice rather than rely on in-place mutation.
+func patchDevice(args []string, hasCuda bool) []string {
+	device := "cpu"
 	if hasCuda {
 		device = "cuda"
 	}
-	// patch the python command in the Option.Arg by adding the `--device cuda` option
-	// find the string with the `python -m lm_eval` prefix. usually it should be the last one
-	for idx, arg := range args {
-		if strings.HasPrefix(arg, "python -m lm_eval") {
-			if !strings.Contains(arg, "--device") {
-				args[idx] = fmt.Sprintf("%s --device %s", arg, device)
-			}
-			break
+
+	// An explicit device wins. Match both spellings: `--device X` (separate
+	// tokens) and `--device=X` (one token, also accepted by Python's argparse).
+	for _, arg := range args {
+		if arg == "--device" || strings.HasPrefix(arg, "--device=") {
+			return args // already has device specified
 		}
 	}
+
+	// If we reach here, --device doesn't exist, so add it
+	return append(args, "--device", device)
 }
 
-// Create a domain socket and use HTTP protocal to handle communication
+// Create a domain socket and use HTTP protocol to handle communication
@@ -598,6 +598,7 @@ func (d *driverImpl) fetchGitCustomTasks() error {
 		return err
 	}
 
+	// #nosec G204 -- CustomTaskGitURL is validated by ValidateGitURL() in the controller
 	cloneCommand := exec.Command("git", "clone", d.Option.CustomTaskGitURL, repositoryDestination)
 	if output, err := cloneCommand.CombinedOutput(); err != nil {
 		return fmt.Errorf("failed to clone git repository: %v, output: %s", err, string(output))
@@ -608,12 +609,14 @@ func (d *driverImpl) fetchGitCustomTasks() error {
 
 	// Checkout a specific branch, if specified
 	if d.Option.CustomTaskGitBranch != "" {
+		// #nosec G204 -- CustomTaskGitBranch is validated by ValidateGitBranch() in the controller
 		checkoutCommand := exec.Command("git", clonedDirectory, workTree, "checkout", d.Option.CustomTaskGitBranch)
 		if output, err := checkoutCommand.CombinedOutput(); err != nil {
 			return fmt.Errorf("failed to checkout branch %s: %v, output: %s",
 				d.Option.CustomTaskGitBranch, err, string(output))
 		}
 	} else {
+		// #nosec G204 -- DefaultGitBranch is a constant value, not user input
 		checkoutCmd := exec.Command("git", clonedDirectory, workTree, "checkout", DefaultGitBranch)
 		if output, err := checkoutCmd.CombinedOutput(); err != nil {
 			d.Option.Logger.Info("failed to checkout main branch, using default branch from clone",
@@ -623,6 +626,7 @@ func (d *driverImpl) fetchGitCustomTasks() error {
 
 	// Checkout a specific commit, if specified
 	if d.Option.CustomTaskGitCommit != "" {
+		// #nosec G204 -- CustomTaskGitCommit is validated by ValidateGitCommit() in the controller
 		checkoutCommand := exec.Command("git", clonedDirectory, workTree, "checkout", d.Option.CustomTaskGitCommit)
 		if output, err := checkoutCommand.CombinedOutput(); err != nil {
 			return fmt.Errorf("failed to checkout commit %s: %v, output: %s",
@@ -644,6 +648,7 @@ func (d *driverImpl) fetchGitCustomTasks() error {
 		return err
 	}
 
+	// #nosec G204 -- taskPath is derived from validated CustomTaskGitPath, TaskRecipesPath is controlled by the application
 	copyCmd := exec.Command("cp", "-r", taskPath+"/.", d.Option.TaskRecipesPath)
 	output, err := copyCmd.CombinedOutput()
 	if err != nil {
 
@@ -234,31 +234,26 @@ func Test_PatchDevice(t *testing.T) {
 		OutputPath:   ".",
 		DetectDevice: true,
 		Logger:       driverLog,
-		Args:         []string{"sh", "-ec", "python -m lm_eval --output_path /opt/app-root/src/output --model test --model_args arg1=value1 --tasks task1,task2"},
+		Args:         []string{"python", "-m", "lm_eval", "--output_path", "/opt/app-root/src/output", "--model", "test", "--model_args", "arg1=value1", "--tasks", "task1,task2"},
 	}
 
 	// append `--device cuda`
-	patchDevice(driverOpt.Args, true)
-	assert.Equal(t,
-		"python -m lm_eval --output_path /opt/app-root/src/output --model test --model_args arg1=value1 --tasks task1,task2 --device cuda",
-		driverOpt.Args[2],
-	)
+	driverOpt.Args = patchDevice(driverOpt.Args, true)
+	expected := []string{"python", "-m", "lm_eval", "--output_path", "/opt/app-root/src/output", "--model", "test", "--model_args", "arg1=value1", "--tasks", "task1,task2", "--device", "cuda"}
+	assert.Equal(t, expected, driverOpt.Args)
 
 	// append `--device cpu`
-	driverOpt.Args = []string{"sh", "-ec", "python -m lm_eval --output_path /opt/app-root/src/output --model test --model_args arg1=value1 --tasks task1,task2"}
-	patchDevice(driverOpt.Args, false)
-	assert.Equal(t,
-		"python -m lm_eval --output_path /opt/app-root/src/output --model test --model_args arg1=value1 --tasks task1,task2 --device cpu",
-		driverOpt.Args[2],
-	)
-
-	// no change because `--device cpu` exists
-	driverOpt.Args = []string{"sh", "-ec", "python -m lm_eval --device cpu --output_path /opt/app-root/src/output --model test --model_args arg1=value1 --tasks task1,task2"}
-	patchDevice(driverOpt.Args, true)
-	assert.Equal(t,
-		"python -m lm_eval --device cpu --output_path /opt/app-root/src/output --model test --model_args arg1=value1 --tasks task1,task2",
-		driverOpt.Args[2],
-	)
+	driverOpt.Args = []string{"python", "-m", "lm_eval", "--output_path", "/opt/app-root/src/output", "--model", "test", "--model_args", "arg1=value1", "--tasks", "task1,task2"}
+	driverOpt.Args = patchDevice(driverOpt.Args, false)
+	expected = []string{"python", "-m", "lm_eval", "--output_path", "/opt/app-root/src/output", "--model", "test", "--model_args", "arg1=value1", "--tasks", "task1,task2", "--device", "cpu"}
+	assert.Equal(t, expected, driverOpt.Args)
+
+	// no change because `--device` already exists
+	driverOpt.Args = []string{"python", "-m", "lm_eval", "--device", "cpu", "--output_path", "/opt/app-root/src/output", "--model", "test", "--model_args", "arg1=value1", "--tasks", "task1,task2"}
+	originalArgs := make([]string, len(driverOpt.Args))
+	copy(originalArgs, driverOpt.Args)
+	driverOpt.Args = patchDevice(driverOpt.Args, true)
+	assert.Equal(t, originalArgs, driverOpt.Args)
 }
 
 func Test_TaskRecipes(t *testing.T) {