fixes after testing

rupinSec · rupinSec · commit 6ce9b775c73f · 2025-05-23T17:34:11.000+05:30
diff --git a/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/Chart.yaml b/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/Chart.yaml
@@ -1,5 +1,5 @@
 apiVersion: v1
 appVersion: "1.0"
 description: A Helm chart for Kubernetes
-name: deployment-chart_4-21-0
+name: gpu-workload-4-21-0
 version: 4.21.0
diff --git a/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/app-values.yaml b/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/app-values.yaml
@@ -67,11 +67,10 @@ resources:
 
 gpu:
   enabled: false
+  provider: "nvidia.com/gpu"
   resources:
-    requests:
-      nvidia.com/gpu: 1
-    limits:
-      nvidia.com/gpu: 1
+    limits: 1
+    requests: 1
 
 # Optional configs
 LivenessProbe:
diff --git a/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/schema.json b/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/schema.json
@@ -734,65 +734,6 @@
           "type": "string",
           "description": "image of envoy to be used"
         },
-        "gpu": {
-          "type": "object",
-          "description": "GPU resource configuration",
-          "title": "GPU",
-          "properties": {
-            "enabled": {
-              "type": "boolean",
-              "description": "Enable GPU resources"
-            },
-            "driver": {
-              "type": "string",
-              "description": "GPU driver type (e.g. nvidia, amd64, intel). Supported: nvidia, amd64, intel."
-            },
-            "resources": {
-              "type": "object",
-              "description": "GPU resource requests and limits",
-              "properties": {
-                "requests": {
-                  "type": "object",
-                  "description": "Requested GPU resources",
-                  "properties": {
-                    "nvidia.com/gpu": {
-                      "type": ["integer", "string"],
-                      "description": "Number of NVIDIA GPUs requested"
-                    },
-                    "amd.com/gpu": {
-                      "type": ["integer", "string"],
-                      "description": "Number of AMD GPUs requested"
-                    },
-                    "intel.com/gpu": {
-                      "type": ["integer", "string"],
-                      "description": "Number of Intel GPUs requested"
-                    }
-                  },
-                  "additionalProperties": true
-                },
-                "limits": {
-                  "type": "object",
-                  "description": "GPU resource limits",
-                  "properties": {
-                    "nvidia.com/gpu": {
-                      "type": ["integer", "string"],
-                      "description": "Maximum number of NVIDIA GPUs allowed"
-                    },
-                    "amd.com/gpu": {
-                      "type": ["integer", "string"],
-                      "description": "Maximum number of AMD GPUs allowed"
-                    },
-                    "intel.com/gpu": {
-                      "type": ["integer", "string"],
-                      "description": "Maximum number of Intel GPUs allowed"
-                    }
-                  },
-                  "additionalProperties": true
-                }
-              }
-            }
-          }
-        },
         "resources": {
           "type": "object",
           "description": "minimum and maximum RAM and CPU available to the application",
@@ -840,6 +781,36 @@
         }
       }
     },
+      "gpu": {
+          "type": "object",
+          "description": "GPU resource configuration",
+          "title": "GPU",
+          "properties": {
+            "enabled": {
+              "type": "boolean",
+              "description": "Enable GPU resources",
+              "title": "GPU Spec"
+            },
+            "provider": {
+              "type": "string",
+              "description": "GPU resource name used as the key under container limits/requests, e.g. nvidia.com/gpu, amd.com/gpu, intel.com/gpu"
+            },
+            "resources": {
+              "type": "object",
+              "description": "GPU resource requests and limits",
+              "properties": {
+                "limits": {
+                  "type": ["integer", "string"],
+                  "description": "Number of GPUs set as the limit for the configured provider resource"
+                },
+                "requests": {
+                  "type": ["integer", "string"],
+                  "description": "Number of GPUs requested for the configured provider resource"
+                }
+              }
+            }
+          }
+        },
       "hostAliases":{
       "type": "array",
       "title": "hostAliases",
diff --git a/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/templates/deployment.yaml b/scripts/devtron-reference-helm-charts/gpu-workload-4-21-0/templates/deployment.yaml
@@ -193,21 +193,10 @@ spec:
           args:
 {{ toYaml .args | indent 12 -}}
 {{- end }}
-          {{- $resources := $.Values.resources | default dict }}
-          {{- $gpuResources := (and (hasKey $.Values.gpu "enabled") $.Values.gpu.enabled (hasKey $.Values.gpu "resources")) | ternary $.Values.gpu.resources (dict) }}
-          {{- $limits := merge (get $resources "limits" | default dict) (get $gpuResources "limits" | default dict) }}
-          {{- $requests := merge (get $resources "requests" | default dict) (get $gpuResources "requests" | default dict) }}
-          {{- if or $limits $requests }}
+{{- if .resources}}
           resources:
-          {{- if $limits }}
-            limits:
-{{ toYaml $limits | indent 14 }}
-          {{- end }}
-          {{- if $requests }}
-            requests:
-{{ toYaml $requests | indent 14 }}
-          {{- end }}
-          {{- end }}
+{{ toYaml .resources | indent 12 -}}
+{{- end }}
 {{- if .volumeMounts}}
           volumeMounts:
 {{ toYaml .volumeMounts | indent 12 -}}
@@ -409,21 +398,30 @@ spec:
 {{ toYaml .Values.ReadinessProbe.grpc | indent 14 }}
             {{- end}}
 {{- end }}
-          {{- $resources := $.Values.resources | default dict }}
-          {{- $gpuResources := (and (hasKey $.Values.gpu "enabled") $.Values.gpu.enabled (hasKey $.Values.gpu "resources")) | ternary $.Values.gpu.resources (dict) }}
-          {{- $limits := merge (get $resources "limits" | default dict) (get $gpuResources "limits" | default dict) }}
-          {{- $requests := merge (get $resources "requests" | default dict) (get $gpuResources "requests" | default dict) }}
-          {{- if or $limits $requests }}
+{{- $resources := $.Values.resources | default dict }}
+{{- $gpu := $.Values.gpu | default dict }}
+{{- $gpuEnabled := and (hasKey $gpu "enabled") $gpu.enabled (hasKey $gpu "provider") (hasKey $gpu "resources") }}
+{{- $gpuLimits := dict }}
+{{- $gpuRequests := dict }}
+{{- if $gpuEnabled }}
+  {{- $gpuLimits = dict $gpu.provider ($gpu.resources.limits | default 0) }}
+  {{- $gpuLimits = dict "limits" $gpuLimits }}
+  {{- $gpuRequests = dict $gpu.provider ($gpu.resources.requests | default 0) }}
+  {{- $gpuRequests = dict "requests" $gpuRequests }}
+{{- end }}
+{{- $limits := merge (get $resources "limits" | default dict) (get $gpuLimits "limits" | default dict) }}
+{{- $requests := merge (get $resources "requests" | default dict) (get $gpuRequests "requests" | default dict) }}
+{{- if or $limits $requests }}
           resources:
-          {{- if $limits }}
+{{- if $limits }}
             limits:
 {{ toYaml $limits | indent 14 }}
-          {{- end }}
-          {{- if $requests }}
+{{- end }}
+{{- if $requests }}
             requests:
 {{ toYaml $requests | indent 14 }}
-          {{- end }}
-          {{- end }}
+{{- end }}
+{{- end }}
 {{- if or $.Values.StartupProbe.Path  $.Values.StartupProbe.command $.Values.StartupProbe.tcp $.Values.StartupProbe.grpc }}
           startupProbe:
 {{- if $.Values.StartupProbe.Path }}
diff --git a/scripts/sql/33403700_gpu_workload_chart.down.sql b/scripts/sql/33403700_gpu_workload_chart.down.sql
@@ -1,3 +1,6 @@
 DELETE FROM global_strategy_metadata_chart_ref_mapping WHERE chart_ref_id=(select id from chart_ref where version='4.21.0' and name='GPU-Workload');
 
-DELETE FROM "public"."chart_ref" WHERE ("location" = 'gpu-workload_4-21-0' AND "version" = '4.21.0');
+DELETE FROM "public"."chart_ref" WHERE ("location" = 'gpu-workload-4-21-0' AND "version" = '4.21.0');
+
+-- Remove the chart description row that the matching up migration inserts into chart_ref_metadata.
+DELETE FROM chart_ref_metadata WHERE "chart_name" = 'GPU-Workload';
diff --git a/scripts/sql/33403700_gpu_workload_chart.up.sql b/scripts/sql/33403700_gpu_workload_chart.up.sql
@@ -1,6 +1,9 @@
 INSERT INTO "public"."chart_ref" ("name","location", "version", "deployment_strategy_path","is_default", "active", "created_on", "created_by", "updated_on", "updated_by") VALUES
-     ('GPU-Workload','gpu-workload_4-21-0', '4.21.0','pipeline-values.yaml','f', 't', 'now()', 1, 'now()', 1);
+     ('GPU-Workload','gpu-workload-4-21-0', '4.21.0','pipeline-values.yaml','f', 't', 'now()', 1, 'now()', 1);
 
 INSERT INTO global_strategy_metadata_chart_ref_mapping ("global_strategy_metadata_id", "chart_ref_id", "active", "created_on", "created_by", "updated_on", "updated_by","default")
 VALUES (1,(select id from chart_ref where version='4.21.0' and name='GPU-Workload'), true, now(), 1, now(), 1,true),
-(4,(select id from chart_ref where version='4.21.0' and name='GPU-Workload'), true, now(), 1, now(), 1,false);
+(4,(select id from chart_ref where version='4.21.0' and name='GPU-Workload'), true, now(), 1, now(), 1,false);
+
+INSERT INTO chart_ref_metadata("chart_name","chart_description") VALUES 
+('GPU-Workload','GPU Workload Charts enable the deployment of GPU workloads on Kubernetes Clusters.');

Original file line number	Diff line number	Diff line change
`@@ -1,3 +1,3 @@`
`1`	`1`	`DELETE FROM global_strategy_metadata_chart_ref_mapping WHERE chart_ref_id=(select id from chart_ref where version='4.21.0' and name='GPU-Workload');`
`2`	`2`
`3`		`-DELETE FROM "public"."chart_ref" WHERE ("location" = 'gpu-workload_4-21-0' AND "version" = '4.21.0');`
	`3`	`+DELETE FROM "public"."chart_ref" WHERE ("location" = 'gpu-workload-4-21-0' AND "version" = '4.21.0');`