Fix default GPU utilization for workloads: resolve pod type from the workloadKind label and handle interactive/distributed types

eliranw · eliranw · commit e7af5c5b3fa1 · 2025-12-21T15:36:20.000+02:00
diff --git a/internal/status-updater/handlers/pod/gpu_usage_calculator.go b/internal/status-updater/handlers/pod/gpu_usage_calculator.go
@@ -71,7 +71,7 @@ func calculateGpuUsageFromPodType(dynamicclient dynamic.Interface, pod *v1.Pod,
 	switch podType {
 	case "train":
 		return generateGpuUsageStatus(topology.Range{Min: 80, Max: 100}, gpuFraction, totalGpuMemory, false)
-	case "build", "interactive-preemptible":
+	case "build", "interactive-preemptible", "interactive", "distributed":
 		return generateGpuUsageStatus(topology.Range{Min: 0, Max: 0}, gpuFraction, totalGpuMemory, false)
 	case "inference":
 		return generateGpuUsageStatus(topology.Range{Min: 0, Max: 0}, gpuFraction, totalGpuMemory, true)
@@ -104,6 +104,22 @@ func calculateUtilizationFromAnnotation(annotationValue string) (*topology.Range
 }
 
 func getPodType(dynamicClient dynamic.Interface, pod *v1.Pod) (string, error) {
+	// First, try to get workload type from pod labels
+	if workloadKind, ok := pod.Labels["workloadKind"]; ok {
+		// Map Run:AI workload kinds to utilization types
+		switch workloadKind {
+		case "TrainingWorkload":
+			return "train", nil
+		case "DistributedWorkload":
+			return "distributed", nil
+		case "InferenceWorkload":
+			return "inference", nil
+		case "InteractiveWorkload":
+			return "interactive", nil
+		}
+	}
+
+	// Fallback to existing PodGroup lookup
 	podGroupName := pod.Annotations[constants.AnnotationPodGroupName]
 	if podGroupName == "" {
 		return "", fmt.Errorf("pod %s has no constants.PodGroupNameAnnotation annotation", pod.Name)