add dra job for 90% fill up and 10% churn

alaypatel07 · alaypatel07 · commit f309b5940135 · 2025-06-13T12:52:46.000-04:00
diff --git a/clusterloader2/testing/dra/README.md b/clusterloader2/testing/dra/README.md
@@ -0,0 +1,37 @@
+### Usage
+
+To test the workload here, use the [Getting Started](../../docs/GETTING_STARTED.md) guide
+to set up a kind cluster for the test.
+
+#### Steady State DRA Test
+
+This test scenario first fills the cluster to 90% utilization with long-running pods, then measures the performance of
+constantly scheduling short-lived pods at a steady rate.
+
+1. Use the following env variables:
+```
+export CL2_MODE=Indexed
+export CL2_NODES_PER_NAMESPACE=1
+export CL2_LOAD_TEST_THROUGHPUT=20   # Fast initial fill
+export CL2_STEADY_STATE_QPS=5        # Controlled rate for measurement
+export CL2_JOB_RUNNING_TIME=30s      # Short-lived pods runtime
+export CL2_LONG_JOB_RUNNING_TIME=1h  # Long-running pods runtime (for cluster fill)
+export CL2_GPUS_PER_NODE=8           # GPUs per node
+export CL2_FILL_PERCENTAGE=90        # Cluster fill percentage
+```
+
+2. Run the test with:
+```
+./run-e2e.sh cluster-loader2 \
+--provider=kind \
+--kubeconfig=/root/.kube/config \
+--report-dir=/tmp/clusterloader2-results \
+--testconfig=testing/dra/config.yaml \
+--nodes=5
+```
+
+This test will:
+1. Create ResourceClaimTemplates in each namespace
+2. Fill the cluster to 90% utilization with long-running pods (each using 1 GPU)
+3. Measure performance while continuously creating short-lived pods at a steady rate
+4. Collect metrics on pod startup latency, job lifecycle latency, and scheduler metrics
diff --git a/clusterloader2/testing/dra/config.yaml b/clusterloader2/testing/dra/config.yaml
@@ -0,0 +1,174 @@
+{{$MODE := DefaultParam .CL2_MODE "Indexed"}}  # passed to both job templates as Mode
+{{$NODES_PER_NAMESPACE := MinInt .Nodes (DefaultParam .CL2_NODES_PER_NAMESPACE 100)}}  # never larger than the node count
+{{$LOAD_TEST_THROUGHPUT := DefaultParam .CL2_LOAD_TEST_THROUGHPUT 10}}  # qps of the FastFill tuning set
+{{$STEADY_STATE_QPS := DefaultParam .CL2_STEADY_STATE_QPS 5}}  # qps of the SteadyState tuning set
+{{$token := .CL2_TOKEN }}  # NOTE(review): read without a default; confirm CL2_TOKEN is always supplied
+
+{{$namespaces := DivideInt .Nodes $NODES_PER_NAMESPACE}}  # node count divided by nodes per namespace
+
+# Node resource configuration: total GPU capacity is GPUs per node times node count
+{{$gpusPerNode := DefaultParam .CL2_GPUS_PER_NODE 8}}
+{{$totalGPUs := MultiplyInt $gpusPerNode .Nodes}}
+
+# Fast-fill configuration: long-running jobs sized to $fillPercentage percent of all GPUs
+{{$fillPercentage := DefaultParam .CL2_FILL_PERCENTAGE 90}}
+{{$fillPodsCount := DivideInt (MultiplyInt $totalGPUs $fillPercentage) 100}}
+{{$fillPodsPerNamespace := DivideInt $fillPodsCount $namespaces}}
+{{$longJobSize := 1}}  # parallelism and completions of each long-running job
+{{$longJobRunningTime := DefaultParam .CL2_LONG_JOB_RUNNING_TIME "1h"}}
+
+# Churn configuration for steady state: short-lived jobs sized to the GPUs left over after the fill
+{{$smallJobPodsCount := SubtractInt $totalGPUs (MultiplyInt $fillPodsPerNamespace $namespaces)}}
+{{$smallJobsPerNamespace := DivideInt $smallJobPodsCount $namespaces}}
+{{$smallJobSize := 1}}  # parallelism of each short-lived job
+{{$smallJobCompletions := 10}}  # completions of each short-lived job
+{{$jobRunningTime := DefaultParam .CL2_JOB_RUNNING_TIME "30s"}}
+
+name: dra-steady-state
+
+namespace:
+  number: {{$namespaces}}
+
+tuningSets:
+- name: FastFill  # used for ResourceClaimTemplate creation and the initial fill
+  qpsLoad:
+    qps: {{$LOAD_TEST_THROUGHPUT}}
+- name: SteadyState  # used for the short-lived churn jobs
+  qpsLoad:
+    qps: {{$STEADY_STATE_QPS}}
+
+steps:
+- name: Start measurements
+  measurements:
+  - Identifier: WaitForFinishedJobs  # gathered after the short-lived jobs are created
+    Method: WaitForFinishedJobs
+    Params:
+      action: start
+      labelSelector: job-type = short-lived
+  - Identifier: WaitForControlledPodsRunning  # gathered after the fill jobs are created
+    Method: WaitForControlledPodsRunning
+    Params:
+      action: start
+      apiVersion: batch/v1
+      kind: Job
+      labelSelector: job-type = long-running
+      operationTimeout: 120s
+  - Identifier: FastFillSchedulingMetrics  # reset in the next step, gathered after the fill
+    Method: SchedulingMetrics
+    Params:
+      action: start
+      token: {{ $token }}
+      endpoint: "localhost:10259"
+  - Identifier: FastFillPodStartupLatency  # selects only the long-running fill pods
+    Method: PodStartupLatency
+    Params:
+      action: start
+      labelSelector: job-type = long-running
+      threshold: 20s
+- name: Clearing SchedulingMetrics
+  measurements:
+  - Identifier: FastFillSchedulingMetrics  # same identifier as the fill-phase scheduler measurement
+    Method: SchedulingMetrics
+    Params:
+      action: reset  # issued before any fill object is created
+      token: {{ $token }}
+      endpoint: "localhost:10259"
+- name: Create ResourceClaimTemplates in namespaces
+  phases:
+  - namespaceRange:
+      min: 1
+      max: {{$namespaces}}
+    replicasPerNamespace: 1  # one template per namespace
+    tuningSet: FastFill
+    objectBundle:
+    - basename: single-gpu  # NOTE(review): job templates reference single-gpu-0; presumably basename plus replica index, confirm
+      objectTemplatePath: "resourceclaimtemplate.yaml"
+- name: Fill cluster to {{$fillPercentage}}% utilization
+  phases:
+  - namespaceRange:
+      min: 1
+      max: {{$namespaces}}
+    replicasPerNamespace: {{$fillPodsPerNamespace}}  # long-running Jobs created per namespace
+    tuningSet: FastFill
+    objectBundle:
+    - basename: long-running
+      objectTemplatePath: "long-running-job.yaml"
+      templateFillMap:
+        Replicas: {{$longJobSize}}  # used for both parallelism and completions in the template
+        Mode: {{$MODE}}  # rendered as completionMode
+        Sleep: {{$longJobRunningTime}}  # rendered as the container argument
+- name: Wait for fill pods to be running
+  measurements:
+  - Identifier: WaitForControlledPodsRunning  # started in the first step for batch/v1 Jobs
+    Method: WaitForControlledPodsRunning
+    Params:
+      action: gather
+      labelSelector: job-type = long-running
+      syncTimeout: 15m  # gather reads syncTimeout; a plain timeout key is not consulted by this measurement
+- name: Gather measurements for long running pods
+  measurements:
+  - Identifier: FastFillSchedulingMetrics  # scheduler metrics covering the fill phase
+    Method: SchedulingMetrics
+    Params:
+      action: gather
+      token: {{ $token }}
+      endpoint: "localhost:10259"
+  - Identifier: FastFillPodStartupLatency  # startup latency of the long-running pods
+    Method: PodStartupLatency
+    Params:
+      action: gather
+- name: reset metrics for steady state churn
+  measurements:
+  - Identifier: ChurnSchedulingMetrics  # separate identifier from the fill-phase scheduler metrics
+    Method: SchedulingMetrics
+    Params:
+      action: start
+      token: {{ $token }}
+      endpoint: "localhost:10259"
+  - Identifier: ChurnSchedulingMetrics  # same identifier, reset right after start
+    Method: SchedulingMetrics
+    Params:
+      action: reset
+      token: {{ $token }}
+      endpoint: "localhost:10259"
+  - Identifier: ChurnPodStartupLatency  # selects only the short-lived churn pods
+    Method: PodStartupLatency
+    Params:
+      action: start
+      labelSelector: job-type = short-lived
+      threshold: 20s
+- name: Create steady state {{$MODE}} jobs
+  phases:
+  - namespaceRange:
+      min: 1
+      max: {{$namespaces}}
+    replicasPerNamespace: {{$smallJobsPerNamespace}}  # short-lived Jobs created per namespace
+    tuningSet: SteadyState
+    objectBundle:
+    - basename: small
+      objectTemplatePath: "job.yaml"
+      templateFillMap:
+        Replicas: {{$smallJobSize}}  # rendered as parallelism
+        CompletionReplicas: {{$smallJobCompletions}}  # rendered as completions
+        Mode: {{$MODE}}  # rendered as completionMode
+        Sleep: {{$jobRunningTime}}  # rendered as the container argument
+- name: Wait for short-lived jobs to finish
+  measurements:
+  - Identifier: WaitForFinishedJobs  # started in the first step with the same selector
+    Method: WaitForFinishedJobs
+    Params:
+      action: gather
+      labelSelector: job-type = short-lived
+      timeout: 15m
+- name: Measure scheduler metrics
+  measurements:
+  - Identifier: ChurnSchedulingMetrics  # scheduler metrics covering the churn phase
+    Method: SchedulingMetrics
+    Params:
+      action: gather
+      token: {{ $token }}
+      endpoint: "localhost:10259"
+  - Identifier: ChurnPodStartupLatency  # startup latency of the short-lived pods
+    Method: PodStartupLatency
+    Params:
+      action: gather
diff --git a/clusterloader2/testing/dra/job.yaml b/clusterloader2/testing/dra/job.yaml
@@ -0,0 +1,30 @@
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: {{.Name}}
+  labels:
+    group: test-job
+    job-type: short-lived  # matched by the short-lived label selectors in config.yaml
+spec:
+  parallelism: {{.Replicas}}
+  completions: {{.CompletionReplicas}}
+  completionMode: {{.Mode}}
+  ttlSecondsAfterFinished: 300
+  template:
+    metadata:
+      labels:
+        group: test-pod
+        job-type: short-lived
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: {{.Name}}
+        image: gcr.io/k8s-staging-perf-tests/sleep:v0.0.3
+        args:
+        - {{.Sleep}}
+        resources:
+          claims:
+          - name: gpu  # refers to the pod-level resourceClaims entry below
+      resourceClaims:
+      - name: gpu
+        resourceClaimTemplateName: single-gpu-0
diff --git a/clusterloader2/testing/dra/long-running-job.yaml b/clusterloader2/testing/dra/long-running-job.yaml
@@ -0,0 +1,30 @@
+apiVersion: batch/v1
+kind: Job
+metadata:
+  name: {{.Name}}
+  labels:
+    group: test-job
+    job-type: long-running  # matched by the long-running label selectors in config.yaml
+spec:
+  parallelism: {{.Replicas}}
+  completions: {{.Replicas}}
+  completionMode: {{.Mode}}
+  activeDeadlineSeconds: 86400  # 24 hours
+  template:
+    metadata:
+      labels:
+        group: test-pod
+        job-type: long-running
+    spec:
+      restartPolicy: Never
+      containers:
+      - name: {{.Name}}
+        image: gcr.io/k8s-staging-perf-tests/sleep:v0.0.3
+        args:
+        - {{.Sleep}}
+        resources:
+          claims:
+          - name: gpu  # refers to the pod-level resourceClaims entry below
+      resourceClaims:
+      - name: gpu
+        resourceClaimTemplateName: single-gpu-0
diff --git a/clusterloader2/testing/dra/resourceclaimtemplate.yaml b/clusterloader2/testing/dra/resourceclaimtemplate.yaml
@@ -0,0 +1,10 @@
+apiVersion: resource.k8s.io/v1beta1
+kind: ResourceClaimTemplate
+metadata:
+  name: {{.Name}}
+spec:
+  spec:
+    devices:
+      requests:
+      - name: gpu  # single request entry
+        deviceClassName: gpu.example.com