@@ -67,6 +67,22 @@ steps:
67
67
Method : PrometheusSchedulingMetrics
68
68
Params :
69
69
action : start
70
+ - Identifier : FastFillDRAMetrics
71
+ Method : GenericPrometheusQuery
72
+ Params :
73
+ action : start
74
+ metricName : fastfill_kubelet_latencies
75
+ metricVersion : v1
76
+ unit : s
77
+ queries :
78
+ - name : p99_dra_prepare_resources
79
+ query : histogram_quantile(0.99, sum(rate(dra_operations_duration_seconds_bucket{operation_name="PrepareResources"}[%v])) by (le))
80
+ - name : p99_dra_unprepare_resources
81
+ query : histogram_quantile(0.99, sum(rate(dra_operations_duration_seconds_bucket{operation_name="UnprepareResources"}[%v])) by (le))
82
+ - name : p99_dra_grpc_node_prepare_resources
83
+ query : histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodePrepareResources"}[%v])) by (le))
84
+ - name : p99_dra_grpc_node_unprepare_resources
85
+ query : histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodeUnprepareResources"}[%v])) by (le))
70
86
- name : Create ResourceClaimTemplates in namespaces
71
87
phases :
72
88
- namespaceRange :
@@ -109,6 +125,10 @@ steps:
109
125
Method : PodStartupLatency
110
126
Params :
111
127
action : gather
128
+ - Identifier : FastFillDRAMetrics
129
+ Method : GenericPrometheusQuery
130
+ Params :
131
+ action : gather
112
132
- name : reset metrics for steady state churn
113
133
measurements :
114
134
- Identifier : ChurnSchedulingMetrics
@@ -123,6 +143,22 @@ steps:
123
143
perc50Threshold : 40s
124
144
perc90Threshold : 60s
125
145
perc99Threshold : 80s
146
+ - Identifier : ChurnDRAMetrics
147
+ Method : GenericPrometheusQuery
148
+ Params :
149
+ action : start
150
+ metricName : churn_kubelet_latencies
151
+ metricVersion : v1
152
+ unit : s
153
+ queries :
154
+ - name : p99_prepare_operations
155
+ query : histogram_quantile(0.99, sum(rate(dra_operations_duration_seconds_bucket{operation_name="PrepareResources"}[%v])) by (le))
156
+ - name : p99_unprepare_operations
157
+ query : histogram_quantile(0.99, sum(rate(dra_operations_duration_seconds_bucket{operation_name="UnprepareResources"}[%v])) by (le))
158
+ - name : p99_dra_grpc_node_prepare_resources
159
+ query : histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodePrepareResources"}[%v])) by (le))
160
+ - name : p99_dra_grpc_node_unprepare_resources
161
+ query : histogram_quantile(0.99, sum(rate(dra_grpc_operations_duration_seconds_bucket{method_name=~".*NodeUnprepareResources"}[%v])) by (le))
126
162
- name : Create steady state {{$MODE}} jobs
127
163
phases :
128
164
- namespaceRange :
@@ -158,4 +194,8 @@ steps:
158
194
action : gather
159
195
perc50Threshold : 40s
160
196
perc90Threshold : 60s
161
- perc99Threshold : 80s
197
+ perc99Threshold : 80s
198
+ - Identifier : ChurnDRAMetrics
199
+ Method : GenericPrometheusQuery
200
+ Params :
201
+ action : gather
0 commit comments