File tree Expand file tree Collapse file tree 2 files changed +24
-0
lines changed Expand file tree Collapse file tree 2 files changed +24
-0
lines changed Original file line number Diff line number Diff line change 32
32
averageValue : 20
33
33
behavior :
34
34
scaleUp :
35
+ # The stabilizationWindowSeconds is set to 0 to allow for immediate
36
+ # scaling up. This is a trade-off:
37
+ # - For highly volatile workloads, immediate scaling is critical to
38
+ # maintain performance and responsiveness.
39
+ # - However, this also introduces a risk of over-scaling if the workload
40
+ # spikes are very brief. A non-zero value would make the scaling
41
+ # less sensitive to short-lived spikes, but could introduce latency
42
+ # if the load persists.
35
43
stabilizationWindowSeconds : 0
36
44
policies :
37
45
- type : Pods
42
50
periodSeconds : 15
43
51
selectPolicy : Max
44
52
scaleDown :
53
+ # The stabilizationWindowSeconds is set to 30 to prevent the HPA from
54
+ # scaling down too aggressively. The controller takes the highest replica
55
+ # count recommended during the past 30 seconds before it removes any pods.
56
+ # This helps to smooth out the scaling behavior and prevent "flapping"
57
+ # (rapidly scaling up and down). A larger value will make the scaling
58
+ # more conservative, which can be useful for workloads with fluctuating
59
+ # metrics, but it may also result in higher costs if the resources are
60
+ # not released quickly after a load decrease.
45
61
stabilizationWindowSeconds : 30
46
62
policies :
47
63
- type : Percent
Original file line number Diff line number Diff line change 34
34
# The scaling behavior can be customized to control how quickly the
35
35
# deployment scales up or down.
36
36
scaleDown :
37
+ # The stabilizationWindowSeconds is set to 30 to prevent the HPA from
38
+ # scaling down too aggressively. The controller takes the highest replica
39
+ # count recommended during the past 30 seconds before it removes any pods.
40
+ # This helps to smooth out the scaling behavior and prevent "flapping"
41
+ # (rapidly scaling up and down). A larger value will make the scaling
42
+ # more conservative, which can be useful for workloads with fluctuating
43
+ # metrics, but it may also result in higher costs if the resources are
44
+ # not released quickly after a load decrease.
37
45
stabilizationWindowSeconds : 30
38
46
policies :
39
47
- type : Percent
You can’t perform that action at this time.
0 commit comments