File tree Expand file tree Collapse file tree 4 files changed +16
-4
lines changed
config/charts/inferencepool Expand file tree Collapse file tree 4 files changed +16
-4
lines changed Original file line number Diff line number Diff line change 65
65
"metricsPort" ,
66
66
runserver .DefaultMetricsPort ,
67
67
"The metrics port" )
68
+ enablePprof = flag .Bool (
69
+ "enablePprof" ,
70
+ runserver .DefaultEnablePprof ,
71
+ "Enables pprof handlers. Defaults to true. Set to false to disable pprof handlers." )
68
72
destinationEndpointHintKey = flag .String (
69
73
"destinationEndpointHintKey" ,
70
74
runserver .DefaultDestinationEndpointHintKey ,
@@ -263,10 +267,14 @@ func (r *Runner) Run(ctx context.Context) error {
263
267
setupLog .Error (err , "Failed to create controller manager" )
264
268
return err
265
269
}
266
- err = setupPprofHandlers (mgr )
267
- if err != nil {
268
- setupLog .Error (err , "Failed to setup pprof handlers" )
269
- return err
270
+
271
+ if * enablePprof {
272
+ setupLog .Info ("Enabling pprof handlers" )
273
+ err = setupPprofHandlers (mgr )
274
+ if err != nil {
275
+ setupLog .Error (err , "Failed to setup pprof handlers" )
276
+ return err
277
+ }
270
278
}
271
279
272
280
err = r .parseConfiguration (ctx )
Original file line number Diff line number Diff line change 35
35
- " 9003"
36
36
- -metricsPort
37
37
- " 9090"
38
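+ # Go's flag package only accepts the "-flag=value" form for boolean flags; the space-separated "-flag value" form works for non-boolean flags only. See https://pkg.go.dev/flag#hdr-Command_line_flag_syntax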
39
+ - " -enablePprof={{ .Values.inferenceExtension.enablePprof }}"
38
40
{{- if eq (.Values.inferencePool.modelServerType | default "vllm") "triton-tensorrt-llm" }}
39
41
- -totalQueuedRequestsMetric
40
42
- " nv_trt_llm_request_metrics{request_type=waiting}"
Original file line number Diff line number Diff line change @@ -7,6 +7,7 @@ inferenceExtension:
7
7
pullPolicy : Always
8
8
extProcPort : 9002
9
9
env : {}
10
+ enablePprof : true # Enable pprof handlers for profiling and debugging
10
11
# Example environment variables:
11
12
# env:
12
13
# KV_CACHE_SCORE_WEIGHT: "1"
Original file line number Diff line number Diff line change @@ -72,6 +72,7 @@ const (
72
72
DefaultRefreshPrometheusMetricsInterval = 5 * time .Second // default for --refreshPrometheusMetricsInterval
73
73
DefaultSecureServing = true // default for --secureServing
74
74
DefaultHealthChecking = false // default for --healthChecking
75
+ DefaultEnablePprof = true // default for --enablePprof
75
76
DefaultTotalQueuedRequestsMetric = "vllm:num_requests_waiting" // default for --totalQueuedRequestsMetric
76
77
DefaultKvCacheUsagePercentageMetric = "vllm:gpu_cache_usage_perc" // default for --kvCacheUsagePercentageMetric
77
78
DefaultLoraInfoMetric = "vllm:lora_requests_info" // default for --loraInfoMetric
You can’t perform that action at this time.
0 commit comments