@@ -24,55 +24,105 @@ class TritonServerConfig:
2424 """
2525
2626 server_arg_keys = [  # Server argument keys, grouped by category in the sections below
27+ # Server
28+ "id" ,
29+ "exit-timeout-secs" ,
2730 # Logging
2831 "log-verbose" ,
2932 "log-info" ,
3033 "log-warning" ,
3134 "log-error" ,
32- "id" ,
35+ "log-format" ,
36+ "log-file" ,
3337 # Model Repository
3438 "model-store" ,
3539 "model-repository" ,
36- # Exit
37- "exit-timeout-secs" ,
3840 "exit-on-error" ,
39- # Strictness
40- "strict-model-config" ,
41+ "disable-auto-complete-config" ,
4142 "strict-readiness" ,
42- # API Servers
43+ "model-control-mode" ,
44+ "repository-poll-secs" ,
45+ "load-model" ,
46+ "model-load-thread-count" ,
47+ "model-load-retry-count" ,
48+ "model-namespacing" ,
49+ # HTTP
4350 "allow-http" ,
51+ "http-address" ,
4452 "http-port" ,
53+ "reuse-http-port" ,
54+ "http-header-forward-pattern" ,
4555 "http-thread-count" ,
56+ "http-restricted-api" ,
57+ # gRPC
4658 "allow-grpc" ,
59+ "grpc-address" ,
4760 "grpc-port" ,
61+ "reuse-grpc-port" ,
62+ "grpc-header-forward-pattern" ,
4863 "grpc-infer-allocation-pool-size" ,
4964 "grpc-use-ssl" ,
5065 "grpc-use-ssl-mutual" ,
5166 "grpc-server-cert" ,
5267 "grpc-server-key" ,
5368 "grpc-root-cert" ,
69+ "grpc-infer-response-compression-level" ,
70+ "grpc-keepalive-time" ,
71+ "grpc-keepalive-timeout" ,
72+ "grpc-keepalive-permit-without-calls" ,
73+ "grpc-http2-max-pings-without-data" ,
74+ "grpc-http2-min-recv-ping-interval-without-data" ,
75+ "grpc-http2-max-ping-strikes" ,
76+ "grpc-max-connection-age" ,
77+ "grpc-max-connection-age-grace" ,
78+ "grpc-restricted-protocol" ,
79+ # SageMaker
80+ "allow-sagemaker" ,
81+ "sagemaker-port" ,
82+ "sagemaker-safe-port-range" ,
83+ "sagemaker-thread-count" ,
84+ # Vertex AI
85+ "allow-vertex-ai" ,
86+ "vertex-ai-port" ,
87+ "vertex-ai-thread-count" ,
88+ "vertex-ai-default-model" ,
89+ # Metrics
5490 "allow-metrics" ,
5591 "allow-gpu-metrics" ,
56- "metrics-interval-ms" ,
92+ "allow-cpu-metrics" ,
93+ "metrics-address" ,
5794 "metrics-port" ,
95+ "metrics-interval-ms" ,
96+ "metrics-config" ,
5897 # Tracing
59- "trace-file" ,
60- "trace-level" ,
61- "trace-rate" ,
62- # Model control
63- "model-control-mode" ,
64- "repository-poll-secs" ,
65- "load-model" ,
66- # Memory and GPU
98+ "trace-config" ,
99+ # Backend
100+ "backend-directory" ,
101+ "backend-config" ,
102+ # Repository Agent
103+ "repoagent-directory" ,
104+ # Response Cache
105+ "cache-config" ,
106+ "cache-directory" ,
107+ # Rate Limiter
108+ "rate-limit" ,
109+ "rate-limit-resource" ,
110+ # Memory/Device Management
67111 "pinned-memory-pool-byte-size" ,
68112 "cuda-memory-pool-byte-size" ,
113+ "cuda-virtual-address-size" ,
69114 "min-supported-compute-capability" ,
70- # Backend config
71- "backend-directory" ,
72- "backend-config" ,
73- "allow-soft-placement" ,
74- "gpu-memory-fraction" ,
75- "tensorflow-version" ,
115+ "buffer-management-thread-count" ,
116+ "host-policy" ,
117+ "model-load-gpu-limit" ,
118+ # DEPRECATED -- still listed as keys. NOTE(review): presumably superseded by "disable-auto-complete-config", "cache-config" and "trace-config" above; confirm against the server docs
119+ "strict-model-config" ,
120+ "response-cache-byte-size" ,
121+ "trace-file" ,
122+ "trace-level" ,
123+ "trace-rate" ,
124+ "trace-count" ,
125+ "trace-log-frequency" ,
76126 ]
77127
78128 def __init__ (self ):
0 commit comments