Skip to content

Commit 60813c1

Browse files
authored
Updating Triton Server Arg Keys (#829)
* Updating server config keys
* Fixing typos
1 parent 6f58032 commit 60813c1

File tree

1 file changed

+71
-21
lines changed

1 file changed

+71
-21
lines changed

model_analyzer/triton/server/server_config.py

Lines changed: 71 additions & 21 deletions
Original file line number | Diff line number | Diff line change
@@ -24,55 +24,105 @@ class TritonServerConfig:
2424
"""
2525

2626
server_arg_keys = [
27+
# Server
28+
"id",
29+
"exit-timeout-secs",
2730
# Logging
2831
"log-verbose",
2932
"log-info",
3033
"log-warning",
3134
"log-error",
32-
"id",
35+
"log-format",
36+
"log-file",
3337
# Model Repository
3438
"model-store",
3539
"model-repository",
36-
# Exit
37-
"exit-timeout-secs",
3840
"exit-on-error",
39-
# Strictness
40-
"strict-model-config",
41+
"disable-auto-complete-config",
4142
"strict-readiness",
42-
# API Servers
43+
"model-control-mode",
44+
"repository-poll-secs",
45+
"load-model",
46+
"model-load-thread-count",
47+
"model-load-retry-count",
48+
"model-namespacing",
49+
# HTTP
4350
"allow-http",
51+
"http-address",
4452
"http-port",
53+
"reuse-http-port",
54+
"http-header-forward-pattern",
4555
"http-thread-count",
56+
"http-restricted-api",
57+
# GRPC
4658
"allow-grpc",
59+
"grpc-address",
4760
"grpc-port",
61+
"reuse-grpc-port",
62+
"grpc-header-forward-pattern",
4863
"grpc-infer-allocation-pool-size",
4964
"grpc-use-ssl",
5065
"grpc-use-ssl-mutual",
5166
"grpc-server-cert",
5267
"grpc-server-key",
5368
"grpc-root-cert",
69+
"grpc-infer-response-compression-level",
70+
"grpc-keepalive-time",
71+
"grpc-keepalive-timeout",
72+
"grpc-keepalive-permit-without-calls",
73+
"grpc-http2-max-pings-without-data",
74+
"grpc-http2-min-recv-ping-interval-without-data",
75+
"grpc-http2-max-ping-strikes",
76+
"grpc-max-connection-age",
77+
"grpc-max-connection-age-grace",
78+
"grpc-restricted-protocol",
79+
# Sagemaker
80+
"allow-sagemaker",
81+
"sagemaker-port",
82+
"sagemaker-safe-port-range",
83+
"sagemaker-thread-count",
84+
# Vertex
85+
"allow-vertex-ai",
86+
"vertex-ai-port",
87+
"vertex-ai-thread-count",
88+
"vertex-ai-default-model",
89+
# Metrics
5490
"allow-metrics",
5591
"allow-gpu-metrics",
56-
"metrics-interval-ms",
92+
"allow-cpu-metrics",
93+
"metrics-address",
5794
"metrics-port",
95+
"metrics-interval-ms",
96+
"metrics-config",
5897
# Tracing
59-
"trace-file",
60-
"trace-level",
61-
"trace-rate",
62-
# Model control
63-
"model-control-mode",
64-
"repository-poll-secs",
65-
"load-model",
66-
# Memory and GPU
98+
"trace-config",
99+
# Backend
100+
"backend-directory",
101+
"backend-config",
102+
# Repository Agent
103+
"repoagent-directory",
104+
# Response Cache
105+
"cache-config",
106+
"cache-directory",
107+
# Rate Limiter
108+
"rate-limit",
109+
"rate-limit-resource",
110+
# Memory/Device Management
67111
"pinned-memory-pool-byte-size",
68112
"cuda-memory-pool-byte-size",
113+
"cuda-virtual-address-size",
69114
"min-supported-compute-capability",
70-
# Backend config
71-
"backend-directory",
72-
"backend-config",
73-
"allow-soft-placement",
74-
"gpu-memory-fraction",
75-
"tensorflow-version",
115+
"buffer-management-thread-count",
116+
"host-policy",
117+
"model-load-gpu-limit",
118+
# DEPRECATED
119+
"strict-model-config",
120+
"response-cache-byte-size",
121+
"trace-file",
122+
"trace-level",
123+
"trace-rate",
124+
"trace-count",
125+
"trace-log-frequency",
76126
]
77127

78128
def __init__(self):

0 commit comments

Comments
 (0)