You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: src/together/resources/endpoints.py
+24 -4 Lines changed: 24 additions & 4 deletions
Original file line number
Diff line number
Diff line change
@@ -59,6 +59,7 @@ def create(
59
59
disable_prompt_cache: bool=False,
60
60
disable_speculative_decoding: bool=False,
61
61
state: Literal["STARTED", "STOPPED"] ="STARTED",
62
+
inactive_timeout: Optional[int] =None,
62
63
) ->DedicatedEndpoint:
63
64
"""
64
65
Create a new dedicated endpoint.
@@ -72,6 +73,7 @@ def create(
72
73
disable_prompt_cache (bool, optional): Whether to disable the prompt cache. Defaults to False.
73
74
disable_speculative_decoding (bool, optional): Whether to disable speculative decoding. Defaults to False.
74
75
state (str, optional): The desired state of the endpoint. Defaults to "STARTED".
76
+
inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
75
77
76
78
Returns:
77
79
DedicatedEndpoint: Object containing endpoint information
max_replicas (int, optional): The maximum number of replicas to scale up to
172
178
state (str, optional): The desired state of the endpoint ("STARTED" or "STOPPED")
173
179
display_name (str, optional): A human-readable name for the endpoint
180
+
inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
174
181
175
182
Returns:
176
183
DedicatedEndpoint: Object containing endpoint information
disable_prompt_cache (bool, optional): Whether to disable the prompt cache. Defaults to False.
311
322
disable_speculative_decoding (bool, optional): Whether to disable speculative decoding. Defaults to False.
312
323
state (str, optional): The desired state of the endpoint. Defaults to "STARTED".
324
+
inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
313
325
314
326
Returns:
315
327
DedicatedEndpoint: Object containing endpoint information
max_replicas (int, optional): The maximum number of replicas to scale up to
410
426
state (str, optional): The desired state of the endpoint ("STARTED" or "STOPPED")
411
427
display_name (str, optional): A human-readable name for the endpoint
428
+
inactive_timeout (int, optional): The number of minutes of inactivity after which the endpoint will be automatically stopped. Set to 0 to disable automatic timeout.
412
429
413
430
Returns:
414
431
DedicatedEndpoint: Object containing endpoint information
0 commit comments