Skip to content

Commit ddc3dee

Browse files
committed
Increase load_model retry wait from 30 to 60 seconds
1 parent d46ae13 commit ddc3dee

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

inference/utils/inference_api_client.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -188,7 +188,7 @@ def wait_for_model_loading(self, model_identifier: str, max_attempts: int = 10,
188 188   return False
189 189   return False # Timed out without reaching LOADED state
190 190
191     - @retry(stop=stop_after_attempt(5), wait=wait_fixed(30), retry=retry_if_result(lambda x: not x))
    191 + @retry(stop=stop_after_attempt(5), wait=wait_fixed(60), retry=retry_if_result(lambda x: not x))
192 192   def load_model(self, model_identifier: str) -> bool:
193 193   """
194 194   Load a specific model, first unloading all models, and wait for loading to complete.

0 commit comments

Comments
 (0)