File tree: 1 file changed, +3 -3 lines changed
src/sagemaker/serve/builder: 1 file changed, +3 -3 lines changed
Columns: original file line number | diff line number | diff line change
@@ -1293,6 +1293,9 @@ def _model_builder_optimize_wrapper(
1293
1293
max_runtime_in_sec = max_runtime_in_sec ,
1294
1294
)
1295
1295
1296
+ if sharding_config :
1297
+ self .pysdk_model ._is_sharded_model = True
1298
+
1296
1299
if input_args :
1297
1300
self .sagemaker_session .sagemaker_client .create_optimization_job (** input_args )
1298
1301
job_status = self .sagemaker_session .wait_for_optimization_job (job_name )
@@ -1302,9 +1305,6 @@ def _model_builder_optimize_wrapper(
1302
1305
if not speculative_decoding_config :
1303
1306
self .pysdk_model .remove_tag_with_key (Tag .SPECULATIVE_DRAFT_MODEL_PROVIDER )
1304
1307
1305
- if sharding_config :
1306
- self .pysdk_model ._is_sharded_model = True
1307
-
1308
1308
return self .pysdk_model
1309
1309
1310
1310
def _optimize_for_hf (
You can’t perform that action at this time.
0 commit comments