Skip to content

Commit 895f099

Browse files
authored
Merge branch 'master' into feature/modelcard-property
2 parents 118f4d9 + 3497670 commit 895f099

File tree

12 files changed

+89
-3
lines changed

12 files changed

+89
-3
lines changed

CHANGELOG.md

Lines changed: 29 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,34 @@
11
# Changelog
22

3+
## v2.222.1 (2024-06-12)
4+
5+
### Bug Fixes and Other Changes
6+
7+
* First changes
8+
* estimator.deploy not respecting instance type
9+
10+
## v2.222.0 (2024-06-07)
11+
12+
### Features
13+
14+
* jumpstart telemetry
15+
16+
### Bug Fixes and Other Changes
17+
18+
* update image_uri_configs 06-06-2024 07:17:31 PST
19+
* bump requests from 2.31.0 to 2.32.2 in /requirements/extras
20+
* chore: add HF LLM neuronx 0.0.23 image
21+
* Updates for DJL 0.28.0 release
22+
* chore(deps): bump mlflow from 2.11.1 to 2.12.1 in /tests/data/serve_resources/mlflow/tensorflow
23+
* chore(deps): bump mlflow from 2.11.1 to 2.12.1 in /tests/data/serve_resources/mlflow/xgboost
24+
* chore(deps): bump mlflow from 2.10.2 to 2.12.1 in /tests/data/serve_resources/mlflow/pytorch
25+
* chore(deps): bump apache-airflow from 2.9.0 to 2.9.1 in /requirements/extras
26+
* chore(deps): bump requests from 2.31.0 to 2.32.2 in /tests/data/serve_resources/mlflow/pytorch
27+
* Fix ci unit-tests
28+
* Making project name in workflow files dynamic
29+
* update image_uri_configs 05-29-2024 07:17:35 PST
30+
* Update: SM Endpoint Routing Strategy Support.
31+
332
## v2.221.1 (2024-05-22)
433

534
### Bug Fixes and Other Changes

VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
2.221.2.dev0
1+
2.222.2.dev0

src/sagemaker/image_uri_config/pytorch.json

Lines changed: 43 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -82,7 +82,8 @@
8282
"1.13": "1.13.1",
8383
"2.0": "2.0.1",
8484
"2.1": "2.1.0",
85-
"2.2": "2.2.0"
85+
"2.2": "2.2.0",
86+
"2.3": "2.3.0"
8687
},
8788
"versions": {
8889
"0.4.0": {
@@ -1054,6 +1055,47 @@
10541055
"us-west-2": "763104351884"
10551056
},
10561057
"repository": "pytorch-inference"
1058+
},
1059+
"2.3.0": {
1060+
"py_versions": [
1061+
"py311"
1062+
],
1063+
"registries": {
1064+
"af-south-1": "626614931356",
1065+
"ap-east-1": "871362719292",
1066+
"ap-northeast-1": "763104351884",
1067+
"ap-northeast-2": "763104351884",
1068+
"ap-northeast-3": "364406365360",
1069+
"ap-south-1": "763104351884",
1070+
"ap-south-2": "772153158452",
1071+
"ap-southeast-1": "763104351884",
1072+
"ap-southeast-2": "763104351884",
1073+
"ap-southeast-3": "907027046896",
1074+
"ap-southeast-4": "457447274322",
1075+
"ca-central-1": "763104351884",
1076+
"ca-west-1": "204538143572",
1077+
"cn-north-1": "727897471807",
1078+
"cn-northwest-1": "727897471807",
1079+
"eu-central-1": "763104351884",
1080+
"eu-central-2": "380420809688",
1081+
"eu-north-1": "763104351884",
1082+
"eu-south-1": "692866216735",
1083+
"eu-south-2": "503227376785",
1084+
"eu-west-1": "763104351884",
1085+
"eu-west-2": "763104351884",
1086+
"eu-west-3": "763104351884",
1087+
"il-central-1": "780543022126",
1088+
"me-central-1": "914824155844",
1089+
"me-south-1": "217643126080",
1090+
"sa-east-1": "763104351884",
1091+
"us-east-1": "763104351884",
1092+
"us-east-2": "763104351884",
1093+
"us-gov-east-1": "446045086412",
1094+
"us-gov-west-1": "442386744353",
1095+
"us-west-1": "763104351884",
1096+
"us-west-2": "763104351884"
1097+
},
1098+
"repository": "pytorch-inference"
10571099
}
10581100
}
10591101
},

src/sagemaker/jumpstart/factory/estimator.py

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -322,7 +322,12 @@ def get_deploy_kwargs(
322322
model_id=model_id,
323323
model_from_estimator=True,
324324
model_version=model_version,
325-
instance_type=model_deploy_kwargs.instance_type if training_instance_type is None else None,
325+
instance_type=(
326+
model_deploy_kwargs.instance_type
327+
if training_instance_type is None
328+
or instance_type is not None # always use supplied inference instance type
329+
else None
330+
),
326331
region=region,
327332
image_uri=image_uri,
328333
source_dir=source_dir,

src/sagemaker/serve/builder/djl_builder.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -265,6 +265,7 @@ def _djl_model_builder_deploy_wrapper(self, *args, **kwargs) -> Type[PredictorBa
265265
# if the model has not been built for a local container, we must use a cache
266266
# that hosting has write access to.
267267
self.pysdk_model.env["TRANSFORMERS_CACHE"] = "/tmp"
268+
self.pysdk_model.env["HF_HOME"] = "/tmp"
268269
self.pysdk_model.env["HUGGINGFACE_HUB_CACHE"] = "/tmp"
269270

270271
if "endpoint_logging" not in kwargs:

src/sagemaker/serve/builder/tei_builder.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -175,6 +175,7 @@ def _tei_model_builder_deploy_wrapper(self, *args, **kwargs) -> Type[PredictorBa
175175
# if the model has not been built for a local container, we must use a cache
176176
# that hosting has write access to.
177177
self.pysdk_model.env["TRANSFORMERS_CACHE"] = "/tmp"
178+
self.pysdk_model.env["HF_HOME"] = "/tmp"
178179
self.pysdk_model.env["HUGGINGFACE_HUB_CACHE"] = "/tmp"
179180

180181
if "endpoint_logging" not in kwargs:

src/sagemaker/serve/builder/tgi_builder.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -214,6 +214,7 @@ def _tgi_model_builder_deploy_wrapper(self, *args, **kwargs) -> Type[PredictorBa
214214
# if the model has not been built for a local container, we must use a cache
215215
# that hosting has write access to.
216216
self.pysdk_model.env["TRANSFORMERS_CACHE"] = "/tmp"
217+
self.pysdk_model.env["HF_HOME"] = "/tmp"
217218
self.pysdk_model.env["HUGGINGFACE_HUB_CACHE"] = "/tmp"
218219

219220
if "endpoint_logging" not in kwargs:

src/sagemaker/serve/model_server/djl_serving/server.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@
1919
_DEFAULT_ENV_VARS = {
2020
"SERVING_OPTS": "-Dai.djl.logging.level=debug",
2121
"TRANSFORMERS_CACHE": "/opt/ml/model/",
22+
"HF_HOME": "/opt/ml/model/",
2223
"HUGGINGFACE_HUB_CACHE": "/opt/ml/model/",
2324
}
2425

src/sagemaker/serve/model_server/tei/server.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,6 +18,7 @@
1818
_SHM_SIZE = "2G"
1919
_DEFAULT_ENV_VARS = {
2020
"TRANSFORMERS_CACHE": "/opt/ml/model/",
21+
"HF_HOME": "/opt/ml/model/",
2122
"HUGGINGFACE_HUB_CACHE": "/opt/ml/model/",
2223
}
2324

src/sagemaker/serve/model_server/tgi/server.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,7 @@
1717
_SHM_SIZE = "2G"
1818
_DEFAULT_ENV_VARS = {
1919
"TRANSFORMERS_CACHE": "/opt/ml/model/",
20+
"HF_HOME": "/opt/ml/model/",
2021
"HUGGINGFACE_HUB_CACHE": "/opt/ml/model/",
2122
}
2223

0 commit comments

Comments
 (0)