Skip to content

Commit 2943dcd

Browse files
authored
Merge branch 'master' into master-update-apache-airflow
2 parents 1278b9b + 305bdf8 commit 2943dcd

File tree

25 files changed

+1110
-588
lines changed

25 files changed

+1110
-588
lines changed

CHANGELOG.md

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,30 @@
11
# Changelog
22

3+
## v2.243.0 (2025-03-27)
4+
5+
### Features
6+
7+
* Enabled update_endpoint through model_builder
8+
9+
### Bug Fixes and Other Changes
10+
11+
* Update for PT 2.5.1, SMP 2.8.0
12+
* chore: move jumpstart region definitions to json file
13+
* fix flaky clarify model monitor test
14+
* fix flaky spark processor integ
15+
* use temp file in unit tests
16+
* Update transformers version
17+
* Aligned disable_output_compression for @remote with Estimator
18+
* Update Jinja version
19+
* update image_uri_configs 03-26-2025 07:18:16 PST
20+
* chore: fix integ tests to use latest version of model
21+
* update image_uri_configs 03-25-2025 07:18:13 PST
22+
* Skip tests that failed due to a deprecated instance type
23+
* update image_uri_configs 03-21-2025 07:17:55 PST
24+
* factor in set instance type when building JumpStart models in ModelBuilder.
25+
* Add documentation to Read the Docs for upgrading torch versions
26+
* add new regions to JUMPSTART_LAUNCHED_REGIONS
27+
328
## v2.242.0 (2025-03-14)
429

530
### Features

VERSION

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
2.242.1.dev0
1+
2.243.1.dev0

doc/requirements.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ sphinx==5.1.1
22
sphinx-rtd-theme==0.5.0
33
docutils==0.15.2
44
packaging==20.9
5-
jinja2==3.1.4
5+
jinja2==3.1.6
66
schema==0.7.5
77
accelerate>=0.24.1,<=0.27.0
88
graphene<4.0

requirements/extras/test_requirements.txt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,7 @@ attrs>=23.1.0,<24
2020
fabric==2.6.0
2121
requests==2.32.2
2222
sagemaker-experiments==0.1.35
23-
Jinja2==3.1.4
23+
Jinja2==3.1.6
2424
pyvis==0.2.1
2525
pandas==1.4.4
2626
scikit-learn==1.3.0
@@ -33,7 +33,7 @@ pillow>=10.0.1,<=11
3333
opentelemetry-proto==1.27.0
3434
protobuf==4.25.5
3535
tensorboard>=2.9.0,<=2.15.2
36-
transformers==4.46.1
36+
transformers==4.48.0
3737
sentencepiece==0.1.99
3838
# https://github.com/triton-inference-server/server/issues/6246
3939
tritonclient[http]<2.37.0

src/sagemaker/fw_utils.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -155,6 +155,7 @@
155155
"2.3.0",
156156
"2.3.1",
157157
"2.4.1",
158+
"2.5.1",
158159
]
159160

160161
TRAINIUM_SUPPORTED_DISTRIBUTION_STRATEGIES = ["torch_distributed"]

src/sagemaker/image_uri_config/huggingface-llm-neuronx.json

Lines changed: 213 additions & 33 deletions
Large diffs are not rendered by default.

src/sagemaker/image_uri_config/huggingface-llm.json

Lines changed: 210 additions & 119 deletions
Large diffs are not rendered by default.

src/sagemaker/image_uri_config/pytorch-smp.json

Lines changed: 27 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,8 @@
99
"2.2": "2.3.1",
1010
"2.2.0": "2.3.1",
1111
"2.3.1": "2.5.0",
12-
"2.4.1": "2.7.0"
12+
"2.4.1": "2.7.0",
13+
"2.5.1": "2.8.0"
1314
},
1415
"versions": {
1516
"2.0.1": {
@@ -186,6 +187,31 @@
186187
"us-west-2": "658645717510"
187188
},
188189
"repository": "smdistributed-modelparallel"
190+
},
191+
"2.8.0": {
192+
"py_versions": [
193+
"py311"
194+
],
195+
"registries": {
196+
"ap-northeast-1": "658645717510",
197+
"ap-northeast-2": "658645717510",
198+
"ap-northeast-3": "658645717510",
199+
"ap-south-1": "658645717510",
200+
"ap-southeast-1": "658645717510",
201+
"ap-southeast-2": "658645717510",
202+
"ca-central-1": "658645717510",
203+
"eu-central-1": "658645717510",
204+
"eu-north-1": "658645717510",
205+
"eu-west-1": "658645717510",
206+
"eu-west-2": "658645717510",
207+
"eu-west-3": "658645717510",
208+
"sa-east-1": "658645717510",
209+
"us-east-1": "658645717510",
210+
"us-east-2": "658645717510",
211+
"us-west-1": "658645717510",
212+
"us-west-2": "658645717510"
213+
},
214+
"repository": "smdistributed-modelparallel"
189215
}
190216
}
191217
}

src/sagemaker/image_uri_config/sagemaker-base-python.json

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@
1212
"ap-southeast-2": "452832661640",
1313
"ap-southeast-3": "276181064229",
1414
"ap-southeast-5": "148761635175",
15+
"ap-southeast-7": "528757812139",
1516
"ca-central-1": "310906938811",
1617
"cn-north-1": "390048526115",
1718
"cn-northwest-1": "390780980154",
@@ -26,6 +27,7 @@
2627
"il-central-1": "380164790875",
2728
"me-central-1": "103105715889",
2829
"me-south-1": "117516905037",
30+
"mx-central-1": "396913743851",
2931
"sa-east-1": "782484402741",
3032
"us-east-1": "081325390199",
3133
"us-east-2": "429704687514",

src/sagemaker/image_uris.py

Lines changed: 10 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -701,12 +701,16 @@ def get_training_image_uri(
701701
if "modelparallel" in distribution["smdistributed"]:
702702
if distribution["smdistributed"]["modelparallel"].get("enabled", True):
703703
framework = "pytorch-smp"
704-
if (
705-
"p5" in instance_type
706-
or "2.1" in framework_version
707-
or "2.2" in framework_version
708-
or "2.3" in framework_version
709-
or "2.4" in framework_version
704+
supported_smp_pt_versions_cu124 = ("2.5",)
705+
supported_smp_pt_versions_cu121 = ("2.1", "2.2", "2.3", "2.4")
706+
if any(
707+
pt_version in framework_version
708+
for pt_version in supported_smp_pt_versions_cu124
709+
):
710+
container_version = "cu124"
711+
elif "p5" in instance_type or any(
712+
pt_version in framework_version
713+
for pt_version in supported_smp_pt_versions_cu121
710714
):
711715
container_version = "cu121"
712716
else:

0 commit comments

Comments
 (0)