File tree Expand file tree Collapse file tree 5 files changed +54
-2
lines changed Expand file tree Collapse file tree 5 files changed +54
-2
lines changed Original file line number Diff line number Diff line change 1
1
# Changelog
2
2
3
+ ## v2.229.0 (2024-08-15)
4
+
5
+ ### Features
6
+
7
+ * Support for ModelBuilder In_Process Mode (1/2)
8
+ * Pulling in dependencies (in_process mode) using conda environment
9
+ * Add optional CodeArtifact login to FrameworkProcessing job script
10
+ * implemented security-monitoring to send metrics to CW #1510
11
+
12
+ ### Bug Fixes and Other Changes
13
+
14
+ * alt configs model deployment and training issues
15
+ * fix keras extension in integ test
16
+ * update image_uri_configs 08-13-2024 07:17:54 PST
17
+ * trn1 instance family does not support volume size
18
+ * Update model.py
19
+ * removed log statement
20
+ * update image_uri_configs 08-09-2024 07:18:00 PST
21
+ * Added torchrun compatibility for distributed training across multiple GPUs in a single node (single instance)
22
+ * BiasConfig type hint
23
+ * add model monitor image accounts for ap-southeast-5 and eu-central-2
24
+ * aligned UTC times with PST
25
+ * ensure hpt jobs inherit tags from config
26
+ * add JumpStart PDT and OSU regions
27
+ * chore(deps): bump certifi in /src/sagemaker/serve/utils
28
+ * Updates for DJL 0.29.0 release
29
+ * chore(deps): bump apache-airflow from 2.9.2 to 2.9.3 in /requirements/extras
30
+ * chore(deps): bump torch from 2.0.1 to 2.2.0 in /tests/data/serve_resources/mlflow/pytorch
31
+ * avoided printing stack trace and escaped input
32
+ * removing kwargs as this is breaking predictor_cls param for mode…
33
+
3
34
## v2.228.0 (2024-08-06)
4
35
5
36
### Features
Original file line number Diff line number Diff line change 1
- 2.228.1.dev0
1
+ 2.229.1.dev0
Original file line number Diff line number Diff line change @@ -198,7 +198,7 @@ def main(args):
198
198
199
199
if args .current_host == args .hosts [0 ]:
200
200
ckpt_manager .save ()
201
- net .save ("/opt/ml/model/1.keras " )
201
+ net .save ("/opt/ml/model/1" )
202
202
203
203
204
204
if __name__ == "__main__" :
Original file line number Diff line number Diff line change @@ -85,6 +85,11 @@ def test_mnist_with_checkpoint_config(
85
85
tensorflow_training_latest_version ,
86
86
tensorflow_training_latest_py_version ,
87
87
):
88
+ if Version (tensorflow_training_latest_version ) >= Version ("2.16" ):
89
+ pytest .skip (
90
+ "This test is failing in TensorFlow 2.16 beacuse of an upstream bug: "
91
+ "https://github.com/tensorflow/io/issues/2039"
92
+ )
88
93
checkpoint_s3_uri = "s3://{}/checkpoints/tf-{}" .format (
89
94
sagemaker_session .default_bucket (), sagemaker_timestamp ()
90
95
)
@@ -235,6 +240,11 @@ def test_mnist_distributed_cpu(
235
240
tensorflow_training_latest_version ,
236
241
tensorflow_training_latest_py_version ,
237
242
):
243
+ if Version (tensorflow_training_latest_version ) >= Version ("2.16" ):
244
+ pytest .skip (
245
+ "This test is failing in TensorFlow 2.16 beacuse of an upstream bug: "
246
+ "https://github.com/tensorflow/io/issues/2039"
247
+ )
238
248
_create_and_fit_estimator (
239
249
sagemaker_session ,
240
250
tensorflow_training_latest_version ,
Original file line number Diff line number Diff line change 19
19
import numpy as np
20
20
import pytest
21
21
from botocore .exceptions import ClientError
22
+ from packaging .version import Version
22
23
23
24
import tests .integ
24
25
from sagemaker import KMeans , LDA , RandomCutForest , image_uris
@@ -691,6 +692,11 @@ def test_tuning_tf(
691
692
tensorflow_training_latest_version ,
692
693
tensorflow_training_latest_py_version ,
693
694
):
695
+ if Version (tensorflow_training_latest_version ) >= Version ("2.16" ):
696
+ pytest .skip (
697
+ "This test is failing in TensorFlow 2.16 beacuse of an upstream bug: "
698
+ "https://github.com/tensorflow/io/issues/2039"
699
+ )
694
700
resource_path = os .path .join (DATA_DIR , "tensorflow_mnist" )
695
701
script_path = "mnist.py"
696
702
@@ -735,6 +741,11 @@ def test_tuning_tf_vpc_multi(
735
741
tensorflow_training_latest_py_version ,
736
742
):
737
743
"""Test Tensorflow multi-instance using the same VpcConfig for training and inference"""
744
+ if Version (tensorflow_training_latest_version ) >= Version ("2.16" ):
745
+ pytest .skip (
746
+ "This test is failing in TensorFlow 2.16 beacuse of an upstream bug: "
747
+ "https://github.com/tensorflow/io/issues/2039"
748
+ )
738
749
instance_type = cpu_instance_type
739
750
instance_count = 2
740
751
You can’t perform that action at this time.
0 commit comments