Skip to content

Commit 3ac9e36

Browse files
Yadan-Wei and Yadan Wei authored
Onboard PT TR to autopatch (#5071)
* build PT25 TR EC2
* build PT2.5 TR SM
* update protobuf version
* build PT2.6 TR EC2
* build PT26 TR SM
* build PT27 TR EC2
* build PT27 TR SM
* build PT26 TR EC2
* build PT25 TR SM
* retry build PT25 TR SM
* remove sagemaker training version pin
* build PT26 TR SM
* revert toml

---------

Co-authored-by: Yadan Wei <[email protected]>
1 parent aaec0c0 commit 3ac9e36

17 files changed

+76 -22 lines changed

miscellaneous_scripts/dockerfile_patch_script.sh

Lines changed: 0 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -47,13 +47,6 @@ elif [[ $LATEST_RELEASED_IMAGE_URI =~ ^763104351884\.dkr\.ecr\.us-west-2\.amazon
4747
curl -o /license.txt https://aws-dlc-licenses.s3.amazonaws.com/pytorch-2.7/license.txt
4848
fi
4949

50-
# Upgrade sagemaker-training
51-
if [[ $LATEST_RELEASED_IMAGE_URI =~ ^763104351884\.dkr\.ecr\.us-west-2\.amazonaws\.com/pytorch-training:2\.[4-6](.+)sagemaker ]]; then
52-
pip install -U "sagemaker-training>4.7.4" "protobuf>=4.25.8,<6"
53-
elif [[ $LATEST_RELEASED_IMAGE_URI =~ ^763104351884\.dkr\.ecr\.us-west-2\.amazonaws\.com/pytorch-training:2\.7(.+)sagemaker ]]; then
54-
pip install -U "sagemaker-training>4.7.4,<5" "sagemaker-pytorch-training>=2.9.0"
55-
fi
56-
5750
# For PT inference gpu sagemaker images, replace start_cuda_compat.sh
5851
if [[ $LATEST_RELEASED_IMAGE_URI =~ ^763104351884\.dkr\.ecr\.us-west-2\.amazonaws\.com/pytorch-inference:2\.[4-6]\.[0-9]+-gpu(.+)sagemaker ]]; then
5952
mv /tmp/new_pytorch_inference_start_cuda_compat /usr/local/bin/start_cuda_compat.sh

pytorch/training/buildspec-2-5-ec2.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ framework: &FRAMEWORK pytorch
55
version: &VERSION 2.5.1
66
short_version: &SHORT_VERSION "2.5"
77
arch_type: x86
8-
# autopatch_build: "True"
8+
autopatch_build: "True"
99

1010
repository_info:
1111
training_repository: &TRAINING_REPOSITORY

pytorch/training/buildspec-2-5-sm.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ framework: &FRAMEWORK pytorch
55
version: &VERSION 2.5.1
66
short_version: &SHORT_VERSION "2.5"
77
arch_type: x86
8-
# autopatch_build: "True"
8+
autopatch_build: "True"
99

1010
repository_info:
1111
training_repository: &TRAINING_REPOSITORY

pytorch/training/buildspec-2-6-ec2.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ framework: &FRAMEWORK pytorch
55
version: &VERSION 2.6.0
66
short_version: &SHORT_VERSION "2.6"
77
arch_type: x86
8-
# autopatch_build: "True"
8+
autopatch_build: "True"
99

1010
repository_info:
1111
training_repository: &TRAINING_REPOSITORY

pytorch/training/buildspec-2-6-sm.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ framework: &FRAMEWORK pytorch
55
version: &VERSION 2.6.0
66
short_version: &SHORT_VERSION "2.6"
77
arch_type: x86
8-
# autopatch_build: "True"
8+
autopatch_build: "True"
99

1010
repository_info:
1111
training_repository: &TRAINING_REPOSITORY

pytorch/training/buildspec-2-7-ec2.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ framework: &FRAMEWORK pytorch
55
version: &VERSION 2.7.1
66
short_version: &SHORT_VERSION "2.7"
77
arch_type: x86
8-
# autopatch_build: "True"
8+
autopatch_build: "True"
99

1010
repository_info:
1111
training_repository: &TRAINING_REPOSITORY

pytorch/training/buildspec-2-7-sm.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@ framework: &FRAMEWORK pytorch
55
version: &VERSION 2.7.1
66
short_version: &SHORT_VERSION "2.7"
77
arch_type: x86
8-
# autopatch_build: "True"
8+
autopatch_build: "True"
99

1010
repository_info:
1111
training_repository: &TRAINING_REPOSITORY

pytorch/training/docker/2.5/py3/Dockerfile.ec2.cpu.core_packages.json

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -37,10 +37,10 @@
3737
"version_specifier": ">=4.66.3"
3838
},
3939
"requests": {
40-
"version_specifier": ">=2.32.0"
40+
"version_specifier": ">=2.32.4"
4141
},
4242
"setuptools": {
43-
"version_specifier": ">=70.0.0"
43+
"version_specifier": ">=80.9.0"
4444
},
4545
"urllib3": {
4646
"version_specifier": ">=2.5.0"
@@ -50,5 +50,8 @@
5050
},
5151
"numpy": {
5252
"version_specifier": "<2"
53+
},
54+
"opencv-python": {
55+
"version_specifier": "==4.11.0.86"
5356
}
5457
}

pytorch/training/docker/2.5/py3/Dockerfile.sagemaker.cpu.core_packages.json

Lines changed: 13 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -37,10 +37,10 @@
3737
"version_specifier": ">=4.66.3"
3838
},
3939
"requests": {
40-
"version_specifier": ">=2.32.0"
40+
"version_specifier": ">=2.32.4"
4141
},
4242
"setuptools": {
43-
"version_specifier": ">=70.0.0"
43+
"version_specifier": ">=80.9.0"
4444
},
4545
"urllib3": {
4646
"version_specifier": ">=2.5.0"
@@ -62,5 +62,16 @@
6262
},
6363
"tornado": {
6464
"version_specifier": ">=6.5.1"
65+
},
66+
"sagemaker-training": {
67+
"version_specifier": ">=5.0.0",
68+
"skip": "True"
69+
},
70+
"opencv-python": {
71+
"version_specifier": "==4.11.0.86"
72+
},
73+
"protobuf": {
74+
"version_specifier": ">=6.31.1",
75+
"skip": "True"
6576
}
6677
}

pytorch/training/docker/2.5/py3/cu124/Dockerfile.ec2.gpu.core_packages.json

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -45,10 +45,10 @@
4545
"version_specifier": ">=4.66.3"
4646
},
4747
"requests": {
48-
"version_specifier": ">=2.32.0"
48+
"version_specifier": ">=2.32.4"
4949
},
5050
"setuptools": {
51-
"version_specifier": ">=70.0.0"
51+
"version_specifier": ">=80.9.0"
5252
},
5353
"urllib3": {
5454
"version_specifier": ">=2.5.0"
@@ -58,5 +58,8 @@
5858
},
5959
"numpy": {
6060
"version_specifier": "<2"
61+
},
62+
"opencv-python": {
63+
"version_specifier": "==4.11.0.86"
6164
}
6265
}

0 commit comments

Comments
 (0)