From ee7cc9e022ac18e8944f8e87c04527bd84dfd9dd Mon Sep 17 00:00:00 2001
From: Haotian An
Date: Tue, 27 Aug 2024 18:46:42 +0000
Subject: [PATCH] chore: add HF LLM neuronx 0.0.24 image

---
 .../huggingface-llm-neuronx.json       | 31 ++++++++++++++++++-
 .../image_uris/test_huggingface_llm.py |  1 +
 2 files changed, 31 insertions(+), 1 deletion(-)

diff --git a/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json b/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json
index 1f08c8bbcd..3283dd21f0 100644
--- a/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json
+++ b/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json
@@ -4,7 +4,7 @@
       "inf2"
     ],
     "version_aliases": {
-      "0.0": "0.0.23"
+      "0.0": "0.0.24"
     },
     "versions": {
       "0.0.16": {
@@ -238,6 +238,35 @@
         "container_version": {
           "inf2": "ubuntu22.04"
         }
+      },
+      "0.0.24": {
+        "py_versions": [
+          "py310"
+        ],
+        "registries": {
+          "ap-northeast-1": "763104351884",
+          "ap-south-1": "763104351884",
+          "ap-south-2": "772153158452",
+          "ap-southeast-1": "763104351884",
+          "ap-southeast-2": "763104351884",
+          "ap-southeast-4": "457447274322",
+          "eu-central-1": "763104351884",
+          "eu-central-2": "380420809688",
+          "eu-south-2": "503227376785",
+          "eu-west-1": "763104351884",
+          "eu-west-3": "763104351884",
+          "il-central-1": "780543022126",
+          "sa-east-1": "763104351884",
+          "us-east-1": "763104351884",
+          "us-east-2": "763104351884",
+          "us-west-2": "763104351884",
+          "ca-west-1": "204538143572"
+        },
+        "tag_prefix": "2.1.2-optimum0.0.24",
+        "repository": "huggingface-pytorch-tgi-inference",
+        "container_version": {
+          "inf2": "ubuntu22.04"
+        }
       }
     }
   }
diff --git a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py
index 4b50363d9e..c3fab15936 100644
--- a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py
+++ b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py
@@ -55,6 +55,7 @@
         "0.0.21": "1.13.1-optimum0.0.21-neuronx-py310-ubuntu22.04",
         "0.0.22": "2.1.2-optimum0.0.22-neuronx-py310-ubuntu22.04",
         "0.0.23": "2.1.2-optimum0.0.23-neuronx-py310-ubuntu22.04",
+        "0.0.24": "2.1.2-optimum0.0.24-neuronx-py310-ubuntu22.04",
     },
 }
 