From bc5ad686f985fe64d6a229456f96b97b05fdbba9 Mon Sep 17 00:00:00 2001 From: pagezyhf Date: Tue, 14 Oct 2025 16:55:03 +0200 Subject: [PATCH 1/4] add image --- .../image_uri_config/huggingface-neuronx.json | 54 +++++++++++++++++-- 1 file changed, 49 insertions(+), 5 deletions(-) diff --git a/src/sagemaker/image_uri_config/huggingface-neuronx.json b/src/sagemaker/image_uri_config/huggingface-neuronx.json index d39d58bb9e..fef36c96e1 100644 --- a/src/sagemaker/image_uri_config/huggingface-neuronx.json +++ b/src/sagemaker/image_uri_config/huggingface-neuronx.json @@ -8,7 +8,8 @@ "4.34": "4.34.1", "4.36": "4.36.2", "4.43": "4.43.2", - "4.48": "4.48.1" + "4.48": "4.48.1", + "4.51": "4.51.0" }, "versions": { "4.28.1": { @@ -63,7 +64,7 @@ "py_versions": [ "py310" ], - "repository": "huggingface-pytorch-inference-neuronx", + "repository": "huggingface-pytorch-training-neuronx", "registries": { "ap-east-2": "975050140332", "ap-northeast-1": "763104351884", @@ -107,7 +108,7 @@ "py_versions": [ "py310" ], - "repository": "huggingface-pytorch-inference-neuronx", + "repository": "huggingface-pytorch-training-neuronx", "registries": { "ap-east-2": "975050140332", "ap-northeast-1": "763104351884", @@ -151,7 +152,7 @@ "py_versions": [ "py310" ], - "repository": "huggingface-pytorch-inference-neuronx", + "repository": "huggingface-pytorch-training-neuronx", "registries": { "ap-northeast-1": "763104351884", "ap-south-1": "763104351884", @@ -194,7 +195,7 @@ "py_versions": [ "py310" ], - "repository": "huggingface-pytorch-inference-neuronx", + "repository": "huggingface-pytorch-training-neuronx", "registries": { "ap-northeast-1": "763104351884", "ap-south-1": "763104351884", @@ -228,6 +229,49 @@ "sdk2.20.0" ] } + }, + "4.51.0": { + "version_aliases": { + "pytorch2.7": "pytorch2.7.0" + }, + "pytorch2.7.0": { + "py_versions": [ + "py310" + ], + "repository": "huggingface-pytorch-training-neuronx", + "registries": { + "ap-northeast-1": "763104351884", + "ap-south-1": "763104351884", + 
"ap-south-2": "772153158452", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-4": "457447274322", + "ap-southeast-5": "550225433462", + "ap-southeast-7": "590183813437", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-central-2": "380420809688", + "eu-south-2": "503227376785", + "eu-west-1": "763104351884", + "eu-west-3": "763104351884", + "il-central-1": "780543022126", + "mx-central-1": "637423239942", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-gov-east-1": "446045086412", + "us-gov-west-1": "442386744353", + "us-west-2": "763104351884", + "ca-west-1": "204538143572" + }, + "container_version": { + "inf": "ubuntu22.04" + }, + "sdk_versions": [ + "sdk2.24.1" + ] + } } } }, From 35d8e6265904bf9e0a99d245ed633540644458e2 Mon Sep 17 00:00:00 2001 From: pagezyhf Date: Tue, 14 Oct 2025 17:30:10 +0200 Subject: [PATCH 2/4] inf on dlc --- .../image_uri_config/huggingface-neuronx.json | 46 ++++++++++++++++++- 1 file changed, 45 insertions(+), 1 deletion(-) diff --git a/src/sagemaker/image_uri_config/huggingface-neuronx.json b/src/sagemaker/image_uri_config/huggingface-neuronx.json index fef36c96e1..732e397ce9 100644 --- a/src/sagemaker/image_uri_config/huggingface-neuronx.json +++ b/src/sagemaker/image_uri_config/huggingface-neuronx.json @@ -283,7 +283,8 @@ "4.28": "4.28.1", "4.34": "4.34.1", "4.36": "4.36.2", - "4.43": "4.43.2" + "4.43": "4.43.2", + "4.51": "4.51.3" }, "versions": { "4.28.1": { @@ -548,6 +549,49 @@ "sdk2.20.0" ] } + }, + "4.51.3": { + "version_aliases": { + "pytorch2.7": "pytorch2.7.1" + }, + "pytorch2.7.1": { + "py_versions": [ + "py310" + ], + "repository": "huggingface-pytorch-inference-neuronx", + "registries": { + "ap-northeast-1": "763104351884", + "ap-south-1": "763104351884", + "ap-south-2": "772153158452", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + 
"ap-southeast-4": "457447274322", + "ap-southeast-5": "550225433462", + "ap-southeast-7": "590183813437", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-central-2": "380420809688", + "eu-south-2": "503227376785", + "eu-west-1": "763104351884", + "eu-west-3": "763104351884", + "il-central-1": "780543022126", + "mx-central-1": "637423239942", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-gov-east-1": "446045086412", + "us-gov-west-1": "442386744353", + "us-west-2": "763104351884", + "ca-west-1": "204538143572" + }, + "container_version": { + "inf": "ubuntu22.04" + }, + "sdk_versions": [ + "sdk2.24.1" + ] + } } } } From 8c2926292f782a2f5102801791b656792b34212b Mon Sep 17 00:00:00 2001 From: pagezyhf Date: Tue, 14 Oct 2025 19:14:34 +0200 Subject: [PATCH 3/4] neuron tgi dlcs --- .../huggingface-llm-neuronx.json | 112 +++++++++++++++++- .../image_uris/test_huggingface_llm.py | 3 + 2 files changed, 114 insertions(+), 1 deletion(-) diff --git a/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json b/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json index 1c425b37ec..a4885058c7 100644 --- a/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json +++ b/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json @@ -4,7 +4,9 @@ "inf2" ], "version_aliases": { - "0.0": "0.0.28" + "0.0": "0.0.28", + "0.2": "0.2.0", + "0.3": "0.3.0" }, "versions": { "0.0.16": { @@ -654,6 +656,114 @@ "container_version": { "inf2": "ubuntu22.04" } + }, + "0.2.0": { + "py_versions": [ + "py310" + ], + "registries": { + "af-south-1": "626614931356", + "ap-east-1": "871362719292", + "ap-east-2": "975050140332", + "ap-northeast-1": "763104351884", + "ap-northeast-2": "763104351884", + "ap-northeast-3": "364406365360", + "ap-south-1": "763104351884", + "ap-south-2": "772153158452", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-3": 
"907027046896", + "ap-southeast-4": "457447274322", + "ap-southeast-5": "550225433462", + "ap-southeast-6": "633930458069", + "ap-southeast-7": "590183813437", + "ca-central-1": "763104351884", + "ca-west-1": "204538143572", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-central-2": "380420809688", + "eu-north-1": "763104351884", + "eu-south-1": "692866216735", + "eu-south-2": "503227376785", + "eu-west-1": "763104351884", + "eu-west-2": "763104351884", + "eu-west-3": "763104351884", + "il-central-1": "780543022126", + "me-central-1": "914824155844", + "me-south-1": "217643126080", + "mx-central-1": "637423239942", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-gov-east-1": "446045086412", + "us-gov-west-1": "442386744353", + "us-iso-east-1": "886529160074", + "us-isob-east-1": "094389454867", + "us-isof-east-1": "303241398832", + "us-isof-south-1": "454834333376", + "us-west-1": "763104351884", + "us-west-2": "763104351884" + }, + "tag_prefix": "2.5.1-optimum3.3.4", + "repository": "huggingface-pytorch-tgi-inference", + "container_version": { + "inf2": "ubuntu22.04" + } + }, + "0.3.0": { + "py_versions": [ + "py310" + ], + "registries": { + "af-south-1": "626614931356", + "ap-east-1": "871362719292", + "ap-east-2": "975050140332", + "ap-northeast-1": "763104351884", + "ap-northeast-2": "763104351884", + "ap-northeast-3": "364406365360", + "ap-south-1": "763104351884", + "ap-south-2": "772153158452", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-3": "907027046896", + "ap-southeast-4": "457447274322", + "ap-southeast-5": "550225433462", + "ap-southeast-6": "633930458069", + "ap-southeast-7": "590183813437", + "ca-central-1": "763104351884", + "ca-west-1": "204538143572", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-central-2": "380420809688", + 
"eu-north-1": "763104351884", + "eu-south-1": "692866216735", + "eu-south-2": "503227376785", + "eu-west-1": "763104351884", + "eu-west-2": "763104351884", + "eu-west-3": "763104351884", + "il-central-1": "780543022126", + "me-central-1": "914824155844", + "me-south-1": "217643126080", + "mx-central-1": "637423239942", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-gov-east-1": "446045086412", + "us-gov-west-1": "442386744353", + "us-iso-east-1": "886529160074", + "us-isob-east-1": "094389454867", + "us-isof-east-1": "303241398832", + "us-isof-south-1": "454834333376", + "us-west-1": "763104351884", + "us-west-2": "763104351884" + }, + "tag_prefix": "2.7.0-optimum3.3.6", + "repository": "huggingface-pytorch-tgi-inference", + "container_version": { + "inf2": "ubuntu22.04" + } } } } diff --git a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py index 8949f45b2b..1d8942819d 100644 --- a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py +++ b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py @@ -70,6 +70,9 @@ "0.0.24": "2.1.2-optimum0.0.24-neuronx-py310-ubuntu22.04", "0.0.25": "2.1.2-optimum0.0.25-neuronx-py310-ubuntu22.04", "0.0.27": "2.1.2-optimum0.0.27-neuronx-py310-ubuntu22.04", + "0.0.28": "2.1.2-optimum0.0.28-neuronx-py310-ubuntu22.04", + "0.2.0": "2.1.2-optimum0.2.0-neuronx-py310-ubuntu22.04", + "0.3.0": "2.7.0-optimum3.3.6-neuronx-py310-ubuntu22.04" }, } From 2dda6daa4be3e4f74842806b5a9eadca74fad962 Mon Sep 17 00:00:00 2001 From: pagezyhf Date: Wed, 15 Oct 2025 10:37:38 +0200 Subject: [PATCH 4/4] fix test --- tests/unit/sagemaker/image_uris/test_huggingface_llm.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py index 1d8942819d..07aa15ec96 100644 --- 
a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py +++ b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py @@ -71,8 +71,8 @@ "0.0.25": "2.1.2-optimum0.0.25-neuronx-py310-ubuntu22.04", "0.0.27": "2.1.2-optimum0.0.27-neuronx-py310-ubuntu22.04", "0.0.28": "2.1.2-optimum0.0.28-neuronx-py310-ubuntu22.04", - "0.2.0": "2.1.2-optimum0.2.0-neuronx-py310-ubuntu22.04", - "0.3.0": "2.7.0-optimum3.3.6-neuronx-py310-ubuntu22.04" + "0.2.0": "2.5.1-optimum3.3.4-neuronx-py310-ubuntu22.04", + "0.3.0": "2.7.0-optimum3.3.6-neuronx-py310-ubuntu22.04", }, }