diff --git a/CHANGELOG.md b/CHANGELOG.md index 7c2b1851ae..8d2181c222 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,19 @@ # Changelog +## v2.237.3 (2025-01-09) + +### Bug Fixes and Other Changes + + * model server might have already done a serialization. honor that by not decoding the request again if it is not already bytes or bytestream + * Disable jumpstart tests missing clean up logic + * Jumpstart ap southeast 5 + * add autogluon 1.2 + * updated inference script to cover context + * security update -> use sha256 instead of md5 for file hashing + * Fix Flake8 Violations + * Added parsing string support for situations where custom code might be used (ie. mlflow) + * Updating Inference Optimization Validations + ## v2.237.2 (2024-12-17) ### Bug Fixes and Other Changes diff --git a/VERSION b/VERSION index 8ea608a3da..1ca006360a 100644 --- a/VERSION +++ b/VERSION @@ -1 +1 @@ -2.237.3.dev0 +2.237.4.dev0 diff --git a/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json b/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json index 0fdb190d30..b16933d1a3 100644 --- a/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json +++ b/src/sagemaker/image_uri_config/huggingface-llm-neuronx.json @@ -4,7 +4,7 @@ "inf2" ], "version_aliases": { - "0.0": "0.0.25" + "0.0": "0.0.27" }, "versions": { "0.0.16": { @@ -344,6 +344,40 @@ "container_version": { "inf2": "ubuntu22.04" } + }, + "0.0.27": { + "py_versions": [ + "py310" + ], + "registries": { + "ap-northeast-1": "763104351884", + "ap-south-1": "763104351884", + "ap-south-2": "772153158452", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-4": "457447274322", + "ap-southeast-5": "550225433462", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-central-2": "380420809688", + "eu-south-2": "503227376785", + "eu-west-1": "763104351884", + "eu-west-3": "763104351884", + "il-central-1": "780543022126", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-gov-east-1": "446045086412", + "us-gov-west-1": "442386744353", + "us-west-2": "763104351884", + "ca-west-1": "204538143572" + }, + "tag_prefix": "2.1.2-optimum0.0.27", + "repository": "huggingface-pytorch-tgi-inference", + "container_version": { + "inf2": "ubuntu22.04" + } } } } diff --git a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py index 28525a390c..49cc4773d6 100644 --- a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py +++ b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py @@ -58,6 +58,7 @@ "0.0.23": "2.1.2-optimum0.0.23-neuronx-py310-ubuntu22.04", "0.0.24": "2.1.2-optimum0.0.24-neuronx-py310-ubuntu22.04", "0.0.25": "2.1.2-optimum0.0.25-neuronx-py310-ubuntu22.04", + "0.0.27": "2.1.2-optimum0.0.27-neuronx-py310-ubuntu22.04", }, }