diff --git a/sagemaker-core/src/sagemaker/core/image_uri_config/huggingface-vllm-neuronx.json b/sagemaker-core/src/sagemaker/core/image_uri_config/huggingface-vllm-neuronx.json index c2592c915a..2a2e6c8f78 100644 --- a/sagemaker-core/src/sagemaker/core/image_uri_config/huggingface-vllm-neuronx.json +++ b/sagemaker-core/src/sagemaker/core/image_uri_config/huggingface-vllm-neuronx.json @@ -1,10 +1,10 @@ { "inference": { "processors": [ - "inf2" + "neuronx" ], "version_aliases": { - "0.4": "0.4.1" + "0.4": "0.4.2" }, "versions": { "0.4.1": { @@ -27,7 +27,33 @@ "tag_prefix": "0.10.2", "repository": "huggingface-vllm-inference-neuronx", "container_version": { - "inf2": "ubuntu22.04" + "neuronx": "ubuntu22.04" + }, + "sdk_versions": [ + "sdk2.26.0" + ] + }, + "0.4.2": { + "py_versions": [ + "py310" + ], + "registries": { + "ap-northeast-1": "763104351884", + "ap-south-1": "763104351884", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "eu-central-1": "763104351884", + "eu-west-1": "763104351884", + "eu-west-3": "763104351884", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-west-2": "763104351884" + }, + "tag_prefix": "0.11.0-optimum0.4.2", + "repository": "huggingface-vllm-inference-neuronx", + "container_version": { + "neuronx": "ubuntu22.04" }, "sdk_versions": [ "sdk2.26.0" @@ -35,4 +61,4 @@ } } } -} \ No newline at end of file +}