diff --git a/src/sagemaker/image_uri_config/huggingface-llm.json b/src/sagemaker/image_uri_config/huggingface-llm.json index 2571f39c17..bb659a89d3 100644 --- a/src/sagemaker/image_uri_config/huggingface-llm.json +++ b/src/sagemaker/image_uri_config/huggingface-llm.json @@ -132,6 +132,48 @@ "tag_prefix": "2.0.1-tgi0.9.3", "repository": "huggingface-pytorch-tgi-inference", "container_version": {"gpu": "cu118-ubuntu20.04"} + }, + "1.0.2": { + "py_versions": ["py39"], + "registries": { + "af-south-1": "626614931356", + "il-central-1": "780543022126", + "ap-east-1": "871362719292", + "ap-northeast-1": "763104351884", + "ap-northeast-2": "763104351884", + "ap-northeast-3": "364406365360", + "ap-south-1": "763104351884", + "ap-south-2": "772153158452", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-3": "907027046896", + "ap-southeast-4": "457447274322", + "ca-central-1": "763104351884", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-central-2": "380420809688", + "eu-north-1": "763104351884", + "eu-west-1": "763104351884", + "eu-west-2": "763104351884", + "eu-west-3": "763104351884", + "eu-south-1": "692866216735", + "eu-south-2": "503227376785", + "me-south-1": "217643126080", + "me-central-1": "914824155844", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-gov-east-1": "446045086412", + "us-gov-west-1": "442386744353", + "us-iso-east-1": "886529160074", + "us-isob-east-1": "094389454867", + "us-west-1": "763104351884", + "us-west-2": "763104351884" + }, + "tag_prefix": "2.0.1-tgi1.0.2", + "repository": "huggingface-pytorch-tgi-inference", + "container_version": {"gpu": "cu118-ubuntu20.04"} } } } diff --git a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py index dfb47775a6..cb0532dcf0 100644 --- a/tests/unit/sagemaker/image_uris/test_huggingface_llm.py +++ b/tests/unit/sagemaker/image_uris/test_huggingface_llm.py @@ -44,12 +44,13 @@ "us-west-1": "763104351884", "us-west-2": "763104351884", } -HF_VERSIONS = ["0.6.0", "0.8.2", "0.9.3"] +HF_VERSIONS = ["0.6.0", "0.8.2", "0.9.3", "1.0.2"] LMI_VERSIONS = ["0.23.0"] HF_VERSIONS_MAPPING = { "0.6.0": "2.0.0-tgi0.6.0-gpu-py39-cu118-ubuntu20.04", "0.8.2": "2.0.0-tgi0.8.2-gpu-py39-cu118-ubuntu20.04", "0.9.3": "2.0.1-tgi0.9.3-gpu-py39-cu118-ubuntu20.04", + "1.0.2": "2.0.1-tgi1.0.2-gpu-py39-cu118-ubuntu20.04", } LMI_VERSIONS_MAPPING = {"0.23.0": "deepspeed0.9.5-cu118"}