diff --git a/src/sagemaker/djl_inference/model.py b/src/sagemaker/djl_inference/model.py index 89f15a54ab..b22347afbd 100644 --- a/src/sagemaker/djl_inference/model.py +++ b/src/sagemaker/djl_inference/model.py @@ -599,7 +599,7 @@ def serving_image_uri(self, region_name): str: The appropriate image URI based on the given parameters. """ if not self.djl_version: - self.djl_version = "0.21.0" + self.djl_version = "0.22.1" return image_uris.retrieve( self._framework(), diff --git a/src/sagemaker/image_uri_config/djl-deepspeed.json b/src/sagemaker/image_uri_config/djl-deepspeed.json index 70394d0d9a..8eb171c05f 100644 --- a/src/sagemaker/image_uri_config/djl-deepspeed.json +++ b/src/sagemaker/image_uri_config/djl-deepspeed.json @@ -1,6 +1,36 @@ { "scope": ["inference"], "versions": { + "0.22.1": { + "registries": { + "af-south-1": "626614931356", + "ap-east-1": "871362719292", + "ap-northeast-1": "763104351884", + "ap-northeast-2": "763104351884", + "ap-northeast-3": "364406365360", + "ap-south-1": "763104351884", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-3": "907027046896", + "ca-central-1": "763104351884", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-north-1": "763104351884", + "eu-west-1": "763104351884", + "eu-west-2": "763104351884", + "eu-west-3": "763104351884", + "eu-south-1": "692866216735", + "me-south-1": "217643126080", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-west-1": "763104351884", + "us-west-2": "763104351884" + }, + "repository": "djl-inference", + "tag_prefix": "0.22.1-deepspeed0.8.3-cu118" + }, "0.21.0": { "registries": { "af-south-1": "626614931356", diff --git a/src/sagemaker/image_uri_config/djl-fastertransformer.json b/src/sagemaker/image_uri_config/djl-fastertransformer.json index 4c1873257a..d86f073b84 100644 --- a/src/sagemaker/image_uri_config/djl-fastertransformer.json +++ b/src/sagemaker/image_uri_config/djl-fastertransformer.json @@ -1,6 +1,36 @@ { "scope": ["inference"], "versions": { + "0.22.1": { + "registries": { + "af-south-1": "626614931356", + "ap-east-1": "871362719292", + "ap-northeast-1": "763104351884", + "ap-northeast-2": "763104351884", + "ap-northeast-3": "364406365360", + "ap-south-1": "763104351884", + "ap-southeast-1": "763104351884", + "ap-southeast-2": "763104351884", + "ap-southeast-3": "907027046896", + "ca-central-1": "763104351884", + "cn-north-1": "727897471807", + "cn-northwest-1": "727897471807", + "eu-central-1": "763104351884", + "eu-north-1": "763104351884", + "eu-west-1": "763104351884", + "eu-west-2": "763104351884", + "eu-west-3": "763104351884", + "eu-south-1": "692866216735", + "me-south-1": "217643126080", + "sa-east-1": "763104351884", + "us-east-1": "763104351884", + "us-east-2": "763104351884", + "us-west-1": "763104351884", + "us-west-2": "763104351884" + }, + "repository": "djl-inference", + "tag_prefix": "0.22.1-fastertransformer5.3.0-cu118" + }, "0.21.0": { "registries": { "af-south-1": "626614931356", diff --git a/tests/unit/sagemaker/image_uris/test_djl.py b/tests/unit/sagemaker/image_uris/test_djl.py index e85778acbe..4dc81b3562 100644 --- a/tests/unit/sagemaker/image_uris/test_djl.py +++ b/tests/unit/sagemaker/image_uris/test_djl.py @@ -41,8 +41,8 @@ "us-west-1": "763104351884", "us-west-2": "763104351884", } -DJL_DEEPSPEED_VERSIONS = ["0.21.0", "0.20.0", "0.19.0"] -DJL_FASTERTRANSFORMER_VERSIONS = ["0.21.0"] +DJL_DEEPSPEED_VERSIONS = ["0.22.1", "0.21.0", "0.20.0", "0.19.0"] +DJL_FASTERTRANSFORMER_VERSIONS = ["0.22.1", "0.21.0"] DJL_NEURONX_VERSIONS = ["0.22.1"] DJL_VERSIONS_TO_FRAMEWORK = { "0.19.0": {"djl-deepspeed": "deepspeed0.7.3-cu113"}, @@ -52,6 +52,8 @@ "djl-fastertransformer": "fastertransformer5.3.0-cu117", }, "0.22.1": { + "djl-deepspeed": "deepspeed0.8.3-cu118", + "djl-fastertransformer": "fastertransformer5.3.0-cu118", "djl-neuronx": "neuronx-sdk2.9.0", }, }