Skip to content

Commit d4f2653

Browse files
authored
Merge branch 'master' into master
2 parents 0983d5f + aa86be9 commit d4f2653

File tree

7 files changed

+71
-8
lines changed

7 files changed

+71
-8
lines changed

src/sagemaker/djl_inference/model.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -781,7 +781,7 @@ def serving_image_uri(self, region_name):
781781
str: The appropriate image URI based on the given parameters.
782782
"""
783783
if not self.djl_version:
784-
self.djl_version = "0.23.0"
784+
self.djl_version = "0.24.0"
785785

786786
return image_uris.retrieve(
787787
self._framework(),

src/sagemaker/huggingface/llm_utils.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -51,6 +51,6 @@ def get_huggingface_llm_image_uri(
5151
image_scope="inference",
5252
)
5353
if backend == "lmi":
54-
version = version or "0.23.0"
54+
version = version or "0.24.0"
5555
return image_uris.retrieve(framework="djl-deepspeed", region=region, version=version)
5656
raise ValueError("Unsupported backend: %s" % backend)

src/sagemaker/image_uri_config/djl-deepspeed.json

+31
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,37 @@
11
{
22
"scope": ["inference"],
33
"versions": {
4+
"0.24.0": {
5+
"registries": {
6+
"af-south-1": "626614931356",
7+
"il-central-1": "780543022126",
8+
"ap-east-1": "871362719292",
9+
"ap-northeast-1": "763104351884",
10+
"ap-northeast-2": "763104351884",
11+
"ap-northeast-3": "364406365360",
12+
"ap-south-1": "763104351884",
13+
"ap-southeast-1": "763104351884",
14+
"ap-southeast-2": "763104351884",
15+
"ap-southeast-3": "907027046896",
16+
"ca-central-1": "763104351884",
17+
"cn-north-1": "727897471807",
18+
"cn-northwest-1": "727897471807",
19+
"eu-central-1": "763104351884",
20+
"eu-north-1": "763104351884",
21+
"eu-west-1": "763104351884",
22+
"eu-west-2": "763104351884",
23+
"eu-west-3": "763104351884",
24+
"eu-south-1": "692866216735",
25+
"me-south-1": "217643126080",
26+
"sa-east-1": "763104351884",
27+
"us-east-1": "763104351884",
28+
"us-east-2": "763104351884",
29+
"us-west-1": "763104351884",
30+
"us-west-2": "763104351884"
31+
},
32+
"repository": "djl-inference",
33+
"tag_prefix": "0.24.0-deepspeed0.10.0-cu118"
34+
},
435
"0.23.0": {
536
"registries": {
637
"af-south-1": "626614931356",

src/sagemaker/image_uri_config/djl-fastertransformer.json

+31
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,37 @@
11
{
22
"scope": ["inference"],
33
"versions": {
4+
"0.24.0": {
5+
"registries": {
6+
"af-south-1": "626614931356",
7+
"il-central-1": "780543022126",
8+
"ap-east-1": "871362719292",
9+
"ap-northeast-1": "763104351884",
10+
"ap-northeast-2": "763104351884",
11+
"ap-northeast-3": "364406365360",
12+
"ap-south-1": "763104351884",
13+
"ap-southeast-1": "763104351884",
14+
"ap-southeast-2": "763104351884",
15+
"ap-southeast-3": "907027046896",
16+
"ca-central-1": "763104351884",
17+
"cn-north-1": "727897471807",
18+
"cn-northwest-1": "727897471807",
19+
"eu-central-1": "763104351884",
20+
"eu-north-1": "763104351884",
21+
"eu-west-1": "763104351884",
22+
"eu-west-2": "763104351884",
23+
"eu-west-3": "763104351884",
24+
"eu-south-1": "692866216735",
25+
"me-south-1": "217643126080",
26+
"sa-east-1": "763104351884",
27+
"us-east-1": "763104351884",
28+
"us-east-2": "763104351884",
29+
"us-west-1": "763104351884",
30+
"us-west-2": "763104351884"
31+
},
32+
"repository": "djl-inference",
33+
"tag_prefix": "0.24.0-fastertransformer5.3.0-cu118"
34+
},
435
"0.23.0": {
536
"registries": {
637
"af-south-1": "626614931356",

tests/unit/sagemaker/image_uris/test_djl.py

+4 -3
Original file line number | Diff line number | Diff line change
@@ -42,9 +42,8 @@
4242
"us-west-1": "763104351884",
4343
"us-west-2": "763104351884",
4444
}
45-
DJL_DEEPSPEED_VERSIONS = ["0.23.0", "0.22.1", "0.21.0", "0.20.0", "0.19.0"]
46-
DJL_FASTERTRANSFORMER_VERSIONS = ["0.23.0", "0.22.1", "0.21.0"]
47-
DJL_NEURONX_VERSIONS = ["0.23.0", "0.22.1"]
45+
DJL_DEEPSPEED_VERSIONS = ["0.24.0", "0.23.0", "0.22.1", "0.21.0", "0.20.0", "0.19.0"]
46+
DJL_FASTERTRANSFORMER_VERSIONS = ["0.24.0", "0.23.0", "0.22.1", "0.21.0"]
4847
DJL_NEURONX_VERSIONS = ["0.24.0", "0.23.0", "0.22.1"]
4948
DJL_VERSIONS_TO_FRAMEWORK = {
5049
"0.19.0": {"djl-deepspeed": "deepspeed0.7.3-cu113"},
@@ -64,6 +63,8 @@
6463
"djl-neuronx": "neuronx-sdk2.12.0",
6564
},
6665
"0.24.0": {
66+
"djl-deepspeed": "deepspeed0.10.0-cu118",
67+
"djl-fastertransformer": "fastertransformer5.3.0-cu118",
6768
"djl-neuronx": "neuronx-sdk2.14.1",
6869
},
6970
}

tests/unit/sagemaker/image_uris/test_huggingface_llm.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -45,15 +45,15 @@
4545
"us-west-2": "763104351884",
4646
}
4747
HF_VERSIONS = ["0.6.0", "0.8.2", "0.9.3", "1.0.3", "1.1.0"]
48-
LMI_VERSIONS = ["0.23.0"]
48+
LMI_VERSIONS = ["0.24.0"]
4949
HF_VERSIONS_MAPPING = {
5050
"0.6.0": "2.0.0-tgi0.6.0-gpu-py39-cu118-ubuntu20.04",
5151
"0.8.2": "2.0.0-tgi0.8.2-gpu-py39-cu118-ubuntu20.04",
5252
"0.9.3": "2.0.1-tgi0.9.3-gpu-py39-cu118-ubuntu20.04",
5353
"1.0.3": "2.0.1-tgi1.0.3-gpu-py39-cu118-ubuntu20.04",
5454
"1.1.0": "2.0.1-tgi1.1.0-gpu-py39-cu118-ubuntu20.04",
5555
}
56-
LMI_VERSIONS_MAPPING = {"0.23.0": "deepspeed0.9.5-cu118"}
56+
LMI_VERSIONS_MAPPING = {"0.24.0": "deepspeed0.10.0-cu118"}
5757

5858

5959
@pytest.mark.parametrize("version", HF_VERSIONS)

tests/unit/test_djl_inference.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -46,7 +46,7 @@
4646
ROLE = "dummy_role"
4747
REGION = "us-west-2"
4848
BUCKET = "mybucket"
49-
IMAGE_URI = "763104351884.dkr.ecr.us-west-2.amazon.com/djl-inference:0.23.0-deepspeed0.9.5-cu118"
49+
IMAGE_URI = "763104351884.dkr.ecr.us-west-2.amazon.com/djl-inference:0.24.0-deepspeed0.10.0-cu118"
5050
GPU_INSTANCE = "ml.g5.12xlarge"
5151

5252

0 commit comments

Comments
 (0)