Skip to content

Commit 49e1885

Browse files
jinyoung-lim authored and root committed
feat: TGI optimum 0.0.18 (general+llm) (aws#4436)
* tgi optimum 0.0.18
* add test
* update latest transformer version
* add dlc optimum 0.0.18 config
* 0.0 defaults to 0.0.16
1 parent 24f871f commit 49e1885

File tree

4 files changed

+88
-3
lines changed

4 files changed

+88
-3
lines changed

src/sagemaker/image_uri_config/huggingface-llm-neuronx.json

+29
Original file line numberDiff line numberDiff line change
@@ -64,6 +64,35 @@
6464
"container_version": {
6565
"inf2": "ubuntu22.04"
6666
}
67+
},
68+
"0.0.18": {
69+
"py_versions": [
70+
"py310"
71+
],
72+
"registries": {
73+
"ap-northeast-1": "763104351884",
74+
"ap-south-1": "763104351884",
75+
"ap-south-2": "772153158452",
76+
"ap-southeast-1": "763104351884",
77+
"ap-southeast-2": "763104351884",
78+
"ap-southeast-4": "457447274322",
79+
"eu-central-1": "763104351884",
80+
"eu-central-2": "380420809688",
81+
"eu-south-2": "503227376785",
82+
"eu-west-1": "763104351884",
83+
"eu-west-3": "763104351884",
84+
"il-central-1": "780543022126",
85+
"sa-east-1": "763104351884",
86+
"us-east-1": "763104351884",
87+
"us-east-2": "763104351884",
88+
"us-west-2": "763104351884",
89+
"ca-west-1": "204538143572"
90+
},
91+
"tag_prefix": "1.13.1-optimum0.0.18",
92+
"repository": "huggingface-pytorch-tgi-inference",
93+
"container_version": {
94+
"inf2": "ubuntu22.04"
95+
}
6796
}
6897
}
6998
}

src/sagemaker/image_uri_config/huggingface-neuronx.json

+57-2
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,8 @@
44
"trn"
55
],
66
"version_aliases": {
7-
"4.28": "4.28.1"
7+
"4.28": "4.28.1",
8+
"4.34": "4.34.1"
89
},
910
"versions": {
1011
"4.28.1": {
@@ -86,7 +87,9 @@
8687
"inf"
8788
],
8889
"version_aliases": {
89-
"4.28": "4.28.1"
90+
"4.28": "4.28.1",
91+
"4.34": "4.34.1",
92+
"4.36": "4.36.2"
9093
},
9194
"versions": {
9295
"4.28.1": {
@@ -192,6 +195,58 @@
192195
"sdk2.15.0"
193196
]
194197
}
198+
},
199+
"4.36.2": {
200+
"version_aliases": {
201+
"pytorch1.13": "pytorch1.13.1"
202+
},
203+
"pytorch1.13.1": {
204+
"py_versions": [
205+
"py310"
206+
],
207+
"repository": "huggingface-pytorch-inference-neuronx",
208+
"registries": {
209+
"af-south-1": "626614931356",
210+
"il-central-1": "780543022126",
211+
"ap-east-1": "871362719292",
212+
"ap-northeast-1": "763104351884",
213+
"ap-northeast-2": "763104351884",
214+
"ap-northeast-3": "364406365360",
215+
"ap-south-1": "763104351884",
216+
"ap-south-2": "772153158452",
217+
"ap-southeast-1": "763104351884",
218+
"ap-southeast-2": "763104351884",
219+
"ap-southeast-4": "457447274322",
220+
"ca-central-1": "763104351884",
221+
"cn-north-1": "727897471807",
222+
"cn-northwest-1": "727897471807",
223+
"eu-central-1": "763104351884",
224+
"eu-central-2": "380420809688",
225+
"eu-north-1": "763104351884",
226+
"eu-west-1": "763104351884",
227+
"eu-west-2": "763104351884",
228+
"eu-west-3": "763104351884",
229+
"eu-south-1": "692866216735",
230+
"eu-south-2": "503227376785",
231+
"me-south-1": "217643126080",
232+
"sa-east-1": "763104351884",
233+
"us-east-1": "763104351884",
234+
"us-east-2": "763104351884",
235+
"us-gov-east-1": "446045086412",
236+
"us-gov-west-1": "442386744353",
237+
"us-iso-east-1": "886529160074",
238+
"us-isob-east-1": "094389454867",
239+
"us-west-1": "763104351884",
240+
"us-west-2": "763104351884",
241+
"ca-west-1": "204538143572"
242+
},
243+
"container_version": {
244+
"inf": "ubuntu20.04"
245+
},
246+
"sdk_versions": [
247+
"sdk2.16.1"
248+
]
249+
}
195250
}
196251
}
197252
}

tests/conftest.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -441,7 +441,7 @@ def huggingface_neuron_latest_inference_transformer_version():
441441

442442
@pytest.fixture(scope="module")
443443
def huggingface_neuronx_latest_inference_transformer_version():
444-
return "4.34.1"
444+
return "4.36.2"
445445

446446

447447
@pytest.fixture(scope="module")

tests/unit/sagemaker/image_uris/test_huggingface_llm.py

+1
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,7 @@
3434
"inf2": {
3535
"0.0.16": "1.13.1-optimum0.0.16-neuronx-py310-ubuntu22.04",
3636
"0.0.17": "1.13.1-optimum0.0.17-neuronx-py310-ubuntu22.04",
37+
"0.0.18": "1.13.1-optimum0.0.18-neuronx-py310-ubuntu22.04",
3738
},
3839
}
3940

0 commit comments

Comments
 (0)