Skip to content

Commit 122ea28

Browse files
malav-shastri and malavhs authored and root committed
feat: Add support for TGI Neuronx 0.0.27 and HF PT 2.3.0 image in PySDK (aws#5050)
Co-authored-by: malavhs <[email protected]>
1 parent dfad50d commit 122ea28

File tree

3 files changed, with 88 additions and 1 deletion.

src/sagemaker/image_uri_config/huggingface-llm-neuronx.json

Lines changed: 35 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,7 +4,7 @@
44
"inf2"
55
],
66
"version_aliases": {
7-
"0.0": "0.0.25"
7+
"0.0": "0.0.27"
88
},
99
"versions": {
1010
"0.0.16": {
@@ -364,6 +364,40 @@
364364
"container_version": {
365365
"inf2": "ubuntu22.04"
366366
}
367+
},
368+
"0.0.27": {
369+
"py_versions": [
370+
"py310"
371+
],
372+
"registries": {
373+
"ap-northeast-1": "763104351884",
374+
"ap-south-1": "763104351884",
375+
"ap-south-2": "772153158452",
376+
"ap-southeast-1": "763104351884",
377+
"ap-southeast-2": "763104351884",
378+
"ap-southeast-4": "457447274322",
379+
"ap-southeast-5": "550225433462",
380+
"cn-north-1": "727897471807",
381+
"cn-northwest-1": "727897471807",
382+
"eu-central-1": "763104351884",
383+
"eu-central-2": "380420809688",
384+
"eu-south-2": "503227376785",
385+
"eu-west-1": "763104351884",
386+
"eu-west-3": "763104351884",
387+
"il-central-1": "780543022126",
388+
"sa-east-1": "763104351884",
389+
"us-east-1": "763104351884",
390+
"us-east-2": "763104351884",
391+
"us-gov-east-1": "446045086412",
392+
"us-gov-west-1": "442386744353",
393+
"us-west-2": "763104351884",
394+
"ca-west-1": "204538143572"
395+
},
396+
"tag_prefix": "2.1.2-optimum0.0.27",
397+
"repository": "huggingface-pytorch-tgi-inference",
398+
"container_version": {
399+
"inf2": "ubuntu22.04"
400+
}
367401
}
368402
}
369403
}

src/sagemaker/image_uri_config/huggingface.json

Lines changed: 52 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1931,6 +1931,58 @@
19311931
"cpu": "ubuntu22.04"
19321932
}
19331933
}
1934+
},
1935+
"4.48.0": {
1936+
"version_aliases": {
1937+
"pytorch2.3": "pytorch2.3.0"
1938+
},
1939+
"pytorch2.3.0": {
1940+
"py_versions": [
1941+
"py311"
1942+
],
1943+
"registries": {
1944+
"af-south-1": "626614931356",
1945+
"il-central-1": "780543022126",
1946+
"ap-east-1": "871362719292",
1947+
"ap-northeast-1": "763104351884",
1948+
"ap-northeast-2": "763104351884",
1949+
"ap-northeast-3": "364406365360",
1950+
"ap-south-1": "763104351884",
1951+
"ap-south-2": "772153158452",
1952+
"ap-southeast-1": "763104351884",
1953+
"ap-southeast-2": "763104351884",
1954+
"ap-southeast-3": "907027046896",
1955+
"ap-southeast-4": "457447274322",
1956+
"ca-central-1": "763104351884",
1957+
"cn-north-1": "727897471807",
1958+
"cn-northwest-1": "727897471807",
1959+
"eu-central-1": "763104351884",
1960+
"eu-central-2": "380420809688",
1961+
"eu-north-1": "763104351884",
1962+
"eu-west-1": "763104351884",
1963+
"eu-west-2": "763104351884",
1964+
"eu-west-3": "763104351884",
1965+
"eu-south-1": "692866216735",
1966+
"eu-south-2": "503227376785",
1967+
"me-south-1": "217643126080",
1968+
"me-central-1": "914824155844",
1969+
"sa-east-1": "763104351884",
1970+
"us-east-1": "763104351884",
1971+
"us-east-2": "763104351884",
1972+
"us-gov-east-1": "446045086412",
1973+
"us-gov-west-1": "442386744353",
1974+
"us-iso-east-1": "886529160074",
1975+
"us-isob-east-1": "094389454867",
1976+
"us-west-1": "763104351884",
1977+
"us-west-2": "763104351884",
1978+
"ca-west-1": "204538143572"
1979+
},
1980+
"repository": "huggingface-pytorch-inference",
1981+
"container_version": {
1982+
"gpu": "cu121-ubuntu22.04",
1983+
"cpu": "ubuntu22.04"
1984+
}
1985+
}
19341986
}
19351987
}
19361988
}

tests/unit/sagemaker/image_uris/test_huggingface_llm.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -60,6 +60,7 @@
6060
"0.0.23": "2.1.2-optimum0.0.23-neuronx-py310-ubuntu22.04",
6161
"0.0.24": "2.1.2-optimum0.0.24-neuronx-py310-ubuntu22.04",
6262
"0.0.25": "2.1.2-optimum0.0.25-neuronx-py310-ubuntu22.04",
63+
"0.0.27": "2.1.2-optimum0.0.27-neuronx-py310-ubuntu22.04",
6364
},
6465
}
6566

0 commit comments

Comments
 (0)