Skip to content

Commit dc0860d

Browse files
authored
release: huggingface tgi neuronx 0.0.25 image (#4893)
* release: huggingface tgi neuronx 0.0.25 image
* tests
* add tgi 2.3.1
* update default version
* update py version
* fix tests
* test
* Revert "fix tests"
  This reverts commit 9374c75.
* Revert "Revert "fix tests""
  This reverts commit 20d46d1.
* Revert "test"
  This reverts commit 90f6e0b.
1 parent c0d50ef commit dc0860d

File tree

3 files changed

+84
-2
lines changed

3 files changed

+84
-2
lines changed

src/sagemaker/image_uri_config/huggingface-llm-neuronx.json

Lines changed: 34 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
"inf2"
55
],
66
"version_aliases": {
7-
"0.0": "0.0.24"
7+
"0.0": "0.0.25"
88
},
99
"versions": {
1010
"0.0.16": {
@@ -301,6 +301,39 @@
301301
"container_version": {
302302
"inf2": "ubuntu22.04"
303303
}
304+
},
305+
"0.0.25": {
306+
"py_versions": [
307+
"py310"
308+
],
309+
"registries": {
310+
"ap-northeast-1": "763104351884",
311+
"ap-south-1": "763104351884",
312+
"ap-south-2": "772153158452",
313+
"ap-southeast-1": "763104351884",
314+
"ap-southeast-2": "763104351884",
315+
"ap-southeast-4": "457447274322",
316+
"cn-north-1": "727897471807",
317+
"cn-northwest-1": "727897471807",
318+
"eu-central-1": "763104351884",
319+
"eu-central-2": "380420809688",
320+
"eu-south-2": "503227376785",
321+
"eu-west-1": "763104351884",
322+
"eu-west-3": "763104351884",
323+
"il-central-1": "780543022126",
324+
"sa-east-1": "763104351884",
325+
"us-east-1": "763104351884",
326+
"us-east-2": "763104351884",
327+
"us-gov-east-1": "446045086412",
328+
"us-gov-west-1": "442386744353",
329+
"us-west-2": "763104351884",
330+
"ca-west-1": "204538143572"
331+
},
332+
"tag_prefix": "2.1.2-optimum0.0.25",
333+
"repository": "huggingface-pytorch-tgi-inference",
334+
"container_version": {
335+
"inf2": "ubuntu22.04"
336+
}
304337
}
305338
}
306339
}

src/sagemaker/image_uri_config/huggingface-llm.json

Lines changed: 48 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -12,7 +12,7 @@
1212
"1.2": "1.2.0",
1313
"1.3": "1.3.3",
1414
"1.4": "1.4.5",
15-
"2.0": "2.2.0"
15+
"2.0": "2.3.1"
1616
},
1717
"versions": {
1818
"0.6.0": {
@@ -719,6 +719,53 @@
719719
"container_version": {
720720
"gpu": "cu121-ubuntu22.04-v2.0"
721721
}
722+
},
723+
"2.3.1": {
724+
"py_versions": [
725+
"py311"
726+
],
727+
"registries": {
728+
"af-south-1": "626614931356",
729+
"il-central-1": "780543022126",
730+
"ap-east-1": "871362719292",
731+
"ap-northeast-1": "763104351884",
732+
"ap-northeast-2": "763104351884",
733+
"ap-northeast-3": "364406365360",
734+
"ap-south-1": "763104351884",
735+
"ap-south-2": "772153158452",
736+
"ap-southeast-1": "763104351884",
737+
"ap-southeast-2": "763104351884",
738+
"ap-southeast-3": "907027046896",
739+
"ap-southeast-4": "457447274322",
740+
"ca-central-1": "763104351884",
741+
"cn-north-1": "727897471807",
742+
"cn-northwest-1": "727897471807",
743+
"eu-central-1": "763104351884",
744+
"eu-central-2": "380420809688",
745+
"eu-north-1": "763104351884",
746+
"eu-west-1": "763104351884",
747+
"eu-west-2": "763104351884",
748+
"eu-west-3": "763104351884",
749+
"eu-south-1": "692866216735",
750+
"eu-south-2": "503227376785",
751+
"me-south-1": "217643126080",
752+
"me-central-1": "914824155844",
753+
"sa-east-1": "763104351884",
754+
"us-east-1": "763104351884",
755+
"us-east-2": "763104351884",
756+
"us-gov-east-1": "446045086412",
757+
"us-gov-west-1": "442386744353",
758+
"us-iso-east-1": "886529160074",
759+
"us-isob-east-1": "094389454867",
760+
"us-west-1": "763104351884",
761+
"us-west-2": "763104351884",
762+
"ca-west-1": "204538143572"
763+
},
764+
"tag_prefix": "2.4.0-tgi2.3.1",
765+
"repository": "huggingface-pytorch-tgi-inference",
766+
"container_version": {
767+
"gpu": "cu124-ubuntu22.04"
768+
}
722769
}
723770
}
724771
}

tests/unit/sagemaker/image_uris/test_huggingface_llm.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -45,6 +45,7 @@
4545
"2.0.1": "2.1.1-tgi2.0.1-gpu-py310-cu121-ubuntu22.04",
4646
"2.0.2": "2.3.0-tgi2.0.2-gpu-py310-cu121-ubuntu22.04",
4747
"2.2.0": "2.3.0-tgi2.2.0-gpu-py310-cu121-ubuntu22.04-v2.0",
48+
"2.3.1": "2.4.0-tgi2.3.1-gpu-py311-cu124-ubuntu22.04",
4849
},
4950
"inf2": {
5051
"0.0.16": "1.13.1-optimum0.0.16-neuronx-py310-ubuntu22.04",
@@ -56,6 +57,7 @@
5657
"0.0.22": "2.1.2-optimum0.0.22-neuronx-py310-ubuntu22.04",
5758
"0.0.23": "2.1.2-optimum0.0.23-neuronx-py310-ubuntu22.04",
5859
"0.0.24": "2.1.2-optimum0.0.24-neuronx-py310-ubuntu22.04",
60+
"0.0.25": "2.1.2-optimum0.0.25-neuronx-py310-ubuntu22.04",
5961
},
6062
}
6163

0 commit comments

Comments
 (0)