Skip to content

Commit 7b74cac

Browse files
committed
change: Updates for DJL 0.33.0 release
1 parent 40c791c commit 7b74cac

File tree

4 files changed

124 additions and 53 deletions (lines changed)

4 files changed

+124
-53
lines changed

src/sagemaker/huggingface/llm_utils.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -82,8 +82,8 @@ def get_huggingface_llm_image_uri(
8282
image_scope="inference",
8383
)
8484
if backend == "lmi":
85-
version = version or "0.24.0"
86-
return image_uris.retrieve(framework="djl-deepspeed", region=region, version=version)
85+
version = version or "0.33.0"
86+
return image_uris.retrieve(framework="djl-lmi", region=region, version=version)
8787
raise ValueError("Unsupported backend: %s" % backend)
8888

8989

src/sagemaker/image_uri_config/djl-lmi.json

Lines changed: 106 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -3,9 +3,114 @@
33
"inference"
44
],
55
"version_aliases": {
6-
"latest": "0.30.0"
6+
"latest": "0.33.0"
77
},
88
"versions": {
9+
"0.33.0": {
10+
"registries": {
11+
"af-south-1": "626614931356",
12+
"il-central-1": "780543022126",
13+
"ap-east-1": "871362719292",
14+
"ap-northeast-1": "763104351884",
15+
"ap-northeast-2": "763104351884",
16+
"ap-northeast-3": "364406365360",
17+
"ap-south-1": "763104351884",
18+
"ap-southeast-1": "763104351884",
19+
"ap-southeast-2": "763104351884",
20+
"ap-southeast-3": "907027046896",
21+
"ca-central-1": "763104351884",
22+
"cn-north-1": "727897471807",
23+
"cn-northwest-1": "727897471807",
24+
"eu-central-1": "763104351884",
25+
"eu-north-1": "763104351884",
26+
"eu-west-1": "763104351884",
27+
"eu-west-2": "763104351884",
28+
"eu-west-3": "763104351884",
29+
"eu-south-1": "692866216735",
30+
"me-south-1": "217643126080",
31+
"me-central-1": "914824155844",
32+
"sa-east-1": "763104351884",
33+
"us-east-1": "763104351884",
34+
"us-east-2": "763104351884",
35+
"us-gov-east-1": "446045086412",
36+
"us-gov-west-1": "442386744353",
37+
"us-west-1": "763104351884",
38+
"us-west-2": "763104351884",
39+
"ca-west-1": "204538143572"
40+
},
41+
"repository": "djl-inference",
42+
"tag_prefix": "0.33.0-lmi15.0.0-cu128"
43+
},
44+
"0.32.0": {
45+
"registries": {
46+
"af-south-1": "626614931356",
47+
"il-central-1": "780543022126",
48+
"ap-east-1": "871362719292",
49+
"ap-northeast-1": "763104351884",
50+
"ap-northeast-2": "763104351884",
51+
"ap-northeast-3": "364406365360",
52+
"ap-south-1": "763104351884",
53+
"ap-southeast-1": "763104351884",
54+
"ap-southeast-2": "763104351884",
55+
"ap-southeast-3": "907027046896",
56+
"ca-central-1": "763104351884",
57+
"cn-north-1": "727897471807",
58+
"cn-northwest-1": "727897471807",
59+
"eu-central-1": "763104351884",
60+
"eu-north-1": "763104351884",
61+
"eu-west-1": "763104351884",
62+
"eu-west-2": "763104351884",
63+
"eu-west-3": "763104351884",
64+
"eu-south-1": "692866216735",
65+
"me-south-1": "217643126080",
66+
"me-central-1": "914824155844",
67+
"sa-east-1": "763104351884",
68+
"us-east-1": "763104351884",
69+
"us-east-2": "763104351884",
70+
"us-gov-east-1": "446045086412",
71+
"us-gov-west-1": "442386744353",
72+
"us-west-1": "763104351884",
73+
"us-west-2": "763104351884",
74+
"ca-west-1": "204538143572"
75+
},
76+
"repository": "djl-inference",
77+
"tag_prefix": "0.32.0-lmi14.0.0-cu126"
78+
},
79+
"0.31.0": {
80+
"registries": {
81+
"af-south-1": "626614931356",
82+
"il-central-1": "780543022126",
83+
"ap-east-1": "871362719292",
84+
"ap-northeast-1": "763104351884",
85+
"ap-northeast-2": "763104351884",
86+
"ap-northeast-3": "364406365360",
87+
"ap-south-1": "763104351884",
88+
"ap-southeast-1": "763104351884",
89+
"ap-southeast-2": "763104351884",
90+
"ap-southeast-3": "907027046896",
91+
"ca-central-1": "763104351884",
92+
"cn-north-1": "727897471807",
93+
"cn-northwest-1": "727897471807",
94+
"eu-central-1": "763104351884",
95+
"eu-north-1": "763104351884",
96+
"eu-west-1": "763104351884",
97+
"eu-west-2": "763104351884",
98+
"eu-west-3": "763104351884",
99+
"eu-south-1": "692866216735",
100+
"me-south-1": "217643126080",
101+
"me-central-1": "914824155844",
102+
"sa-east-1": "763104351884",
103+
"us-east-1": "763104351884",
104+
"us-east-2": "763104351884",
105+
"us-gov-east-1": "446045086412",
106+
"us-gov-west-1": "442386744353",
107+
"us-west-1": "763104351884",
108+
"us-west-2": "763104351884",
109+
"ca-west-1": "204538143572"
110+
},
111+
"repository": "djl-inference",
112+
"tag_prefix": "0.31.0-lmi13.0.0-cu124"
113+
},
9114
"0.30.0": {
10115
"registries": {
11116
"af-south-1": "626614931356",

src/sagemaker/image_uri_config/djl-tensorrtllm.json

Lines changed: 11 additions & 45 deletions
Original file line number | Diff line number | Diff line change
@@ -3,44 +3,10 @@
33
"inference"
44
],
55
"version_aliases": {
6-
"latest": "0.30.0"
6+
"latest": "0.33.0"
77
},
88
"versions": {
9-
"0.30.0": {
10-
"registries": {
11-
"af-south-1": "626614931356",
12-
"il-central-1": "780543022126",
13-
"ap-east-1": "871362719292",
14-
"ap-northeast-1": "763104351884",
15-
"ap-northeast-2": "763104351884",
16-
"ap-northeast-3": "364406365360",
17-
"ap-south-1": "763104351884",
18-
"ap-southeast-1": "763104351884",
19-
"ap-southeast-2": "763104351884",
20-
"ap-southeast-3": "907027046896",
21-
"ca-central-1": "763104351884",
22-
"cn-north-1": "727897471807",
23-
"cn-northwest-1": "727897471807",
24-
"eu-central-1": "763104351884",
25-
"eu-north-1": "763104351884",
26-
"eu-west-1": "763104351884",
27-
"eu-west-2": "763104351884",
28-
"eu-west-3": "763104351884",
29-
"eu-south-1": "692866216735",
30-
"me-south-1": "217643126080",
31-
"sa-east-1": "763104351884",
32-
"us-east-1": "763104351884",
33-
"us-east-2": "763104351884",
34-
"us-gov-east-1": "446045086412",
35-
"us-gov-west-1": "442386744353",
36-
"us-west-1": "763104351884",
37-
"us-west-2": "763104351884",
38-
"ca-west-1": "204538143572"
39-
},
40-
"repository": "djl-inference",
41-
"tag_prefix": "0.30.0-tensorrtllm0.12.0-cu125"
42-
},
43-
"0.29.0": {
9+
"0.33.0": {
4410
"registries": {
4511
"af-south-1": "626614931356",
4612
"il-central-1": "780543022126",
@@ -72,9 +38,9 @@
7238
"ca-west-1": "204538143572"
7339
},
7440
"repository": "djl-inference",
75-
"tag_prefix": "0.29.0-tensorrtllm0.11.0-cu124"
41+
"tag_prefix": "0.33.0-tensorrtllm0.21.0-cu128"
7642
},
77-
"0.28.0": {
43+
"0.32.0": {
7844
"registries": {
7945
"af-south-1": "626614931356",
8046
"il-central-1": "780543022126",
@@ -106,9 +72,9 @@
10672
"ca-west-1": "204538143572"
10773
},
10874
"repository": "djl-inference",
109-
"tag_prefix": "0.28.0-tensorrtllm0.9.0-cu122"
75+
"tag_prefix": "0.32.0-tensorrtllm0.12.0-cu125"
11076
},
111-
"0.27.0": {
77+
"0.30.0": {
11278
"registries": {
11379
"af-south-1": "626614931356",
11480
"il-central-1": "780543022126",
@@ -140,9 +106,9 @@
140106
"ca-west-1": "204538143572"
141107
},
142108
"repository": "djl-inference",
143-
"tag_prefix": "0.27.0-tensorrtllm0.8.0-cu122"
109+
"tag_prefix": "0.30.0-tensorrtllm0.12.0-cu125"
144110
},
145-
"0.26.0": {
111+
"0.29.0": {
146112
"registries": {
147113
"af-south-1": "626614931356",
148114
"il-central-1": "780543022126",
@@ -174,9 +140,9 @@
174140
"ca-west-1": "204538143572"
175141
},
176142
"repository": "djl-inference",
177-
"tag_prefix": "0.26.0-tensorrtllm0.7.1-cu122"
143+
"tag_prefix": "0.29.0-tensorrtllm0.11.0-cu124"
178144
},
179-
"0.25.0": {
145+
"0.28.0": {
180146
"registries": {
181147
"af-south-1": "626614931356",
182148
"il-central-1": "780543022126",
@@ -208,7 +174,7 @@
208174
"ca-west-1": "204538143572"
209175
},
210176
"repository": "djl-inference",
211-
"tag_prefix": "0.25.0-tensorrtllm0.5.0-cu122"
177+
"tag_prefix": "0.28.0-tensorrtllm0.9.0-cu122"
212178
}
213179
}
214180
}

tests/unit/sagemaker/image_uris/test_huggingface_llm.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -18,7 +18,7 @@
1818
from sagemaker.huggingface import get_huggingface_llm_image_uri
1919
from tests.unit.sagemaker.image_uris import expected_uris, conftest
2020

21-
LMI_VERSIONS = ["0.24.0"]
21+
LMI_VERSIONS = ["0.33.0"]
2222
TEI_VERSIONS_MAPPING = {
2323
"gpu": {
2424
"1.2.3": "2.0.1-tei1.2.3-gpu-py310-cu122-ubuntu22.04",
@@ -141,15 +141,15 @@ def test_lmi_uris(load_config):
141141
ACCOUNTS = load_config["inference"]["versions"][version]["registries"]
142142
for region in ACCOUNTS.keys():
143143
for lmi_version in LMI_VERSIONS:
144-
djl_deepspeed_config = conftest.get_config("djl-deepspeed.json")
145-
DJL_DEEPSPEED_REGIONS = djl_deepspeed_config["versions"][lmi_version][
144+
djl_lmi_config = conftest.get_config("djl-lmi.json")
145+
DJL_LMI_REGIONS = djl_lmi_config["versions"][lmi_version][
146146
"registries"
147147
].keys()
148-
if region not in DJL_DEEPSPEED_REGIONS:
148+
if region not in DJL_LMI_REGIONS:
149149
continue
150150

151151
uri = get_huggingface_llm_image_uri("lmi", region=region, version=lmi_version)
152-
tag = djl_deepspeed_config["versions"][lmi_version]["tag_prefix"]
152+
tag = djl_lmi_config["versions"][lmi_version]["tag_prefix"]
153153

154154
expected = expected_uris.djl_framework_uri(
155155
"djl-inference", ACCOUNTS[region], tag, region=region

0 commit comments

Comments
 (0)