Skip to content

Commit 90cdb78

Browse files
authored
Merge branch 'aws:master' into master
2 parents 2591a24 + 1074667 commit 90cdb78

27 files changed

+466
-239
lines changed

available_images.md

Lines changed: 1 addition & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -329,10 +329,6 @@ Prior EC2 Framework Container Versions
329329
| PyTorch 2.3.0 |training |No |GPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-training:2.3.0-gpu-py311-cu121-ubuntu20.04-ec2 |
330330
| PyTorch 2.3.0 |inference |No |CPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.3.0-cpu-py311-ubuntu20.04-ec2 |
331331
| PyTorch 2.3.0 |inference |No |GPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.3.0-gpu-py311-cu121-ubuntu20.04-ec2 |
332-
| PyTorch 2.2.0 |training |No |CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-training:2.2.0-cpu-py310-ubuntu20.04-ec2 |
333-
| PyTorch 2.2.0 |training |No |GPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-training:2.2.0-gpu-py310-cu121-ubuntu20.04-ec2 |
334-
| PyTorch 2.2.0 |inference |No |CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.2.0-cpu-py310-ubuntu20.04-ec2 |
335-
| PyTorch 2.2.0 |inference |No |GPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.2.0-gpu-py310-cu118-ubuntu20.04-ec2 |
336332
| TensorFlow 2.16.2 |training |No |CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/tensorflow-training:2.16.2-cpu-py310-ubuntu20.04-ec2 |
337333
| TensorFlow 2.16.2 |training |No |GPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/tensorflow-training:2.16.2-gpu-py310-cu123-ubuntu20.04-ec2 |
338334
| TensorFlow 2.16.1 |inference |No |CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/tensorflow-inference:2.16.1-cpu-py310-ubuntu20.04-ec2 |
@@ -350,10 +346,6 @@ Prior SageMaker Framework Container Versions
350346
| PyTorch 2.3.0 | training | No | GPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-training:2.3.0-gpu-py311-cu121-ubuntu20.04-sagemaker |
351347
| PyTorch 2.3.0 | inference | No | CPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.3.0-cpu-py311-ubuntu20.04-sagemaker |
352348
| PyTorch 2.3.0 | inference | No | GPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.3.0-gpu-py311-cu121-ubuntu20.04-sagemaker |
353-
| PyTorch 2.2.0 | training | No | CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-training:2.2.0-cpu-py310-ubuntu20.04-sagemaker |
354-
| PyTorch 2.2.0 | training | No | GPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-training:2.2.0-gpu-py310-cu121-ubuntu20.04-sagemaker |
355-
| PyTorch 2.2.0 | inference | No | CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.2.0-cpu-py310-ubuntu20.04-sagemaker |
356-
| PyTorch 2.2.0 | inference | No | GPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference:2.2.0-gpu-py310-cu118-ubuntu20.04-sagemaker |
357349
| TensorFlow 2.16.2 | training | No | CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/tensorflow-training:2.16.2-cpu-py310-ubuntu20.04-sagemaker |
358350
| TensorFlow 2.16.2 | training | No | GPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/tensorflow-training:2.16.2-gpu-py310-cu123-ubuntu20.04-sagemaker |
359351
| TensorFlow 2.16.1 | inference | No | CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/tensorflow-inference:2.16.1-cpu-py310-ubuntu20.04-sagemaker |
@@ -366,15 +358,13 @@ Prior EC2 Framework ARM64/Graviton Containers
366358
| PyTorch 2.4.0 |inference |No |CPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.4.0-cpu-py311-ubuntu22.04-ec2 |
367359
| PyTorch 2.4.0 |inference |No |GPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.4.0-gpu-py311-cu124-ubuntu22.04-ec2 |
368360
| PyTorch 2.3.0 |inference |No |CPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.3.0-cpu-py311-ubuntu20.04-ec2 |
369-
| PyTorch 2.2.1 |inference |No |CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.2.1-cpu-py310-ubuntu20.04-ec2 |
370361

371362
Prior SageMaker Framework ARM64/Graviton Containers
372363
============================
373364
| Framework |Job Type |Horovod Options|CPU/GPU |Python Version Options |Example URL |
374365
|-------------------|-----------|---------------|-----------|-----------------------|---------------------------------------------------------------------------------------------------|
375366
| PyTorch 2.4.0 | inference | No | CPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.4.0-cpu-py311-ubuntu22.04-sagemaker |
376367
| PyTorch 2.3.0 | inference | No | CPU | 3.11 (py311) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.3.0-cpu-py311-ubuntu20.04-sagemaker |
377-
| PyTorch 2.2.1 | inference | No | CPU | 3.10 (py310) | 763104351884.dkr.ecr.us-east-1.amazonaws.com/pytorch-inference-graviton:2.2.1-cpu-py310-ubuntu20.04-sagemaker |
378368

379369
Prior AutoGluon Training Containers
380370
===============================
@@ -395,7 +385,7 @@ Prior AutoGluon Inference Containers
395385
Prior SageMaker Training Compiler Containers
396386
===============================
397387

398-
| Framework |Job Type |CPU/GPU |Python Version Options |Example URL |
388+
| Framework |Job Type |CPU/GPU |Python Version Options |Example URL |
399389
|-----------------------------------------------|-----------|-----------|-----------------------|---------------------------------------------------------------------------------------------------|
400390
|TensorFlow 2.6.3 with HuggingFace transformers 4.17.0 and SageMaker Training Compiler |training |GPU | 3.8 (py38) |763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-tensorflow-trcomp-training:2.6.3-transformers4.17.0-gpu-py38-cu112-ubuntu20.04 |
401391
|PyTorch 1.12.0 with SageMaker Training Compiler |training |GPU | 3.8 (py38) |763104351884.dkr.ecr.us-west-2.amazonaws.com/pytorch-trcomp-training:1.12.0-gpu-py38-cu113-ubuntu20.04-sagemaker |

huggingface/pytorch/inference/buildspec.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ images:
3535
python_version: &DOCKER_PYTHON_VERSION py3
3636
tag_python_version: &TAG_PYTHON_VERSION py311
3737
os_version: &OS_VERSION ubuntu22.04
38-
transformers_version: &TRANSFORMERS_VERSION 4.46.1
38+
transformers_version: &TRANSFORMERS_VERSION 4.48.0
3939
tag: !join [ *VERSION, '-', 'transformers', *TRANSFORMERS_VERSION, '-', *DEVICE_TYPE, '-', *TAG_PYTHON_VERSION, '-', *OS_VERSION ]
4040
docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /Dockerfile., *DEVICE_TYPE ]
4141
context:
@@ -48,8 +48,8 @@ images:
4848
python_version: &DOCKER_PYTHON_VERSION py3
4949
tag_python_version: &TAG_PYTHON_VERSION py311
5050
cuda_version: &CUDA_VERSION cu121
51-
os_version: &OS_VERSION ubuntu20.04
52-
transformers_version: &TRANSFORMERS_VERSION 4.46.1
51+
os_version: &OS_VERSION ubuntu22.04
52+
transformers_version: &TRANSFORMERS_VERSION 4.48.0
5353
tag: !join [ *VERSION, '-', 'transformers', *TRANSFORMERS_VERSION, '-', *DEVICE_TYPE, '-', *TAG_PYTHON_VERSION, '-',
5454
*CUDA_VERSION, '-', *OS_VERSION ]
5555
docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /,

huggingface/pytorch/inference/docker/2.3/py3/Dockerfile.cpu

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,13 +1,13 @@
11
FROM ubuntu:22.04 AS base_image
22

33
LABEL maintainer="Amazon AI"
4-
LABEL dlc_major_version="1"
4+
LABEL dlc_major_version="2"
55
LABEL com.amazonaws.sagemaker.capabilities.accept-bind-to-port=true
66
LABEL com.amazonaws.sagemaker.capabilities.multi-models=true
77

88
ARG PYTHON=python3
99
ARG PYTHON_VERSION=3.11.9
10-
ARG MINIFORGE3_VERSION=23.11.0-0
10+
ARG MINIFORGE3_VERSION=24.11.0-0
1111
ARG OPEN_MPI_VERSION=4.1.5
1212
ARG MMS_VERSION=1.1.11
1313

huggingface/pytorch/inference/docker/2.3/py3/cu121/Dockerfile.gpu

Lines changed: 3 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,15 @@
1-
FROM nvidia/cuda:12.1.1-base-ubuntu20.04 AS base_image
1+
FROM nvidia/cuda:12.1.1-base-ubuntu22.04 AS base_image
22

33
LABEL maintainer="Amazon AI"
4-
LABEL dlc_major_version="1"
4+
LABEL dlc_major_version="2"
55
LABEL com.amazonaws.sagemaker.capabilities.accept-bind-to-port=true
66
LABEL com.amazonaws.sagemaker.capabilities.multi-models=true
77
LABEL com.amazonaws.sagemaker.inference.cuda.verified_versions=12.2
88

99
ARG MMS_VERSION=1.1.11
1010
ARG PYTHON=python3
1111
ARG PYTHON_VERSION=3.11.9
12-
ARG MINIFORGE3_VERSION=23.11.0-0
12+
ARG MINIFORGE3_VERSION=24.11.0-0
1313
ARG OPEN_MPI_VERSION=4.1.5
1414

1515
# Nvidia software versions
@@ -85,7 +85,6 @@ RUN apt-get update \
8585
libnuma1 \
8686
libnuma-dev \
8787
libsm6 \
88-
libssl1.1 \
8988
libssl-dev \
9089
libxext6 \
9190
libxrender-dev \

huggingface/pytorch/training/buildspec-neuronx.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -36,7 +36,7 @@ images:
3636
tag_python_version: &TAG_PYTHON_VERSION py310
3737
neuron_sdk_version: &NEURON_SDK_VERSION sdk2.20.0
3838
os_version: &OS_VERSION ubuntu20.04
39-
transformers_version: &TRANSFORMERS_VERSION 4.43.2
39+
transformers_version: &TRANSFORMERS_VERSION 4.48.1
4040
datasets_version: &DATASETS_VERSION 2.18.0
4141
tag: !join [ *VERSION, '-', 'transformers', *TRANSFORMERS_VERSION, '-', *DEVICE_TYPE, '-', *TAG_PYTHON_VERSION,"-", *NEURON_SDK_VERSION, '-', *OS_VERSION ]
4242
docker_file: !join [ docker/, *SHORT_VERSION, /, *DOCKER_PYTHON_VERSION, /, *NEURON_SDK_VERSION, /Dockerfile., *DEVICE_TYPE ]

huggingface/pytorch/training/buildspec.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -24,7 +24,7 @@ images:
2424
tag_python_version: &TAG_PYTHON_VERSION py311
2525
cuda_version: &CUDA_VERSION cu121
2626
os_version: &OS_VERSION ubuntu20.04
27-
transformers_version: &TRANSFORMERS_VERSION 4.46.1
27+
transformers_version: &TRANSFORMERS_VERSION 4.48.0
2828
datasets_version: &DATASETS_VERSION 3.1.0
2929
tag: !join [ *VERSION, '-', 'transformers', *TRANSFORMERS_VERSION, '-', *DEVICE_TYPE, '-', *TAG_PYTHON_VERSION, '-',
3030
*CUDA_VERSION, '-', *OS_VERSION ]

huggingface/pytorch/training/docker/2.1/py3/sdk2.20.0/Dockerfile.neuronx

Lines changed: 7 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -4,17 +4,21 @@
44
# docker image region us-west-2
55
FROM 763104351884.dkr.ecr.us-west-2.amazonaws.com/pytorch-training-neuronx:2.1.2-neuronx-py310-sdk2.20.0-ubuntu20.04
66

7-
87
LABEL maintainer="Amazon AI"
9-
LABEL dlc_major_version="1"
8+
LABEL dlc_major_version="2"
109

1110
# version args
12-
ARG OPTIMUM_NEURON_VERSION=0.0.25
11+
ARG OPTIMUM_NEURON_VERSION=0.0.28
1312
ARG TRANSFORMERS_VERSION
1413
ARG DATASETS_VERSION
1514
ARG GEVENT_VERSION=24.10.3
1615
ARG PYTHON=python3
1716

17+
RUN apt-get remove -y --purge emacs && \
18+
apt-get autoremove -y
19+
20+
RUN pip install --upgrade pip
21+
1822
# install Hugging Face libraries and their dependencies
1923
RUN pip install --no-cache-dir \
2024
"sagemaker==2.232.2" \

huggingface/pytorch/training/docker/2.3/py3/cu121/Dockerfile.gpu

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,11 @@
44
# docker image region us-west-2
55
FROM 763104351884.dkr.ecr.us-west-2.amazonaws.com/pytorch-training:2.3.0-gpu-py311-cu121-ubuntu20.04-sagemaker
66

7+
RUN apt-get remove -y --purge emacs && \
8+
apt-get autoremove -y
9+
710
LABEL maintainer="Amazon AI"
8-
LABEL dlc_major_version="1"
11+
LABEL dlc_major_version="2"
912

1013
# version args
1114
ARG TRANSFORMERS_VERSION
@@ -17,10 +20,11 @@ ARG ACCELERATE_VERSION=1.1.0
1720
ARG TRL_VERSION=0.11.4
1821
ARG PEFT_VERSION=0.13.2
1922
ARG FLASH_ATTN_VERSION=2.6.3
23+
ARG NINJA_VERSION=1.11.1
2024
ARG PYTHON=python3
2125

2226
# TODO: Remove when the base image is updated
23-
RUN pip install --upgrade "pip==24.1.2" \
27+
RUN pip install --upgrade pip \
2428
&& pip uninstall -y transformer-engine flash-attn pyarrow cryptography \
2529
&& pip install --no-cache-dir -U pyarrow cryptography pyopenssl Pillow \
2630
&& pip --no-cache-dir install --upgrade wheel setuptools \
@@ -38,6 +42,7 @@ RUN pip install --no-cache-dir \
3842
bitsandbytes \
3943
evaluate==${EVALUATE_VERSION} \
4044
accelerate==${ACCELERATE_VERSION} \
45+
ninja==${NINJA_VERSION} \
4146
trl==${TRL_VERSION} \
4247
peft==${PEFT_VERSION} \
4348
flash-attn==${FLASH_ATTN_VERSION}

release_images_inference.yml

Lines changed: 16 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -149,11 +149,11 @@ release_images:
149149
framework: "huggingface_pytorch"
150150
version: "2.3.0"
151151
arch_type: "x86"
152-
hf_transformers: "4.46.1"
152+
hf_transformers: "4.48.0"
153153
inference:
154154
device_types: ["gpu" ]
155155
python_versions: [ "py311" ]
156-
os_version: "ubuntu20.04"
156+
os_version: "ubuntu22.04"
157157
cuda_version: "cu121"
158158
example: False
159159
disable_sm_tag: True
@@ -162,11 +162,24 @@ release_images:
162162
framework: "huggingface_pytorch"
163163
version: "2.3.0"
164164
arch_type: "x86"
165-
hf_transformers: "4.46.1"
165+
hf_transformers: "4.48.0"
166166
inference:
167167
device_types: [ "cpu" ]
168168
python_versions: [ "py311" ]
169169
os_version: "ubuntu22.04"
170170
example: False
171171
disable_sm_tag: True
172172
force_release: False
173+
14:
174+
framework: "djl"
175+
version: "0.32.0"
176+
arch_type: "x86"
177+
inference:
178+
device_types: [ "gpu" ]
179+
python_versions: [ "py312" ]
180+
os_version: "ubuntu22.04"
181+
lmi_version: "14.0.0"
182+
cuda_version: "cu124"
183+
example: False
184+
disable_sm_tag: True
185+
force_release: False

0 commit comments

Comments
 (0)