Skip to content

Commit e2d7d31

Browse files
[Neuron] Update Dockerfile.neuron to use latest neuron release (2.23) (#18512)
Signed-off-by: Satyajith Chilappagari <satchill@amazon.com>
1 parent: 23b67b3 · commit: e2d7d31

File tree

1 file changed

+4
-3
lines changed

1 file changed

+4
-3
lines changed

docker/Dockerfile.neuron

Lines changed: 4 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
# default base image
22
# https://gallery.ecr.aws/neuron/pytorch-inference-neuronx
3-
ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.5.1-neuronx-py310-sdk2.22.0-ubuntu22.04"
3+
ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.6.0-neuronx-py310-sdk2.23.0-ubuntu22.04"
44

55
FROM $BASE_IMAGE
66

@@ -22,8 +22,7 @@ WORKDIR ${APP_MOUNT}/vllm
2222

2323
RUN python3 -m pip install --upgrade pip
2424
RUN python3 -m pip install --no-cache-dir fastapi ninja tokenizers pandas tenacity
25-
RUN python3 -m pip install sentencepiece transformers==4.48.0 -U
26-
RUN python3 -m pip install neuronx-cc==2.17.194.0 --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
25+
RUN python3 -m pip install neuronx-cc==2.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
2726
RUN python3 -m pip install pytest
2827

2928
# uninstall transformers-neuronx package explicitly to avoid version conflict
@@ -49,6 +48,8 @@ RUN python3 -m pip install -e tests/vllm_test_utils
4948
# FIXME: `--no-deps` argument is temporarily added to resolve transformers package version conflict
5049
RUN python3 -m pip install transformers-neuronx==0.13.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U --no-deps
5150

51+
RUN python3 -m pip install sentencepiece transformers==4.48.0 -U
52+
5253
# overwrite entrypoint to run bash script
5354
RUN echo "import subprocess; import sys; subprocess.check_call(sys.argv[1:])" > /usr/local/bin/dockerd-entrypoint.py
5455

0 commit comments

Comments
 (0)