File tree Expand file tree Collapse file tree 1 file changed +4
-3
lines changed Expand file tree Collapse file tree 1 file changed +4
-3
lines changed Original file line number Diff line number Diff line change 1
1
# default base image
2
2
# https://gallery.ecr.aws/neuron/pytorch-inference-neuronx
3
- ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.5.1-neuronx-py310-sdk2.22.0-ubuntu22.04"
3
+ ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.6.0-neuronx-py310-sdk2.23.0-ubuntu22.04"
4
4
5
5
FROM $BASE_IMAGE
6
6
@@ -22,8 +22,7 @@ WORKDIR ${APP_MOUNT}/vllm
22
22
23
23
RUN python3 -m pip install --upgrade pip
24
24
RUN python3 -m pip install --no-cache-dir fastapi ninja tokenizers pandas tenacity
25
- RUN python3 -m pip install sentencepiece transformers==4.48.0 -U
26
- RUN python3 -m pip install neuronx-cc==2.17.194.0 --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
25
+ RUN python3 -m pip install neuronx-cc==2.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
27
26
RUN python3 -m pip install pytest
28
27
29
28
# uninstall transformers-neuronx package explicitly to avoid version conflict
@@ -49,6 +48,8 @@ RUN python3 -m pip install -e tests/vllm_test_utils
49
48
# FIXME: `--no-deps` argument is temporarily added to resolve transformers package version conflict
50
49
RUN python3 -m pip install transformers-neuronx==0.13.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U --no-deps
51
50
51
+ RUN python3 -m pip install sentencepiece transformers==4.48.0 -U
52
+
52
53
# overwrite entrypoint to run bash script
53
54
RUN echo "import subprocess; import sys; subprocess.check_call(sys.argv[1:])" > /usr/local/bin/dockerd-entrypoint.py
54
55
You can’t perform that action at this time.
0 commit comments