Skip to content

Commit 628ec6c

Browse files
authored
[Docker] bump up neuron sdk v2.21 (#11593)
Signed-off-by: Liangfu Chen <liangfc@amazon.com>
1 parent 3682e33 commit 628ec6c

File tree

4 files changed

+6
-8
lines changed

4 files changed

+6
-8
lines changed

Dockerfile.neuron

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -1,6 +1,6 @@
11
# default base image
22
# https://gallery.ecr.aws/neuron/pytorch-inference-neuronx
3-
ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.1.2-neuronx-py310-sdk2.20.2-ubuntu20.04"
3+
ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.5.1-neuronx-py310-sdk2.21.0-ubuntu22.04"
44

55
FROM $BASE_IMAGE
66

@@ -22,9 +22,9 @@ WORKDIR ${APP_MOUNT}/vllm
2222

2323
RUN python3 -m pip install --upgrade pip
2424
RUN python3 -m pip install --no-cache-dir fastapi ninja tokenizers pandas
25-
RUN python3 -m pip install sentencepiece transformers==4.36.2 -U
25+
RUN python3 -m pip install sentencepiece transformers==4.45.2 -U
2626
RUN python3 -m pip install transformers-neuronx --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
27-
RUN python3 -m pip install --pre neuronx-cc==2.15.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
27+
RUN python3 -m pip install neuronx-cc==2.16.345.0 --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
2828

2929
COPY . .
3030
ARG GIT_REPO_CHECK=0

requirements-neuron.txt

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2,6 +2,6 @@
22
-r requirements-common.txt
33

44
# Dependencies for Neuron devices
5-
transformers-neuronx >= 0.12.0
6-
torch-neuronx >= 2.1.2
5+
transformers-neuronx >= 0.13.0
6+
torch-neuronx >= 2.5.0
77
neuronx-cc

vllm/_custom_ops.py

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -23,8 +23,7 @@
2323
import vllm._moe_C # noqa: F401
2424
supports_moe_ops = True
2525

26-
# neuron has torch version that doesn't even have impl_abstract
27-
if TYPE_CHECKING or current_platform.is_neuron():
26+
if TYPE_CHECKING:
2827

2928
def register_fake(fn):
3029
return lambda name: fn

vllm/triton_utils/importing.py

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -8,7 +8,6 @@
88
HAS_TRITON = (
99
find_spec("triton") is not None
1010
and not current_platform.is_xpu() # Not compatible
11-
and not current_platform.is_neuron() # neuron has too old torch
1211
)
1312

1413
if not HAS_TRITON:

0 commit comments

Comments
 (0)