File tree Expand file tree Collapse file tree 4 files changed +6
-8
lines changed Expand file tree Collapse file tree 4 files changed +6
-8
lines changed Original file line number Diff line number Diff line change 1
1
# default base image
2
2
# https://gallery.ecr.aws/neuron/pytorch-inference-neuronx
3
- ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.1.2-neuronx-py310-sdk2.20.2-ubuntu20.04"
3
+ ARG BASE_IMAGE="public.ecr.aws/neuron/pytorch-inference-neuronx:2.5.1-neuronx-py310-sdk2.21.0-ubuntu22.04"
4
4
5
5
FROM $BASE_IMAGE
6
6
@@ -22,9 +22,9 @@ WORKDIR ${APP_MOUNT}/vllm
22
22
23
23
RUN python3 -m pip install --upgrade pip
24
24
RUN python3 -m pip install --no-cache-dir fastapi ninja tokenizers pandas
25
- RUN python3 -m pip install sentencepiece transformers==4.36.2 -U
25
+ RUN python3 -m pip install sentencepiece transformers==4.45.2 -U
26
26
RUN python3 -m pip install transformers-neuronx --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
27
- RUN python3 -m pip install --pre neuronx-cc==2.15.* --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
27
+ RUN python3 -m pip install neuronx-cc==2.16.345.0 --extra-index-url=https://pip.repos.neuron.amazonaws.com -U
28
28
29
29
COPY . .
30
30
ARG GIT_REPO_CHECK=0
Original file line number Diff line number Diff line change 2
2
-r requirements-common.txt
3
3
4
4
# Dependencies for Neuron devices
5
- transformers-neuronx >= 0.12.0
6
- torch-neuronx >= 2.1.2
5
+ transformers-neuronx >= 0.13.0
6
+ torch-neuronx >= 2.5.0
7
7
neuronx-cc
Original file line number Diff line number Diff line change 23
23
import vllm._moe_C # noqa: F401
24
24
supports_moe_ops = True
25
25
26
- # neuron has torch version that doesn't even have impl_abstract
27
- if TYPE_CHECKING or current_platform.is_neuron():
26
+ if TYPE_CHECKING:
28
27
29
28
def register_fake(fn):
30
29
return lambda name: fn
Original file line number Diff line number Diff line change 8
8
HAS_TRITON = (
9
9
find_spec("triton") is not None
10
10
and not current_platform.is_xpu() # Not compatible
11
- and not current_platform.is_neuron() # neuron has too old torch
12
11
)
13
12
14
13
if not HAS_TRITON:
You can’t perform that action at this time.
0 commit comments