2
2
# SPDX-License-Identifier: Apache-2.0
3
3
4
4
# ======== Base Stage ========
5
- FROM intel/deep-learning-essentials:2025.1.3-0-devel-ubuntu24.04 AS vllm-base
5
+ # Platform base image for the vllm-base stage, pinned to tag 25.38.4.1.
+ FROM amr-registry.caas.intel.com/intelanalytics/llm-scaler-platform:25.38.4.1 AS vllm-base
6
6
7
7
# Build-time argument with no default value; presumably carries the HTTPS proxy
# needed for network access during the build — confirm against the build scripts.
ARG https_proxy
8
8
# Build-time argument with no default value; presumably carries the HTTP proxy
# needed for network access during the build — confirm against the build scripts.
ARG http_proxy
@@ -18,7 +18,6 @@ RUN apt-get update -y && \
18
18
# add-apt-repository ppa:deadsnakes/ppa && \
19
19
apt-get update -y && \
20
20
apt-get install -y python3.12 python3.12-dev python3-pip && \
21
- # curl -sS https://bootstrap.pypa.io/get-pip.py | python3.12 && \
22
21
update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 1 && \
23
22
update-alternatives --install /usr/bin/python python /usr/bin/python3.12 1 && \
24
23
apt-get install -y --no-install-recommends --fix-missing \
@@ -36,30 +35,13 @@ RUN apt-get update -y && \
36
35
linux-libc-dev && \
37
36
# Install Intel GPU runtime packages
38
37
apt-get update -y && \
39
- apt-get install -y libze1 libze-dev libze-intel-gpu1 intel-opencl-icd libze-intel-gpu-raytracing && \
40
38
apt-get install -y intel-oneapi-dpcpp-ct=2025.1.0-452 && \
41
39
apt-get clean && rm -rf /var/lib/apt/lists/*
42
40
43
- # pin compute runtime version
44
- # RUN mkdir /tmp/neo && \
45
- # cd /tmp/neo && \
46
- # wget https://github.com/intel/intel-graphics-compiler/releases/download/v2.12.5/intel-igc-core-2_2.12.5+19302_amd64.deb && \
47
- # wget https://github.com/intel/intel-graphics-compiler/releases/download/v2.12.5/intel-igc-opencl-2_2.12.5+19302_amd64.deb && \
48
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/intel-ocloc-dbgsym_25.22.33944.8-0_amd64.ddeb && \
49
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/intel-ocloc_25.22.33944.8-0_amd64.deb && \
50
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/intel-opencl-icd-dbgsym_25.22.33944.8-0_amd64.ddeb && \
51
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/intel-opencl-icd_25.22.33944.8-0_amd64.deb && \
52
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/libigdgmm12_22.7.0_amd64.deb && \
53
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/libze-intel-gpu1-dbgsym_25.22.33944.8-0_amd64.ddeb && \
54
- # wget https://github.com/intel/compute-runtime/releases/download/25.22.33944.8/libze-intel-gpu1_25.22.33944.8-0_amd64.deb && \
55
- # dpkg -i *.deb
56
-
57
41
# Working directory for the instructions that follow in this stage; relative
# paths in later instructions resolve under /llm.
WORKDIR /llm
58
- # TODO: update vllm_for_multi_arc.patch
59
42
# Copy the vLLM multi-Arc patch from the build context into /tmp/
# (presumably applied by a later build step not visible here — confirm).
COPY ./patches/vllm_for_multi_arc.patch /tmp/
60
43
# TODO: update oneccl...
61
44
# Copy the oneCCL patch from the build context into /tmp/
# (presumably applied by a later build step not visible here — confirm).
COPY ./patches/0001-oneccl-align-global-V0.1.1.patch /tmp/
62
- # COPY ./patches/vllm_int4_for_multi_arc.so /opt/lib/
63
45
64
46
# Set environment variables early
65
47
# Append /usr/local/lib/ to the shared-library search path. The ${VAR:+...} form
# emits the existing value plus ':' only when LD_LIBRARY_PATH is already set, so
# an unset variable does not produce a leading empty entry (which the dynamic
# linker interprets as the current working directory).
ENV LD_LIBRARY_PATH="${LD_LIBRARY_PATH:+${LD_LIBRARY_PATH}:}/usr/local/lib/"
@@ -126,9 +108,6 @@ ARG https_proxy
126
108
# install additional dependencies for openai api server
127
109
# Install accelerate, hf_transfer and modelscope (any version except 1.15.0).
# --no-cache-dir keeps pip's download cache out of the image layer.
RUN pip install --no-cache-dir accelerate hf_transfer 'modelscope!=1.15.0'
128
110
129
- # Install required triton version
130
- # RUN pip uninstall pytorch-triton-xpu triton -y && \
131
- # pip install https://download.pytorch-extension.intel.com/ipex_dev/xpu/triton-3.3.0%2Bgitbd88137b-cp310-cp310-linux_x86_64.whl
132
111
133
112
# Pin transformers version to avoid conflict in vLLM
134
113
# Keep transformers below 4.54.0; --no-cache-dir keeps pip's download cache
# out of the image layer.
RUN pip install --no-cache-dir "transformers<4.54.0"
0 commit comments