drizzlezyk committed on
Commit
8be9541
·
verified ·
1 Parent(s): c364ab1

Upload inference/Dockerfile with huggingface_hub

Browse files
Files changed (1) hide show
  1. inference/Dockerfile +44 -0
inference/Dockerfile ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM quay.io/ascend/cann:8.3.rc1.alpha003-910b-ubuntu22.04-py3.11
2
+ # Define environment variables and build arguments
3
+ ENV DEBIAN_FRONTEND=noninteractive
4
+
5
+ ARG PY_BIN=/usr/local/python3.11.13/bin
6
+ WORKDIR /vllm-workspace
7
+
8
+ # Download VLLM
9
+ ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
10
+ ARG VLLM_TAG=v0.11.0rc3
11
+ RUN git clone --depth 1 --branch $VLLM_TAG $VLLM_REPO
12
+
13
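+ # Download vLLM-Ascend (re-declares VLLM_REPO/VLLM_TAG with new defaults; NOTE(review): a --build-arg override of either name would presumably apply to both clones -- consider distinct ARG names)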
14
+ ARG VLLM_REPO=https://github.com/vllm-project/vllm-ascend.git
15
+ ARG VLLM_TAG=v0.11.0rc0
16
+ RUN git clone --depth 1 --branch $VLLM_TAG $VLLM_REPO
17
+
18
+
19
+ WORKDIR /vllm-workspace/vllm-ascend
20
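+ # Patch dependency pins: point the PyPI index at the Tsinghua mirror and replace the torch-npu dev build with the 2.7.1 release (the final torch==2.7.1 substitution replaces the string with itself)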
21
+ RUN sed -i 's|https://mirrors.huaweicloud.com/ascend/repos/pypi|https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple|g' requirements.txt && \
22
+ sed -i 's/torch-npu==2.7.1.dev20250724/torch-npu==2.7.1/g' requirements.txt && \
23
+ sed -i 's/torch-npu==2.7.1.dev20250724/torch-npu==2.7.1/g' pyproject.toml && \
24
+ sed -i 's/torch==2.7.1/torch==2.7.1/g' pyproject.toml
25
+ # Fetch the git submodules of vllm-ascend
26
+ RUN git submodule update --init --recursive
27
+
28
+
29
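+ # Install vLLM from source (editable, --no-deps, VLLM_TARGET_DEVICE=empty). NOTE(review): VLLM_USE_PRECOMPILED=0 is assigned without export, so it is presumably not visible to pip -- confirm intent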
30
+ WORKDIR /vllm-workspace/vllm
31
+ RUN source /usr/local/Ascend/ascend-toolkit/set_env.sh && \
32
+ source /usr/local/Ascend/nnal/atb/set_env.sh && \
33
+ export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/`uname -i`-linux/devlib && \
34
+ VLLM_USE_PRECOMPILED=0 && \
35
+ VLLM_TARGET_DEVICE=empty ${PY_BIN}/pip install -v --no-deps -e .
36
+
37
+
38
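+ # Install vLLM-Ascend from source (editable, --no-deps). NOTE(review): VLLM_USE_PRECOMPILED=0 is assigned without export, so it is presumably not visible to pip -- confirm intent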
39
+ WORKDIR /vllm-workspace/vllm-ascend
40
+ RUN source /usr/local/Ascend/ascend-toolkit/set_env.sh && \
41
+ source /usr/local/Ascend/nnal/atb/set_env.sh && \
42
+ export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/`uname -i`-linux/devlib && \
43
+ VLLM_USE_PRECOMPILED=0 && \
44
+ VLLM_TARGET_DEVICE=empty ${PY_BIN}/pip install -v --no-deps -e .