Spaces: Runtime error
Updates to flash attn install (#1)
opened by nateraw
- Dockerfile +5 -0
- start_server.sh +2 -0
Dockerfile
CHANGED
|
@@ -91,6 +91,11 @@ RUN curl https://sh.rustup.rs -sSf | bash -s -- -y
|
|
| 91 |
ENV PATH="$HOME/.cargo/bin:${PATH}"
|
| 92 |
RUN chmod -R 777 $HOME/.cargo/
|
| 93 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 94 |
# Python packages
|
| 95 |
RUN --mount=target=requirements.txt,source=requirements.txt \
|
| 96 |
pip install --no-cache-dir --upgrade -r requirements.txt
|
|
|
|
| 91 |
ENV PATH="$HOME/.cargo/bin:${PATH}"
|
| 92 |
RUN chmod -R 777 $HOME/.cargo/
|
| 93 |
|
| 94 |
+
# Install ninja, which might help speed up flash attn build time
|
| 95 |
+
RUN apt-get update && apt-get install -y --no-install-recommends \
|
| 96 |
+
ninja-build \
|
| 97 |
+
&& rm -rf /var/lib/apt/lists/*
|
| 98 |
+
|
| 99 |
# Python packages
|
| 100 |
RUN --mount=target=requirements.txt,source=requirements.txt \
|
| 101 |
pip install --no-cache-dir --upgrade -r requirements.txt
|
start_server.sh
CHANGED
|
@@ -3,7 +3,9 @@ JUPYTER_TOKEN="${JUPYTER_TOKEN:=huggingface}"
|
|
| 3 |
|
| 4 |
echo "Starting Jupyter Lab with token $JUPYTER_TOKEN"
|
| 5 |
make install
|
|
|
|
| 6 |
make install-flash-attention
|
|
|
|
| 7 |
|
| 8 |
jupyter-lab \
|
| 9 |
--ip 0.0.0.0 \
|
|
|
|
| 3 |
|
| 4 |
echo "Starting Jupyter Lab with token $JUPYTER_TOKEN"
|
| 5 |
make install
|
| 6 |
+
cd server
|
| 7 |
make install-flash-attention
|
| 8 |
+
cd ..
|
| 9 |
|
| 10 |
jupyter-lab \
|
| 11 |
--ip 0.0.0.0 \
|