Spaces:
Runtime error
Runtime error
Updates to flash attn install
#1 by nateraw - opened
- Dockerfile +5 -0
- start_server.sh +2 -0
Dockerfile
CHANGED
@@ -91,6 +91,11 @@ RUN curl https://sh.rustup.rs -sSf | bash -s -- -y
|
|
91 |
ENV PATH="$HOME/.cargo/bin:${PATH}"
|
92 |
RUN chmod -R 777 $HOME/.cargo/
|
93 |
|
|
|
|
|
|
|
|
|
|
|
94 |
# Python packages
|
95 |
RUN --mount=target=requirements.txt,source=requirements.txt \
|
96 |
pip install --no-cache-dir --upgrade -r requirements.txt
|
|
|
91 |
ENV PATH="$HOME/.cargo/bin:${PATH}"
|
92 |
RUN chmod -R 777 $HOME/.cargo/
|
93 |
|
94 |
+
# Install ninja, which might help speed up flash attn build time
|
95 |
+
RUN apt-get update && apt-get install -y --no-install-recommends \
|
96 |
+
ninja-build \
|
97 |
+
&& rm -rf /var/lib/apt/lists/*
|
98 |
+
|
99 |
# Python packages
|
100 |
RUN --mount=target=requirements.txt,source=requirements.txt \
|
101 |
pip install --no-cache-dir --upgrade -r requirements.txt
|
start_server.sh
CHANGED
@@ -3,7 +3,9 @@ JUPYTER_TOKEN="${JUPYTER_TOKEN:=huggingface}"
|
|
3 |
|
4 |
echo "Starting Jupyter Lab with token $JUPYTER_TOKEN"
|
5 |
make install
|
|
|
6 |
make install-flash-attention
|
|
|
7 |
|
8 |
jupyter-lab \
|
9 |
--ip 0.0.0.0 \
|
|
|
3 |
|
4 |
echo "Starting Jupyter Lab with token $JUPYTER_TOKEN"
|
5 |
make install
|
6 |
+
cd server
|
7 |
make install-flash-attention
|
8 |
+
cd ..
|
9 |
|
10 |
jupyter-lab \
|
11 |
--ip 0.0.0.0 \
|