Updates to flash attn install

#1
by nateraw - opened
Files changed (2)
  1. Dockerfile +5 -0
  2. start_server.sh +2 -0
Dockerfile CHANGED
@@ -91,6 +91,11 @@ RUN curl https://sh.rustup.rs -sSf | bash -s -- -y
91
  ENV PATH="$HOME/.cargo/bin:${PATH}"
92
  RUN chmod -R 777 $HOME/.cargo/
93
 
 
 
 
 
 
94
  # Python packages
95
  RUN --mount=target=requirements.txt,source=requirements.txt \
96
  pip install --no-cache-dir --upgrade -r requirements.txt
 
91
  ENV PATH="$HOME/.cargo/bin:${PATH}"
92
  RUN chmod -R 777 $HOME/.cargo/
93
 
94
+ # Install ninja, which might help speed up flash attn build time
95
+ RUN apt-get update && apt-get install -y --no-install-recommends \
96
+ ninja-build \
97
+ && rm -rf /var/lib/apt/lists/*
98
+
99
  # Python packages
100
  RUN --mount=target=requirements.txt,source=requirements.txt \
101
  pip install --no-cache-dir --upgrade -r requirements.txt
start_server.sh CHANGED
@@ -3,7 +3,9 @@ JUPYTER_TOKEN="${JUPYTER_TOKEN:=huggingface}"
3
 
4
  echo "Starting Jupyter Lab with token $JUPYTER_TOKEN"
5
  make install
 
6
  make install-flash-attention
 
7
 
8
  jupyter-lab \
9
  --ip 0.0.0.0 \
 
3
 
4
  echo "Starting Jupyter Lab with token $JUPYTER_TOKEN"
5
  make install
6
+ cd server
7
  make install-flash-attention
8
+ cd ..
9
 
10
  jupyter-lab \
11
  --ip 0.0.0.0 \