Alex0007 committed on
Commit
859ea12
1 Parent(s): 43b8c19

更新了一下Dockerfile

Browse files
Files changed (3) hide show
  1. Dockerfile +5 -20
  2. README.md +1 -1
  3. config.toml +0 -2
Dockerfile CHANGED
@@ -1,48 +1,33 @@
1
- # Using a standard Ubuntu base image
2
  FROM ubuntu:22.04
3
 
4
- # Environment variables
5
  ENV MODEL_NAME="Qwen-7B-gguf"
6
  ENV MODEL_FILE="qwen7b-q4_0.gguf"
7
  ENV MODEL_USER="MatrixStudio"
8
  ENV DEFAULT_MODEL_BRANCH="main"
9
  ENV MODEL_URL="https://huggingface.co/${MODEL_USER}/${MODEL_NAME}/resolve/${DEFAULT_MODEL_BRANCH}/${MODEL_FILE}"
10
 
11
- # Installing necessary packages
12
- RUN apt-get update && apt-get upgrade -y \
13
- && apt-get install -y build-essential python3 python3-pip wget curl git \
14
- --no-install-recommends \
15
- && apt-get clean && rm -rf /var/lib/apt/lists/*
16
 
17
- # Setting up the working directory
18
  WORKDIR /app
19
 
20
-
21
  COPY ./requirements.txt /app/requirements.txt
22
  RUN pip install --upgrade pip && pip install --no-cache-dir --upgrade -r /app/requirements.txt
23
 
24
-
25
- # Cloning the llama.cpp repository
26
  RUN git clone https://github.com/ggerganov/llama.cpp.git
27
-
28
- # Moving to the llama.cpp directory and building the project
29
  WORKDIR /app/llama.cpp
30
  RUN make
31
 
32
- # Model download process
33
  RUN mkdir -p models/7B && wget -O models/7B/${MODEL_FILE} ${MODEL_URL}
34
 
35
- # Changing ownership to a non-root user
36
  RUN useradd -m -u 1000 user && chown -R user:user /app
37
  USER user
38
  ENV HOME=/home/user
39
  ENV PATH=/home/user/.local/bin:$PATH
40
  RUN chmod -R 777 /app/llama.cpp
41
 
42
- # Setting up the application
43
- EXPOSE 8080
44
 
45
  # Adjust the CMD to use the absolute path of the server executable
46
- # CMD ["/app/llama.cpp/server", "-m", "/app/llama.cpp/models/7B/qwen7b-q4_0.gguf", "-c", "16000", "--host", "0.0.0.0", "--port", "8000"]
47
- # CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]
48
- CMD ["python3", "-m", "llama_cpp.server", "--model", "/app/llama.cpp/models/7B/qwen7b-q4_0.gguf", "--host", "0.0.0.0", "--port", "8000", "--n_threads", "16"]
 
 
1
  FROM ubuntu:22.04
2
 
 
3
  ENV MODEL_NAME="Qwen-7B-gguf"
4
  ENV MODEL_FILE="qwen7b-q4_0.gguf"
5
  ENV MODEL_USER="MatrixStudio"
6
  ENV DEFAULT_MODEL_BRANCH="main"
7
  ENV MODEL_URL="https://huggingface.co/${MODEL_USER}/${MODEL_NAME}/resolve/${DEFAULT_MODEL_BRANCH}/${MODEL_FILE}"
8
 
9
+ RUN apt-get update && apt-get upgrade -y && apt-get install -y build-essential python3 python3-pip wget curl git
 
 
 
 
10
 
 
11
  WORKDIR /app
12
 
 
13
  COPY ./requirements.txt /app/requirements.txt
14
  RUN pip install --upgrade pip && pip install --no-cache-dir --upgrade -r /app/requirements.txt
15
 
 
 
16
  RUN git clone https://github.com/ggerganov/llama.cpp.git
 
 
17
  WORKDIR /app/llama.cpp
18
  RUN make
19
 
 
20
  RUN mkdir -p models/7B && wget -O models/7B/${MODEL_FILE} ${MODEL_URL}
21
 
 
22
  RUN useradd -m -u 1000 user && chown -R user:user /app
23
  USER user
24
  ENV HOME=/home/user
25
  ENV PATH=/home/user/.local/bin:$PATH
26
  RUN chmod -R 777 /app/llama.cpp
27
 
28
+ EXPOSE 7860
 
29
 
30
  # Adjust the CMD to use the absolute path of the server executable
31
+ # CMD ["/app/llama.cpp/server", "-m", "/app/llama.cpp/models/7B/qwen7b-q4_0.gguf", "-c", "16000", "--host", "0.0.0.0", "--port", "7860"]
32
+ # CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]
33
+ CMD ["python3", "-m", "llama_cpp.server", "--model", "/app/llama.cpp/models/7B/qwen7b-q4_0.gguf", "--host", "0.0.0.0", "--port", "7860", "--n_threads", "16"]
README.md CHANGED
@@ -4,6 +4,6 @@ emoji: 🦍⨐
4
  colorFrom: green
5
  colorTo: yellow
6
  sdk: docker
7
- app_port: 8080
8
  pinned: false
9
  ---
 
4
  colorFrom: green
5
  colorTo: yellow
6
  sdk: docker
7
+ app_port: 7860
8
  pinned: false
9
  ---
config.toml DELETED
@@ -1,2 +0,0 @@
1
- model="/app/llama.cpp/models/7B/qwen7b-q4_0.gguf"
2
- n_threads="1"