ilhooq's picture
Try Q4_K_M
0f08574
# Ubuntu release used as the base image; declared before FROM so it can be
# overridden with `--build-arg UBUNTU_VERSION=...`.
ARG UBUNTU_VERSION=22.04

# ---- Build stage: compiles the llama.cpp HTTP server against OpenBLAS ----
FROM ubuntu:$UBUNTU_VERSION AS build

# Toolchain and development headers needed by the build.
# ca-certificates is listed explicitly: it is only a "recommended" package, so
# --no-install-recommends would otherwise drop it and the HTTPS clone would fail.
# The apt lists are removed in the same layer so they do not persist.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        git \
        libcurl4-openssl-dev \
        libopenblas-dev \
        pkg-config && \
    rm -rf /var/lib/apt/lists/*

# Git ref (branch, tag or commit) of llama.cpp to build. The default tracks the
# upstream default branch, exactly like the previous unpinned clone.
# NOTE(review): pin this to a known-good tag/commit for reproducible builds; the
# ref must still provide a Makefile that accepts LLAMA_OPENBLAS and a `server` target.
# Declared after the apt layer so changing the ref does not invalidate it.
ARG LLAMA_CPP_REF=master
RUN git clone https://github.com/ggerganov/llama.cpp.git /llama.cpp && \
    git -C /llama.cpp checkout "$LLAMA_CPP_REF"

WORKDIR /llama.cpp
# ENV LLAMA_CURL=1
# Build only the `server` binary (the single build artifact used from this
# stage), in parallel across all available cores.
RUN make -j"$(nproc)" LLAMA_OPENBLAS=1 server
# ---- Runtime stage: server binary, model weights and static web UI ----
FROM ubuntu:$UBUNTU_VERSION AS runtime

# Runtime shared libraries only (no -dev headers), plus curl for the model
# download below. ca-certificates is required for the HTTPS download because
# recommended packages are not installed. apt lists are removed in the same layer.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        libcurl4 \
        libopenblas-base && \
    rm -rf /var/lib/apt/lists/*

ENV LC_ALL=C.utf8

# Fetch the model before copying the server binary so that rebuilding the
# server does not invalidate this (large) layer.
# --fail makes curl exit non-zero on an HTTP error instead of silently saving
# the error page as the model file; --retry covers transient network failures.
RUN mkdir -p /models && \
    curl --fail --location --retry 3 \
        https://huggingface.co/TheBloke/deepseek-coder-1.3b-instruct-GGUF/resolve/main/deepseek-coder-1.3b-instruct.Q4_K_M.gguf \
        --output /models/deepseek-coder-1.3b-instruct.Q4_K_M.gguf

COPY --from=build /llama.cpp/server /server
COPY ./public /webui

# Run as an unprivileged user: the server only needs read access to the model
# and the web UI, and it binds a port above 1024.
# NOTE(review): --mlock depends on the container's memlock ulimit — confirm the
# deployment sets one large enough for the model.
RUN useradd --system --uid 10001 --no-create-home --shell /usr/sbin/nologin llama
USER llama

# Port passed to the server via --port below (documentation only; it is not published).
EXPOSE 7860

# ENTRYPOINT is the binary; CMD holds the default arguments so they can be
# overridden at `docker run` time.
ENTRYPOINT [ "/server" ]
CMD [ "--host", "0.0.0.0", "--port", "7860", "--model", "/models/deepseek-coder-1.3b-instruct.Q4_K_M.gguf", "-t", "2", "--mlock", "-c", "512", "--chat-template", "deepseek", "--path", "/webui" ]