File size: 474 Bytes
435f6db
00fa67d
45c1114
00fa67d
45c1114
33f9f12
 
00fa67d
7ee4214
1
2
3
4
5
6
7
8
9
10
# Image that serves the deepseek-coder 6.7B instruct model (Q6_K GGUF) through
# the llama.cpp HTTP server with CUDA support.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda

# curl is only needed to fetch the model weights below. ca-certificates is
# listed explicitly because --no-install-recommends would otherwise skip it and
# the HTTPS download would fail. The apt lists are removed in the same layer so
# they do not bloat the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
    && rm -rf /var/lib/apt/lists/*

# Download the model weights into /models.
#   -f  fail the build on an HTTP error instead of saving the error page as the
#       model file
#   -L  follow the redirect Hugging Face issues to its download host
RUN mkdir -p /models \
    && curl -fL \
        https://huggingface.co/TheBloke/deepseek-coder-6.7B-instruct-GGUF/resolve/main/deepseek-coder-6.7b-instruct.Q6_K.gguf \
        --output /models/deepseek-coder-6.7b-instruct.Q6_K.gguf

# Documentation only: the server below listens on this port.
EXPOSE 7860

# Exec (JSON-array) form: every element must be separated by a comma, otherwise
# the array is not valid JSON and Docker falls back to shell form.
#   -ngl 32            number of model layers offloaded to the GPU
#   --host / --port    listen on all interfaces, port 7860
#   -c 4096            context size in tokens
#   --chat-template    prompt template used for chat requests
ENTRYPOINT [ "/server", "-ngl", "32", "--host", "0.0.0.0", "--port", "7860", "--model", "/models/deepseek-coder-6.7b-instruct.Q6_K.gguf", "-c", "4096", "--chat-template", "deepseek" ]