Create Dockerfile
Browse files- Dockerfile +7 -0
Dockerfile
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Serves a GGUF model through the prebuilt llama.cpp server image.
# Every setting below is supplied as a LLAMA_ARG_* environment variable; no
# files are copied in and the base image's entrypoint is left untouched.
#
# NOTE(review): `server-cuda` is a floating tag, so rebuilds may pick up a
# different server version. Pin a dated tag or an image digest if
# reproducible builds matter.
# NOTE(review): the llama.cpp repository has moved to the ggml-org
# organization; confirm this registry path is still being updated.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda

# Server configuration (meanings per the llama.cpp server docs; verify against
# the version actually pulled):
#   LLAMA_ARG_CTX_SIZE   - prompt context size, in tokens
#   LLAMA_ARG_FLASH_ATTN - enables Flash Attention
#   LLAMA_ARG_HF_REPO    - Hugging Face repository that holds the model
#   LLAMA_ARG_HF_FILE    - model file to fetch from that repository
#   LLAMA_ARG_N_PARALLEL - number of request slots served concurrently
#                          (presumably sharing the context above; TODO confirm)
ENV LLAMA_ARG_CTX_SIZE=10000 \
    LLAMA_ARG_FLASH_ATTN=1 \
    LLAMA_ARG_HF_REPO=bartowski/Qwen2.5-Coder-14B-GGUF \
    LLAMA_ARG_HF_FILE=Qwen2.5-Coder-14B-Q4_K_M.gguf \
    LLAMA_ARG_N_PARALLEL=2
|