ngxson HF staff committed on
Commit
a3b9e70
1 Parent(s): 3426c82

Create Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -0
Dockerfile ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ FROM ghcr.io/ggerganov/llama.cpp:server-cuda
2
+
3
+ ENV LLAMA_ARG_CTX_SIZE=10000
4
+ ENV LLAMA_ARG_FLASH_ATTN=1
5
+ ENV LLAMA_ARG_HF_REPO=bartowski/Qwen2.5-Coder-14B-GGUF
6
+ ENV LLAMA_ARG_HF_FILE=Qwen2.5-Coder-14B-Q4_K_M.gguf
7
+ ENV LLAMA_ARG_N_PARALLEL=2