Jacky2305 committed on
Commit
387c4fa
·
verified ·
1 Parent(s): 0ed234d

Create Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +14 -0
Dockerfile ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Runs llama.cpp's HTTP server (llama-server) as a Hugging Face Docker Space.
#
# The llama.cpp images are published under the ggml-org namespace (the project
# moved there from ggerganov/).
# NOTE(review): ":server" is a moving tag; pin a specific build tag or an
# image digest if reproducible builds are required.
FROM ghcr.io/ggml-org/llama.cpp:server

# The model is downloaded at container start, so the cache directory must be
# writable by the runtime user. HF Spaces runs the container as UID 1000,
# which may not have a writable home directory in this image; /tmp is
# world-writable, so point llama.cpp's download cache there.
ENV LLAMA_CACHE=/tmp/llama-cache

# Run as the same unprivileged UID that HF Spaces uses, so a local
# `docker run` behaves like the Space.
USER 1000

# HF Spaces requires the application to listen on port 7860.
EXPOSE 7860

# The base image's health check (if any) targets llama-server's default port,
# 8080 — TODO confirm against the upstream Dockerfile. Override it so the
# probe follows the port configured below. The generous start period leaves
# time for the initial model download and load.
HEALTHCHECK --interval=30s --timeout=5s --start-period=300s --retries=3 \
    CMD ["curl", "-f", "http://localhost:7860/health"]

# Default arguments passed to the image's llama-server entrypoint.
# --hf-repo / --hf-file fetch the GGUF model straight from the Hugging Face
# Hub on start-up, so nothing has to be downloaded at build time.
# NOTE(review): --threads should not exceed the vCPUs of the Space hardware;
# confirm 4 is appropriate for the selected tier.
CMD ["--hf-repo", "bartowski/Qwen2.5-3B-Instruct-GGUF", \
     "--hf-file", "Qwen2.5-3B-Instruct-Q4_K_M.gguf", \
     "--host", "0.0.0.0", \
     "--port", "7860", \
     "--ctx-size", "4096", \
     "--threads", "4", \
     "--n-predict", "512"]