Create Dockerfile
Browse files- Dockerfile +14 -0
Dockerfile
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# Base image: the upstream llama.cpp server build.
# NOTE(review): the image's ENTRYPOINT is presumed to be the llama-server
# binary, which is why CMD below supplies only its arguments — confirm.
FROM ghcr.io/ggerganov/llama.cpp:server

# Hugging Face Spaces requires the app to listen on port 7860.
EXPOSE 7860

# NOTE(review): the upstream server image is understood to declare a
# HEALTHCHECK that probes http://localhost:8080/health. The server is moved to
# port 7860 below, so that inherited probe would never succeed; re-declare it
# against the port actually in use. Confirm curl is present in the base image.
# The long start period leaves room for the model download on first start.
HEALTHCHECK --interval=30s --timeout=5s --start-period=300s --retries=3 \
    CMD ["curl", "-f", "http://localhost:7860/health"]

# Start llama-server. The model is pulled from the Hugging Face Hub at startup
# via --hf-repo / --hf-file, so nothing has to be downloaded at build time.
CMD ["--hf-repo", "bartowski/Qwen2.5-3B-Instruct-GGUF", \
     "--hf-file", "Qwen2.5-3B-Instruct-Q4_K_M.gguf", \
     "--host", "0.0.0.0", \
     "--port", "7860", \
     "--ctx-size", "4096", \
     "--threads", "4", \
     "--n-predict", "512"]
|