cxumol committed on
Commit
8050b28
·
verified ·
1 Parent(s): 73e3723

model: change to official qwen2.5-1.5b-instruct-q4_k_m.gguf

Browse files
Files changed (1) hide show
  1. Dockerfile +2 -2
Dockerfile CHANGED
@@ -13,8 +13,8 @@ WORKDIR /app/llama.cpp
13
 
14
  # Hardcode for now
15
  ARG LLAMA_CPP_RELEASE_URL="https://github.com/ggml-org/llama.cpp/releases/download/b6218/llama-b6218-bin-ubuntu-x64.zip"
16
- ARG MODEL_URL="https://huggingface.co/mradermacher/Qwen2.5-1.5B-Instruct-abliterated-i1-GGUF/resolve/main/Qwen2.5-1.5B-Instruct-abliterated.i1-Q4_K_M.gguf"
17
- ARG MODEL_FILENAME="Qwen2.5-1.5B-Instruct-abliterated.i1-Q4_K_M.gguf"
18
 
19
 
20
  RUN curl -L "${LLAMA_CPP_RELEASE_URL}" -o llama.zip && \
 
13
 
14
  # Hardcode for now
15
  ARG LLAMA_CPP_RELEASE_URL="https://github.com/ggml-org/llama.cpp/releases/download/b6218/llama-b6218-bin-ubuntu-x64.zip"
16
+ ARG MODEL_URL="https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct-GGUF/resolve/main/qwen2.5-1.5b-instruct-q4_k_m.gguf"
17
+ ARG MODEL_FILENAME="qwen2.5-1.5b-instruct-q4_k_m.gguf"
18
 
19
 
20
  RUN curl -L "${LLAMA_CPP_RELEASE_URL}" -o llama.zip && \