llava-1.5-7b-GGUF

Running

limcheekin committed on Dec 2, 2023

Commit

24caaad

•

1 Parent(s): 646c37a

feat: added clip model and chat_format

Files changed (2) hide show

Dockerfile CHANGED Viewed

@@ -15,7 +15,8 @@ RUN pip install -U pip setuptools wheel && \
 # Download model
 RUN mkdir model && \
-    curl -L https://huggingface.co/mys/ggml_llava-v1.5-7b/resolve/main/ggml-model-q5_k.gguf -o model/gguf-model.bin
 COPY ./start_server.sh ./
 COPY ./main.py ./

 # Download model
 RUN mkdir model && \
+    curl -L https://huggingface.co/mys/ggml_llava-v1.5-7b/resolve/main/ggml-model-q5_k.gguf -o model/gguf-model.bin && \
+    curl -L https://huggingface.co/mys/ggml_llava-v1.5-7b/resolve/main/mmproj-model-f16.gguf -o model/clip-model.bin
 COPY ./start_server.sh ./
 COPY ./main.py ./

main.py CHANGED Viewed

@@ -6,7 +6,9 @@ app = create_app(
     Settings(
         n_threads=2,  # set to number of cpu cores
         model="model/gguf-model.bin",
-        embedding=True
     )
 )

     Settings(
         n_threads=2,  # set to number of cpu cores
         model="model/gguf-model.bin",
+        clip_model_path="model/clip-model.bin",
+        embedding=True,
+        chat_format="llava-1-5"
     )
 )