ngxson committed
Commit: 04bf0e1
Parent: ce40819

Update start.sh

Files changed (1)
start.sh (+6, -2)
start.sh CHANGED
@@ -5,13 +5,17 @@ if [ ! -d "llama.cpp" ]; then
   git clone https://github.com/ggerganov/llama.cpp
 fi
 
+export GGML_CUDA=OFF
 if [[ -z "${RUN_LOCALLY}" ]]; then
   # enable CUDA if NOT running locally
-  export LLAMA_CUDA=1
+  export GGML_CUDA=ON
 fi
 
 cd llama.cpp
-make -j llama-quantize llama-gguf-split llama-imatrix
+cmake -B build -DBUILD_SHARED_LIBS=OFF -DGGML_CUDA=${GGML_CUDA} -DLLAMA_CURL=ON
+cmake --build build --config Release -j --target llama-quantize llama-gguf-split llama-imatrix
+cp ./build/bin/llama-* .
+rm -rf build
 
 cd ..
 python app.py
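
For reference, a sketch of start.sh as it reads after this commit, reconstructed from the hunk above. The diff only shows lines 5 onward plus the enclosing if from the hunk header, so the shebang and anything else above the clone guard are assumptions.

#!/bin/bash
# (assumed shebang; lines above the clone guard are not visible in the hunk)

# Clone llama.cpp on the first run only
if [ ! -d "llama.cpp" ]; then
  git clone https://github.com/ggerganov/llama.cpp
fi

# Default to a CPU-only build; turn CUDA on unless RUN_LOCALLY is set
export GGML_CUDA=OFF
if [[ -z "${RUN_LOCALLY}" ]]; then
  # enable CUDA if NOT running locally
  export GGML_CUDA=ON
fi

cd llama.cpp
# Configure and build just the three tools the app needs, linked statically
cmake -B build -DBUILD_SHARED_LIBS=OFF -DGGML_CUDA=${GGML_CUDA} -DLLAMA_CURL=ON
cmake --build build --config Release -j --target llama-quantize llama-gguf-split llama-imatrix
# Keep only the binaries; discard the build tree
cp ./build/bin/llama-* .
rm -rf build

cd ..
python app.py

Because GGML_CUDA only flips to ON when RUN_LOCALLY is empty, invoking the script as RUN_LOCALLY=1 ./start.sh yields a CPU-only build for local testing.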