# Spaces: Runtime error
# Image that builds KoboldCpp from source on top of the CUDA 12.1 development
# image and serves it on port 7860.
#
# Build arguments:
#   MODEL       URL of the model file to download to /opt/koboldcpp/model.ggml.
#   MODEL_NAME  Name passed as the first value of --hordeconfig.
#   ADDITIONAL  Extra command-line flags appended to the koboldcpp.py invocation.
FROM nvidia/cuda:12.1.1-devel-ubuntu22.04

# Toolchain and runtime packages. update+install share one layer so the package
# index is never stale, and the index is removed in the same layer to keep the
# image small. ca-certificates and python3 are listed explicitly because
# --no-install-recommends would otherwise leave them to transitive dependencies.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        git \
        libopenblas-dev \
        python3 \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# git creates the target directory itself; a shallow clone is enough to build.
RUN git clone --depth 1 https://github.com/lostruins/koboldcpp /opt/koboldcpp
WORKDIR /opt/koboldcpp

# Compile before any ARG or COPY so that changing the model or the preload
# story does not invalidate this (slow) layer.
RUN make LLAMA_OPENBLAS=1 LLAMA_CUBLAS=1 LLAMA_PORTABLE=1

COPY default.json /opt/koboldcpp/default.json

# Best-effort model download: the build continues when MODEL is unset or the
# download fails, but a partial/empty model.ggml is removed so a broken file is
# never shipped in the image.
ARG MODEL
RUN if [ -n "$MODEL" ]; then \
        wget -O model.ggml "$MODEL" \
        || { echo "WARNING: could not download model from $MODEL" >&2; rm -f model.ggml; }; \
    else \
        echo "WARNING: MODEL build argument is empty; no model downloaded" >&2; \
    fi

# ARG values exist only while building. CMD is evaluated when the container
# starts, so the values it needs are persisted as environment variables
# (still overridable at `docker run` time with -e).
ARG MODEL_NAME
ARG ADDITIONAL
ENV MODEL_NAME="${MODEL_NAME}" \
    ADDITIONAL="${ADDITIONAL}"

# Documents the port passed to --port below.
EXPOSE 7860

# Exec form with an explicit shell: the shell expands the variables and `exec`
# replaces it with python so the server receives stop signals directly.
# $ADDITIONAL is intentionally unquoted so it can carry several flags;
# $MODEL_NAME is quoted so it always occupies exactly one argument.
CMD ["/bin/sh", "-c", "exec /bin/python3 ./koboldcpp.py --model model.ggml $ADDITIONAL --port 7860 --hordeconfig \"$MODEL_NAME\" 1 1 --preloadstory default.json --ignoremissing"]