concedo committed on
Commit
81d6ed5
1 Parent(s): 92f0235

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -7
Dockerfile CHANGED
@@ -1,12 +1,12 @@
1
- FROM debian
2
  ARG MODEL
3
  ARG MODEL_NAME
4
  ARG ADDITIONAL
5
  RUN mkdir /opt/koboldcpp
6
- RUN apt update && apt install curl -y
 
7
  WORKDIR /opt/koboldcpp
8
- COPY *.json /opt/koboldcpp/
9
- RUN curl -fLo koboldcpp https://github.com/LostRuins/koboldcpp/releases/latest/download/koboldcpp-linux-x64-nocuda
10
- RUN chmod +x ./koboldcpp
11
- RUN curl -fLo model.ggml $MODEL || true
12
- CMD ./koboldcpp --model model.ggml $ADDITIONAL --port 7860 --hordemodelname $MODEL_NAME --hordemaxctx 1 --hordegenlen 1 --preloadstory default.json --ignoremissing
 
1
+ FROM nvidia/cuda:11.8.0-devel-ubuntu22.04
2
  ARG MODEL
3
  ARG MODEL_NAME
4
  ARG ADDITIONAL
5
  RUN mkdir /opt/koboldcpp
6
+ RUN apt update && apt install git build-essential libopenblas-dev wget python3-pip -y
7
+ RUN git clone https://github.com/lostruins/koboldcpp /opt/koboldcpp
8
  WORKDIR /opt/koboldcpp
9
+ COPY default.json /opt/koboldcpp/default.json
10
+ RUN make LLAMA_OPENBLAS=1
11
+ RUN wget -O model.ggml $MODEL || true
12
+ CMD /bin/python3 ./koboldcpp.py --model model.ggml $ADDITIONAL --port 7860 --hordeconfig $MODEL_NAME 1 1 --preloadstory default.json --ignoremissing