5fp committed on
Commit
d19e237
1 Parent(s): dc5ffc0

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +5 -10
Dockerfile CHANGED
@@ -1,11 +1,7 @@
1
  ARG UBUNTU_VERSION=22.04
2
- ARG CUDA_VERSION=12.3.1
3
- ARG BASE_CUDA_DEV_CONTAINER=nvidia/cuda:${CUDA_VERSION}-devel-ubuntu${UBUNTU_VERSION}
4
- ARG BASE_CUDA_RUN_CONTAINER=nvidia/cuda:${CUDA_VERSION}-runtime-ubuntu${UBUNTU_VERSION}
5
 
6
- FROM ${BASE_CUDA_DEV_CONTAINER} as build
7
-
8
- ARG CUDA_DOCKER_ARCH=all
9
 
10
  RUN apt-get update && \
11
  apt-get install -y build-essential git cmake wget
@@ -16,8 +12,8 @@ RUN git clone https://github.com/ggerganov/llama.cpp.git
16
 
17
  WORKDIR /build/llama.cpp
18
 
19
- ENV CUDA_DOCKER_ARCH=${CUDA_DOCKER_ARCH}
20
- ENV LLAMA_CUBLAS=1
21
 
22
  RUN mkdir build && \
23
  cd build && \
@@ -27,8 +23,7 @@ RUN mkdir build && \
27
  WORKDIR /data
28
  RUN wget https://huggingface.co/brunopio/Llama3-8B-1.58-100B-tokens-GGUF/resolve/main/Llama3-8B-1.58-100B-tokens-TQ2_0.gguf -nv -O model.gguf
29
 
30
- FROM ${BASE_CUDA_RUN_CONTAINER} as runtime
31
-
32
 
33
  WORKDIR /app
34
 
 
1
  ARG UBUNTU_VERSION=22.04
2
+ ARG BASE_CPU_CONTAINER=ubuntu:${UBUNTU_VERSION}
 
 
3
 
4
+ FROM ${BASE_CPU_CONTAINER} as build
 
 
5
 
6
  RUN apt-get update && \
7
  apt-get install -y build-essential git cmake wget
 
12
 
13
  WORKDIR /build/llama.cpp
14
 
15
+ # Ensure that LLAMA_CUBLAS is not set to 1
16
+ ENV LLAMA_CUBLAS=0
17
 
18
  RUN mkdir build && \
19
  cd build && \
 
23
  WORKDIR /data
24
  RUN wget https://huggingface.co/brunopio/Llama3-8B-1.58-100B-tokens-GGUF/resolve/main/Llama3-8B-1.58-100B-tokens-TQ2_0.gguf -nv -O model.gguf
25
 
26
+ FROM ${BASE_CPU_CONTAINER} as runtime
 
27
 
28
  WORKDIR /app
29