Spaces:
Sleeping
Sleeping
File size: 1,187 Bytes
e3396ba 85f179c e3396ba 85f179c e3396ba 7fd3f9f 85f179c 4966618 d1343e4 351861c d1343e4 e3396ba 773e76d 1fb7f0b 7fd3f9f 85f179c e3396ba 85f179c e3396ba cd2b254 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 |
# Image for a Gradio app backed by llama-cpp-python, with a GGUF chat model
# downloaded into the image at build time.
# Base: Debian bookworm "slim" Python image; another Debian-based Python image
# should work as well.
FROM python:3.11.5-slim-bookworm

# OS packages, all in one layer: `apt-get update` and `install` stay together so
# a cached, stale package index is never reused, and the index is deleted in the
# same layer so it does not end up in the image.
#   build-essential, cmake, gcc - compile llama-cpp-python from source
#   libopenblas-dev, pkg-config - let CMake locate the OpenBLAS backend requested below
#   ca-certificates, wget       - download the model over HTTPS
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        cmake \
        gcc \
        libopenblas-dev \
        pkg-config \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Bring the packaging toolchain up to date before building anything with it.
RUN python3 -m pip install --no-cache-dir -U pip setuptools wheel

# Build llama-cpp-python with the OpenBLAS backend.
# NOTE(review): newer llama-cpp-python releases appear to name these options
# GGML_BLAS / GGML_BLAS_VENDOR - confirm against the version pip resolves, and
# consider pinning that version for reproducible builds.
RUN CMAKE_ARGS="-DLLAMA_BLAS=ON -DLLAMA_BLAS_VENDOR=OpenBLAS" \
    pip install --no-cache-dir llama-cpp-python

# Unprivileged runtime account with a fixed numeric UID/GID and a real home
# directory, replacing the previous "run as root + chmod 777" approach.
# NOTE(review): UID 1000 is chosen to match what Hugging Face Spaces is
# documented to run containers as - confirm for your target platform.
RUN groupadd --gid 1000 appuser \
    && useradd --uid 1000 --gid 1000 --create-home appuser

# WORKDIR creates /app. Hand /app and the directory for the translator model
# (facebook/m2m100_1.2B) to the runtime user so the app can write there.
WORKDIR /app
RUN mkdir translator \
    && chown appuser:appuser /app translator

# Download the model before copying the source, so editing the app does not
# invalidate this layer and trigger a new download.
# Other models work too: change the URL, or remove this RUN and ship your own
# file named "model.bin" in the Space/repo/build context.
# NOTE(review): the URL tracks the `main` revision and the file is not
# checksum-verified; consider pinning a commit and checking a sha256.
RUN wget -q -O model.bin https://huggingface.co/TheBloke/Llama-2-13B-chat-GGUF/resolve/main/llama-2-13b-chat.Q5_K_M.gguf

# Install Python dependencies from the manifest alone, so this layer is rebuilt
# only when requirements.txt changes.
COPY requirements.txt /app/requirements.txt
RUN pip install --no-cache-dir --upgrade -r /app/requirements.txt

# Application source goes last because it changes most often.
COPY --chown=appuser:appuser . /app

# Drop privileges for runtime; every step that needed root is above this line.
USER appuser

# Launch the app through the Gradio CLI. Exec (JSON-array) form runs the process
# directly, without a wrapping shell.
CMD ["gradio", "gradio_app.py"]