CooLLaMACEO committed on
Commit
0f79223
·
verified ·
1 Parent(s): caa3198

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +11 -10
Dockerfile CHANGED
@@ -1,19 +1,20 @@
1
  FROM python:3.10-slim
2
 
3
- # Install system dependencies
4
- RUN apt-get update && apt-get install -y \
5
- build-essential \
6
- python3-dev \
7
- wget \
8
- && rm -rf /var/lib/apt/lists/*
9
 
10
- # The -q flag makes it quiet so the logs don't hit the 2MB limit
11
  RUN wget -q -O model.gguf https://huggingface.co/maddes8cht/mosaicml-mpt-7b-chat-gguf/resolve/main/mosaicml-mpt-7b-chat-Q2_K.gguf
12
 
13
- # Install modern llama-cpp and web server
14
- RUN pip install --no-cache-dir llama-cpp-python fastapi uvicorn
 
 
 
 
 
15
 
16
  COPY app.py .
17
 
18
- # Port 7860 is required for Hugging Face Spaces
19
  CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
 
1
  FROM python:3.10-slim
2
 
3
+ # Install wget to get the model
4
+ RUN apt-get update && apt-get install -y wget && rm -rf /var/lib/apt/lists/*
 
 
 
 
5
 
6
+ # 1. Download the GGUF model (Quiet mode)
7
  RUN wget -q -O model.gguf https://huggingface.co/maddes8cht/mosaicml-mpt-7b-chat-gguf/resolve/main/mosaicml-mpt-7b-chat-Q2_K.gguf
8
 
9
+ # 2. Install llama-cpp-python using a PRE-BUILT wheel
10
+ # This skips the "Building wheel" phase and finishes in seconds
11
+ RUN pip install --no-cache-dir \
12
+ https://huggingface.co/Luigi/llama-cpp-python-wheels-hf-spaces-free-cpu/resolve/main/llama_cpp_python-0.3.22-cp310-cp310-linux_x86_64.whl
13
+
14
+ # 3. Install web server basics
15
+ RUN pip install --no-cache-dir fastapi uvicorn
16
 
17
  COPY app.py .
18
 
19
+ # Port 7860 for Hugging Face
20
  CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]