LLM_Deployment / Dockerfile
Prabhash's picture
Update Dockerfile
3a77aaf verified
raw
history blame
No virus
396 Bytes
# Builds an image that serves `main:app` with uvicorn on port 7860 and ships
# the Gemma 1.1 2B instruction-tuned GGUF weights at /code/2b_it_v1p1.gguf.

# The model download step below calls wget without installing it, so it
# relies on the base image providing that tool.
FROM python:3.9

WORKDIR /code

# Copy only the dependency manifest first so the (slow) install layer stays
# cached until requirements.txt itself changes.
COPY ./requirements.txt /code/requirements.txt
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

# Download Gemma-2B model.
# Use the Hub's `/resolve/main/<file>` endpoint, which returns the raw file.
# The `/tree/main?...` URL is the HTML file-browser page: fetching it succeeds
# but stores an HTML document under the .gguf name, which only fails later
# when the model is loaded.
# The URL is quoted so the shell never treats it as a glob pattern.
# NOTE(review): if this repository requires authentication or licence
# acceptance, wget will exit non-zero here and the build will stop — confirm
# whether an access token has to be supplied at build time.
RUN wget -O /code/2b_it_v1p1.gguf \
    "https://huggingface.co/google/gemma-1.1-2b-it-GGUF/resolve/main/2b_it_v1p1.gguf"

# Application code is copied last: editing main.py does not invalidate the
# dependency or model layers above.
COPY ./main.py /code/main.py

# Documentation only (does not publish the port); matches --port in CMD.
EXPOSE 7860

# Exec form so uvicorn runs as PID 1 and receives stop signals directly.
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]