embedding / Dockerfile
zhengr's picture
Update Dockerfile
2333256 verified
raw
history blame
2.17 kB
# Legacy build (disabled, kept for reference): installs Ollama on a plain Ubuntu base
# FROM ubuntu:latest
# # Update packages and install curl and gnupg
# RUN apt-get update && apt-get install -y \
# curl \
# gnupg
# # Add NVIDIA package repositories
# RUN curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg \
# && echo "deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://nvidia.github.io/libnvidia-container/stable/deb/ $(. /etc/os-release; echo $UBUNTU_CODENAME) main" > /etc/apt/sources.list.d/nvidia-container-toolkit.list
# # Install NVIDIA container toolkit (Check for any updated methods or URLs for Ubuntu jammy)
# RUN apt-get update && apt-get install -y nvidia-container-toolkit || true
# # Install application
# RUN curl https://ollama.ai/install.sh | sh
# # Below works around the embedding bug by rewriting the installer's download URL to the v0.1.29 release
# # RUN curl -fsSL https://ollama.com/install.sh | sed 's#https://ollama.com/download#https://github.com/jmorganca/ollama/releases/download/v0.1.29#' | sh
# # Create the directory and give appropriate permissions
# RUN mkdir -p /.ollama && chmod 777 /.ollama
# WORKDIR /.ollama
# # Copy the entry point script
# COPY entrypoint.sh /entrypoint.sh
# RUN chmod +x /entrypoint.sh
# # Set the entry point script as the default command
# ENTRYPOINT ["/entrypoint.sh"]
# CMD ["ollama", "serve"]
# # Set the model as an environment variable (this can be overridden)
# ENV model=${model}
# Expose the server port
# Base image: the official Ollama Docker image, referenced by the explicit
# release tag 0.2.1 rather than a floating tag such as `latest`.
FROM ollama/ollama:0.2.1
# Install Python 3 and pip, then the LiteLLM proxy.
# - apt-get is used instead of apt: apt's command-line interface is not
#   guaranteed stable for scripted use.
# - update and install share one layer so the package index is never stale,
#   and the index is deleted in that same layer so it is not stored in the image.
# NOTE(review): --no-install-recommends is deliberately not added here; confirm
# that no LiteLLM dependency needs python3-pip's recommended build tooling
# before slimming this step.
RUN apt-get update \
    && apt-get install -y \
        python3 \
        python3-pip \
    && rm -rf /var/lib/apt/lists/*
# The 'proxy' extra installs litellm itself plus the proxy dependencies, so a
# separate plain `pip install litellm` is redundant. --no-cache-dir keeps pip's
# download cache out of the image layer.
# NOTE(review): litellm is unpinned, so rebuilds may pick up a newer release;
# consider pinning a known-good version.
RUN pip install --no-cache-dir 'litellm[proxy]'
# Ollama data directory: create /.ollama and open its permissions recursively
# (mode 777), then make it the working directory for the following
# instructions and for the running container.
# NOTE(review): the world-writable mode is presumably there so a non-root
# runtime user can write to it — confirm before tightening.
RUN mkdir -p /.ollama && chmod -R 777 /.ollama
WORKDIR /.ollama
# Copy the entrypoint script into the image root and mark it executable in the
# same instruction. Setting the mode with --chmod (requires BuildKit) avoids a
# follow-up `RUN chmod`, which would store a second copy of the file in an
# extra layer.
COPY --chmod=755 entrypoint.sh /entrypoint.sh
# Run the wrapper script as the container's entrypoint. Exec (JSON-array) form
# is used, so the script is started directly rather than through `/bin/sh -c`.
ENTRYPOINT ["/entrypoint.sh"]
# Model name, exposed to the running container as $model.
# ARG declares the build argument so that `--build-arg model=<name>` actually
# reaches the ENV below; without this declaration ${model} is undefined at
# build time and always expands to an empty string. With no build argument the
# value is still empty, and it can be overridden at run time (`-e model=<name>`).
ARG model
ENV model=${model}
# Document the port the container is expected to listen on. EXPOSE does not
# publish the port by itself.
# NOTE(review): Ollama's own default port is 11434; 7860 is presumably the port
# bound by entrypoint.sh — confirm against that script.
EXPOSE 7860
# Default argument handed to /entrypoint.sh ("serve"); it is replaced by any
# arguments supplied to `docker run`.
CMD ["serve"]