# ----- Builder stage (legacy, disabled) -----
# FROM ubuntu:latest
#
# # Update packages and install curl and gnupg
# RUN apt-get update && apt-get install -y \
#     curl \
#     gnupg
#
# # Add the NVIDIA package repositories
# RUN curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg \
#     && echo "deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://nvidia.github.io/libnvidia-container/stable/deb/ $(. /etc/os-release; echo $UBUNTU_CODENAME) main" > /etc/apt/sources.list.d/nvidia-container-toolkit.list
#
# # Install the NVIDIA container toolkit (check for updated methods or URLs for Ubuntu jammy)
# RUN apt-get update && apt-get install -y nvidia-container-toolkit || true
#
# # Install the application
# RUN curl https://ollama.ai/install.sh | sh
#
# # Workaround for an embedding bug: pin the install to a known release
# # RUN curl -fsSL https://ollama.com/install.sh | sed 's#https://ollama.com/download#https://github.com/jmorganca/ollama/releases/download/v0.1.29#' | sh
#
# # Create the data directory and give it open permissions
# RUN mkdir -p /.ollama && chmod 777 /.ollama
# WORKDIR /.ollama
#
# # Copy the entrypoint script
# COPY entrypoint.sh /entrypoint.sh
# RUN chmod +x /entrypoint.sh
#
# # Set the entrypoint script as the default command
# ENTRYPOINT ["/entrypoint.sh"]
# CMD ["ollama", "serve"]
#
# # Set the model as an environment variable (this can be overridden)
# ENV model=${model}
# ---------------------------------------------

# Use the official Ollama Docker image as the base image
FROM ollama/ollama:0.2.1

# Install Python and the LiteLLM proxy ('litellm[proxy]' already pulls in litellm itself)
RUN apt-get update && apt-get install -y python3 python3-pip
RUN pip install 'litellm[proxy]'

# Create a directory for Ollama data
RUN mkdir -p /.ollama && chmod -R 777 /.ollama
WORKDIR /.ollama

# Copy the entrypoint script
COPY entrypoint.sh /entrypoint.sh
RUN chmod +x /entrypoint.sh

# Set the entrypoint script as the default command
ENTRYPOINT ["/entrypoint.sh"]

# Set the model as an environment variable (ARG supplies a build-time default;
# the resulting ENV can still be overridden at run time with -e model=...)
ARG model
ENV model=${model}

# Expose the server port (7860, e.g. for Hugging Face Spaces; Ollama itself defaults to 11434)
EXPOSE 7860

# Command passed to the entrypoint to start the Ollama server
CMD ["serve"]
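
# -----------------------------------------------------------------------------
# The entrypoint.sh copied above is not shown in this repository snippet. A
# minimal sketch of a script that would fit this image's layout is given below
# as a comment (hypothetical -- the script name, wait strategy, and model name
# are assumptions, not the actual implementation; adjust to your own script):
#
#   #!/bin/sh
#   # Start the Ollama server in the background ("$@" is "serve" from CMD above),
#   # pull the requested model if one was set, then run the LiteLLM proxy in
#   # front of it on the exposed port.
#   export OLLAMA_HOST=0.0.0.0:11434
#   ollama "$@" &
#   sleep 5                                  # crude wait for the server to come up
#   if [ -n "$model" ]; then ollama pull "$model"; fi
#   exec litellm --model "ollama/${model}" --port 7860
#
# Example build and run (image tag and model name are illustrative only):
#
#   docker build --build-arg model=llama3 -t ollama-litellm .
#   docker run -p 7860:7860 -e model=llama3 ollama-litellm
# -----------------------------------------------------------------------------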