# Image recipe: copies the build context into /workspace, runs
# docker_build_script_ubuntu.sh to provision it, creates an unprivileged
# account, and starts generate.py under that account.

# devel needed for bitsandbytes requirement of libcudart.so, otherwise runtime sufficient
FROM nvidia/cuda:11.8.0-cudnn8-devel-ubuntu20.04

# Build-time only: ARG values are exported to RUN steps, so the build script
# still sees a non-interactive frontend, but the setting is not baked into the
# environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive

# Put /h2ogpt_conda/bin first on PATH for both build steps and the runtime.
# NOTE(review): presumably docker_build_script_ubuntu.sh installs the Python
# environment under /h2ogpt_conda -- confirm against that script.
ENV PATH="/h2ogpt_conda/bin:${PATH}"
# Kept for backward compatibility with existing `--build-arg PATH=...` usage;
# an ENV of the same name takes precedence over this ARG inside RUN steps.
ARG PATH="/h2ogpt_conda/bin:${PATH}"

ENV HOME=/workspace \
    CUDA_HOME=/usr/local/cuda-11.8 \
    VLLM_CACHE=/workspace/.vllm_cache

WORKDIR /workspace

COPY . /workspace/

# WORKDIR is already /workspace, so no `cd` is needed. The recursive chmod runs
# in the same layer as the build script so files the script creates are not
# duplicated into an additional layer just to change their mode.
# NOTE(review): a+rwx on the whole tree is very permissive; presumably it is
# there so the container can also be started under an arbitrary uid -- confirm
# before tightening.
RUN chmod +x ./docker_build_script_ubuntu.sh \
    && ./docker_build_script_ubuntu.sh \
    && chmod -R a+rwx /workspace

# Unprivileged runtime account; name and ids can be overridden with --build-arg.
ARG user=h2ogpt
ARG group=h2ogpt
ARG uid=1000
ARG gid=1000
RUN groupadd -g ${gid} ${group} \
    && useradd -u ${uid} -g ${group} -s /bin/bash ${user}

EXPOSE 8888
EXPOSE 7860
EXPOSE 5000

# Follow the `user` build argument so that overriding it does not leave USER
# pointing at an account that was never created.
USER ${user}

# ENTRYPOINT ["python3.10"]

CMD ["python3.10", "generate.py", "--load_8bit", "True", "--base_model", "h2oai/h2ogpt-4096-llama2-7b-chat"]