# Guido Schmutz
# Dynamically create the service_conf.yaml file by replacing environment variables from .env (#3341)
# 49f80bf
# base stage: common OS layer that both the builder and production stages start from
FROM ubuntu:24.04 AS base
USER root

# Target architecture; later in this stage only the value "amd64" is tested.
ARG ARCH=amd64
# Read by the builder stage: 0 installs the extra "full" Poetry group, any other value skips it.
ENV LIGHTEN=1

WORKDIR /ragflow

# Drop the image's docker-clean apt hook and keep downloaded packages, so the
# apt cache mounts used by the following RUN steps actually retain the .deb files.
RUN rm -f /etc/apt/apt.conf.d/docker-clean \
    && echo 'Binary::apt::APT::Keep-Downloaded-Packages "true";' > /etc/apt/apt.conf.d/keep-cache
# Install CA certificates before the apt sources are switched to an HTTPS mirror below
# (presumably so apt can validate that mirror's TLS certificate).
RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \
    apt-get update && apt-get --no-install-recommends install -y ca-certificates

# If package downloads are too slow, mirror sites can be used to speed up apt, pip and poetry.
# This step rewrites the Ubuntu archive URL to the TUNA mirror.
RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list.d/ubuntu.sources
# Install system libraries and tools, then download Chrome and chromedriver, placing
# chrome under /opt/chrome (symlinked into /usr/local/bin) and chromedriver in /usr/local/bin.
# NOTE(review): both archives are fetched through bit.ly short links without any
# checksum verification; consider pinning the final URLs and checking a SHA-256.
RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \
    apt-get update && apt-get install -y \
        curl \
        default-jdk \
        libasound2t64 \
        libatk-bridge2.0-0 \
        libgbm-dev \
        libgdiplus \
        libglib2.0-0 \
        libglx-mesa0 \
        libgtk-4-1 \
        libicu-dev \
        libnss3 \
        libpython3-dev \
        nginx \
        pipx \
        pkg-config \
        python3-pip \
        unzip \
        wget \
        xdg-utils \
    && rm -rf /var/lib/apt/lists/* \
    && wget -q -O chrome-linux64.zip https://bit.ly/chrome-linux64-121-0-6167-85 \
    && unzip chrome-linux64.zip \
    && rm chrome-linux64.zip \
    && mv chrome-linux64 /opt/chrome/ \
    && ln -s /opt/chrome/chrome /usr/local/bin/ \
    && wget -q -O chromedriver-linux64.zip https://bit.ly/chromedriver-linux64-121-0-6167-85 \
    && unzip -j chromedriver-linux64.zip chromedriver-linux64/chromedriver \
    && rm chromedriver-linux64.zip \
    && mv chromedriver /usr/local/bin/ \
    && rm -f /usr/bin/google-chrome
# Point pip at the TUNA index (with the PKU mirror as an extra index), then install
# Poetry through pipx and add the poetry-plugin-pypi-mirror plugin.
# Poetry is invoked by absolute path because /root/.local/bin is only put on PATH
# by an ENV instruction further down in this stage.
RUN pip3 config set global.index-url https://pypi.tuna.tsinghua.edu.cn/simple \
    && pip3 config set global.trusted-host "pypi.tuna.tsinghua.edu.cn mirrors.pku.edu.cn" \
    && pip3 config set global.extra-index-url "https://mirrors.pku.edu.cn/pypi/web/simple" \
    && pipx install poetry \
    && /root/.local/bin/poetry self add poetry-plugin-pypi-mirror
# https://forum.aspose.com/t/aspose-slides-for-net-no-usable-version-of-libssl-found-with-linux-server/271344/13
# aspose-slides on linux/arm64 is unavailable, so libssl1.1 is installed only when ARCH is amd64.
# The .deb is bind-mounted from the build context for this step only, so the package file
# itself is not copied into an image layer.
RUN --mount=type=bind,source=libssl1.1_1.1.1f-1ubuntu2_amd64.deb,target=/root/libssl1.1_1.1.1f-1ubuntu2_amd64.deb \
    if [ "${ARCH}" = "amd64" ]; then \
        dpkg -i /root/libssl1.1_1.1.1f-1ubuntu2_amd64.deb; \
    fi
# Runtime switches for Python and .NET.
ENV PYTHONDONTWRITEBYTECODE=1 \
    DOTNET_SYSTEM_GLOBALIZATION_INVARIANT=1

# Make tools under /root/.local/bin (where poetry is invoked from earlier in this stage)
# available on PATH.
ENV PATH=/root/.local/bin:$PATH

# Configure Poetry: non-interactive, create the virtualenv inside the project
# directory, 15 second request timeout, and use the TUNA PyPI mirror.
ENV POETRY_NO_INTERACTION=1 \
    POETRY_VIRTUALENVS_IN_PROJECT=true \
    POETRY_VIRTUALENVS_CREATE=true \
    POETRY_REQUESTS_TIMEOUT=15 \
    POETRY_PYPI_MIRROR_URL=https://pypi.tuna.tsinghua.edu.cn/simple/
# builder stage: builds the web front end and the Python virtualenv that the
# production stage later copies with COPY --from=builder
FROM base AS builder
USER root

WORKDIR /ragflow

# Build-only toolchain: Node.js/npm for the web build, plus cargo
# (presumably for Python dependencies that compile Rust code — confirm).
RUN --mount=type=cache,id=ragflow_builder_apt,target=/var/cache/apt,sharing=locked \
    apt-get update && apt-get install -y \
        cargo \
        nodejs \
        npm \
    && rm -rf /var/lib/apt/lists/*
# Copy the front-end sources and build them; the result in web/dist is what the
# production stage copies out of this stage.
# NOTE(review): docs is copied alongside web, presumably because the web build reads it — confirm.
COPY web web
COPY docs docs
# The npm download cache is kept in a BuildKit cache mount so rebuilds do not re-fetch packages.
RUN --mount=type=cache,id=ragflow_builder_npm,target=/root/.npm,sharing=locked \
    cd web \
    && npm i \
    && npm run build
# Install Python dependencies from the poetry.lock file (the project itself is
# not installed because of --no-root).
COPY pyproject.toml poetry.toml poetry.lock ./
# LIGHTEN is inherited from the base stage: 0 additionally installs the "full"
# dependency group, any other value installs only the default dependencies.
RUN --mount=type=cache,id=ragflow_builder_poetry,target=/root/.cache/pypoetry,sharing=locked \
    if [ "$LIGHTEN" -eq 0 ]; then \
        poetry install --no-root --with=full; \
    else \
        poetry install --no-root; \
    fi
# production stage: final runtime image, built on base and filled with artifacts from builder
FROM base AS production
USER root

WORKDIR /ragflow

# Install python packages' dependencies
# cv2 requires libGL.so.1 (provided here by libgl1).
# NOTE(review): vim and less are interactive tools, and nginx is already installed
# in the base stage; consider trimming this list if they are not needed at runtime.
RUN --mount=type=cache,id=ragflow_production_apt,target=/var/cache/apt,sharing=locked \
    apt-get update && apt-get install -y --no-install-recommends \
        less \
        libgl1 \
        nginx \
        vim \
    && rm -rf /var/lib/apt/lists/*
# Copy the application source directories and the Poetry project files into /ragflow.
COPY web web
COPY api api
COPY conf conf
COPY deepdoc deepdoc
COPY rag rag
COPY agent agent
COPY graphrag graphrag
COPY pyproject.toml poetry.toml poetry.lock ./
# Copy models downloaded via download_deps.py
RUN mkdir -p /ragflow/rag/res/deepdoc /root/.ragflow
# The huggingface.co directory is bind-mounted from the build context for this step only.
# Both model directories are streamed through tar: hidden entries ('.*') are skipped, and
# --strip-components=3 removes the huggingface.co/InfiniFlow/<model> prefix, so the files
# of both models land directly in /ragflow/rag/res/deepdoc.
RUN --mount=type=bind,source=huggingface.co,target=/huggingface.co \
    tar --exclude='.*' -cf - \
        /huggingface.co/InfiniFlow/text_concat_xgb_v1.0 \
        /huggingface.co/InfiniFlow/deepdoc \
    | tar -xf - --strip-components=3 -C /ragflow/rag/res/deepdoc
# Copy nltk data downloaded via download_deps.py
COPY nltk_data /root/nltk_data

# https://github.com/chrismattmann/tika-python
# This is the only way to run python-tika without internet access. Without this set, the default is to check the tika version and pull latest every time from Apache.
COPY tika-server-standard-3.0.0.jar tika-server-standard-3.0.0.jar.md5 ./
# The path must name the jar exactly as it was copied above (including the version),
# otherwise TIKA_SERVER_JAR points at a file that does not exist in the image.
ENV TIKA_SERVER_JAR="file:///ragflow/tika-server-standard-3.0.0.jar"
# Copy compiled web pages
COPY --from=builder /ragflow/web/dist /ragflow/web/dist

# Copy Python environment and packages: the virtualenv from the builder stage is
# copied to the same path here.
ENV VIRTUAL_ENV=/ragflow/.venv
COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV}
# Put the virtualenv's executables first on PATH and make /ragflow importable.
ENV PATH="${VIRTUAL_ENV}/bin:${PATH}"
ENV PYTHONPATH=/ragflow/
# Ship the service_conf.yaml template (not a finished config file) together with
# the entrypoint script, and make the script executable.
# NOTE(review): presumably entrypoint.sh renders service_conf.yaml from this template
# using environment variables at container start — confirm against the script.
COPY docker/service_conf.yaml.template ./conf/service_conf.yaml.template
COPY docker/entrypoint.sh ./entrypoint.sh
RUN chmod +x ./entrypoint.sh

# Exec form; the relative path resolves against WORKDIR /ragflow.
ENTRYPOINT ["./entrypoint.sh"]