| |
| FROM ubuntu:22.04 AS base |
| USER root |
| SHELL ["/bin/bash", "-c"] |
|
|
| ENV LIGHTEN=1 |
|
|
| WORKDIR /ragflow |
|
|
| RUN rm -f /etc/apt/apt.conf.d/docker-clean \ |
| && echo 'Binary::apt::APT::Keep-Downloaded-Packages "true";' > /etc/apt/apt.conf.d/keep-cache |
|
|
| RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \ |
| apt update && apt-get --no-install-recommends install -y ca-certificates |
|
|
| |
| RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list |
|
|
| RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \ |
| apt update && DEBIAN_FRONTEND=noninteractive apt install -y curl libpython3-dev nginx libglib2.0-0 libglx-mesa0 pkg-config libicu-dev libgdiplus default-jdk python3-pip pipx \ |
| libatk-bridge2.0-0 libgtk-4-1 libnss3 xdg-utils unzip libgbm-dev wget git \ |
| && rm -rf /var/lib/apt/lists/* |
|
|
| RUN pip3 config set global.index-url https://pypi.tuna.tsinghua.edu.cn/simple && pip3 config set global.trusted-host "pypi.tuna.tsinghua.edu.cn mirrors.pku.edu.cn" && pip3 config set global.extra-index-url "https://mirrors.pku.edu.cn/pypi/web/simple" \ |
| && pipx install poetry \ |
| && /root/.local/bin/poetry self add poetry-plugin-pypi-mirror |
|
|
| |
| |
| RUN --mount=type=bind,source=libssl1.1_1.1.1f-1ubuntu2_amd64.deb,target=/root/libssl1.1_1.1.1f-1ubuntu2_amd64.deb \ |
| --mount=type=bind,source=libssl1.1_1.1.1f-1ubuntu2_arm64.deb,target=/root/libssl1.1_1.1.1f-1ubuntu2_arm64.deb \ |
| if [ "$(uname -m)" = "x86_64" ]; then \ |
| dpkg -i /root/libssl1.1_1.1.1f-1ubuntu2_amd64.deb; \ |
| elif [ "$(uname -m)" = "aarch64" ]; then \ |
| dpkg -i /root/libssl1.1_1.1.1f-1ubuntu2_arm64.deb; \ |
| fi |
|
|
| ENV PYTHONDONTWRITEBYTECODE=1 DOTNET_SYSTEM_GLOBALIZATION_INVARIANT=1 |
| ENV PATH=/root/.local/bin:$PATH |
| |
| ENV POETRY_NO_INTERACTION=1 |
| ENV POETRY_VIRTUALENVS_IN_PROJECT=true |
| ENV POETRY_VIRTUALENVS_CREATE=true |
| ENV POETRY_REQUESTS_TIMEOUT=15 |
| ENV POETRY_PYPI_MIRROR_URL=https://pypi.tuna.tsinghua.edu.cn/simple/ |
|
|
| |
| RUN --mount=type=cache,id=ragflow_base_apt,target=/var/cache/apt,sharing=locked \ |
| curl -fsSL https://deb.nodesource.com/setup_20.x | bash - && \ |
| apt purge -y nodejs npm && \ |
| apt autoremove && \ |
| apt update && \ |
| apt install -y nodejs cargo && \ |
| rm -rf /var/lib/apt/lists/* |
|
|
| |
| FROM base AS builder |
| USER root |
|
|
| WORKDIR /ragflow |
|
|
| COPY .git /ragflow/.git |
|
|
| RUN current_commit=$(git rev-parse --short HEAD); \ |
| last_tag=$(git describe --tags --abbrev=0); \ |
| commit_count=$(git rev-list --count "$last_tag..HEAD"); \ |
| version_info=""; \ |
| if [ "$commit_count" -eq 0 ]; then \ |
| version_info=$last_tag; \ |
| else \ |
| version_info="$current_commit($last_tag~$commit_count)"; \ |
| fi; \ |
| if [ "$LIGHTEN" == "1" ]; then \ |
| version_info="$version_info slim"; \ |
| else \ |
| version_info="$version_info full"; \ |
| fi; \ |
| echo "RAGFlow version: $version_info"; \ |
| echo $version_info > /ragflow/VERSION |
|
|
| COPY web web |
| COPY docs docs |
| RUN --mount=type=cache,id=ragflow_builder_npm,target=/root/.npm,sharing=locked \ |
| cd web && npm install --force && npm run build |
|
|
| |
| COPY pyproject.toml poetry.toml poetry.lock ./ |
|
|
| RUN --mount=type=cache,id=ragflow_builder_poetry,target=/root/.cache/pypoetry,sharing=locked \ |
| if [ "$LIGHTEN" == "1" ]; then \ |
| poetry install --no-root; \ |
| else \ |
| poetry install --no-root --with=full; \ |
| fi |
|
|
| |
| FROM base AS production |
| USER root |
|
|
| WORKDIR /ragflow |
|
|
| COPY --from=builder /ragflow/VERSION /ragflow/VERSION |
|
|
| |
| |
| RUN --mount=type=cache,id=ragflow_production_apt,target=/var/cache/apt,sharing=locked \ |
| apt update && apt install -y --no-install-recommends nginx libgl1 vim less && \ |
| rm -rf /var/lib/apt/lists/* |
|
|
| COPY web web |
| COPY api api |
| COPY conf conf |
| COPY deepdoc deepdoc |
| COPY rag rag |
| COPY agent agent |
| COPY graphrag graphrag |
| COPY pyproject.toml poetry.toml poetry.lock ./ |
|
|
| |
| RUN mkdir -p /ragflow/rag/res/deepdoc /root/.ragflow |
| RUN --mount=type=bind,source=huggingface.co,target=/huggingface.co \ |
| tar --exclude='.*' -cf - \ |
| /huggingface.co/InfiniFlow/text_concat_xgb_v1.0 \ |
| /huggingface.co/InfiniFlow/deepdoc \ |
| | tar -xf - --strip-components=3 -C /ragflow/rag/res/deepdoc |
|
|
| |
| COPY nltk_data /root/nltk_data |
|
|
| |
| |
| COPY tika-server-standard-3.0.0.jar /ragflow/tika-server-standard.jar |
| COPY tika-server-standard-3.0.0.jar.md5 /ragflow/tika-server-standard.jar.md5 |
| ENV TIKA_SERVER_JAR="file:///ragflow/tika-server-standard.jar" |
|
|
| |
| COPY cl100k_base.tiktoken /ragflow/9b5ad71b2ce5302211f9c61530b329a4922fc6a4 |
|
|
| |
| RUN --mount=type=bind,source=chrome-linux64-121-0-6167-85,target=/chrome-linux64.zip \ |
| unzip /chrome-linux64.zip && \ |
| mv chrome-linux64 /opt/chrome && \ |
| ln -s /opt/chrome/chrome /usr/local/bin/ |
| RUN --mount=type=bind,source=chromedriver-linux64-121-0-6167-85,target=/chromedriver-linux64.zip \ |
| unzip -j /chromedriver-linux64.zip chromedriver-linux64/chromedriver && \ |
| mv chromedriver /usr/local/bin/ && \ |
| rm -f /usr/bin/google-chrome |
|
|
| |
| COPY --from=builder /ragflow/web/dist /ragflow/web/dist |
|
|
| |
| ENV VIRTUAL_ENV=/ragflow/.venv |
| COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV} |
| ENV PATH="${VIRTUAL_ENV}/bin:${PATH}" |
|
|
| ENV PYTHONPATH=/ragflow/ |
|
|
| COPY docker/service_conf.yaml.template ./conf/service_conf.yaml.template |
| COPY docker/entrypoint.sh ./entrypoint.sh |
| RUN chmod +x ./entrypoint.sh |
|
|
| ENTRYPOINT ["./entrypoint.sh"] |
|
|