- # base stage
- FROM ubuntu:24.04 AS base
- USER root
-
- ENV LIGHTEN=0
-
- WORKDIR /ragflow
-
- RUN rm -f /etc/apt/apt.conf.d/docker-clean \
- && echo 'Binary::apt::APT::Keep-Downloaded-Packages "true";' > /etc/apt/apt.conf.d/keep-cache
-
- RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
- apt update && apt-get --no-install-recommends install -y ca-certificates
-
- # if you located in China, you can use tsinghua mirror to speed up apt
- RUN sed -i 's|http://archive.ubuntu.com|https://mirrors.tuna.tsinghua.edu.cn|g' /etc/apt/sources.list.d/ubuntu.sources
-
- RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
- apt update && apt install -y curl libpython3-dev nginx libglib2.0-0 libglx-mesa0 pkg-config libicu-dev libgdiplus \
- && rm -rf /var/lib/apt/lists/* \
- && curl -sSL https://install.python-poetry.org | python3 -
-
- RUN curl -o libssl1.deb http://archive.ubuntu.com/ubuntu/pool/main/o/openssl1.0/libssl1.0.0_1.0.2n-1ubuntu5_amd64.deb && dpkg -i libssl1.deb && rm -f libssl1.deb
-
- ENV PYTHONDONTWRITEBYTECODE=1 DOTNET_SYSTEM_GLOBALIZATION_INVARIANT=1
-
- # Configure Poetry
- ENV POETRY_NO_INTERACTION=1
- ENV POETRY_VIRTUALENVS_IN_PROJECT=true
- ENV POETRY_VIRTUALENVS_CREATE=true
- ENV POETRY_REQUESTS_TIMEOUT=15
-
- # builder stage
- FROM base AS builder
- USER root
-
- WORKDIR /ragflow
-
- RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
- apt update && apt install -y nodejs npm cargo && \
- rm -rf /var/lib/apt/lists/*
-
- COPY web web
- RUN cd web && npm i --force && npm run build
-
- # install dependencies from poetry.lock file
- COPY pyproject.toml poetry.toml poetry.lock ./
-
- RUN --mount=type=cache,target=/root/.cache/pypoetry,sharing=locked \
- if [ "$LIGHTEN" -eq 0 ]; then \
- /root/.local/bin/poetry install --sync --no-cache --no-root --with=full; \
- else \
- /root/.local/bin/poetry install --sync --no-cache --no-root; \
- fi
-
- # production stage
- FROM base AS production
- USER root
-
- WORKDIR /ragflow
-
- # Install python packages' dependencies
- # cv2 requires libGL.so.1
- RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \
- apt update && apt install -y --no-install-recommends nginx libgl1 vim less && \
- rm -rf /var/lib/apt/lists/*
-
- COPY web web
- COPY api api
- COPY conf conf
- COPY deepdoc deepdoc
- COPY rag rag
- COPY agent agent
- COPY graphrag graphrag
- COPY pyproject.toml poetry.toml poetry.lock ./
-
- # Copy models downloaded via download_deps.py
- RUN mkdir -p /ragflow/rag/res/deepdoc /root/.ragflow
- RUN --mount=type=bind,source=huggingface.co,target=/huggingface.co \
- tar --exclude='.*' -cf - \
- /huggingface.co/InfiniFlow/text_concat_xgb_v1.0 \
- /huggingface.co/InfiniFlow/deepdoc \
- | tar -xf - --strip-components=3 -C /ragflow/rag/res/deepdoc
- RUN --mount=type=bind,source=huggingface.co,target=/huggingface.co \
- tar -cf - \
- /huggingface.co/BAAI/bge-large-zh-v1.5 \
- /huggingface.co/BAAI/bge-reranker-v2-m3 \
- /huggingface.co/maidalun1020/bce-embedding-base_v1 \
- /huggingface.co/maidalun1020/bce-reranker-base_v1 \
- | tar -xf - --strip-components=2 -C /root/.ragflow
-
- # Copy compiled web pages
- COPY --from=builder /ragflow/web/dist /ragflow/web/dist
-
- # Copy Python environment and packages
- ENV VIRTUAL_ENV=/ragflow/.venv
- COPY --from=builder ${VIRTUAL_ENV} ${VIRTUAL_ENV}
- ENV PATH="${VIRTUAL_ENV}/bin:/root/.local/bin:${PATH}"
-
- # Download nltk data
- RUN python3 -m nltk.downloader wordnet punkt punkt_tab
-
- ENV PYTHONPATH=/ragflow/
-
- COPY docker/entrypoint.sh ./entrypoint.sh
- RUN chmod +x ./entrypoint.sh
-
- ENTRYPOINT ["./entrypoint.sh"]
|