feat: add mineru more images

2026-02-10 17:45:39 +08:00
parent 60d566d050
commit ced072de66
13 changed files with 309 additions and 6 deletions
@@ -16,6 +16,9 @@
  "[yaml]": {
    "editor.formatOnSave": true
  },
+  "[dockerfile]": {
+    "editor.formatOnSave": true
+  },
  "[dockercompose]": {
    "editor.formatOnSave": true
  },
@@ -1,5 +1,5 @@
 # MinerU Docker image
-MINERU_VERSION=2.7.3
+MINERU_VERSION=2.7.6

 # Port configurations
 MINERU_PORT_OVERRIDE_VLLM=30000
@@ -0,0 +1,27 @@
+# Base image: vLLM inference environment for amd64 (x86-64) hosts with an iluvatar GPU.
+FROM crpi-vofi3w62lkohhxsp.cn-shanghai.personal.cr.aliyuncs.com/opendatalab-mineru/corex:4.4.0_torch2.7.1_vllm0.11.2_py3.10
+
+
+# Noto fonts so Chinese characters render; font cache rebuilt and apt lists removed in the same layer
+RUN apt-get update \
+  && apt-get install --yes \
+    fontconfig \
+    fonts-noto-cjk \
+    fonts-noto-core \
+  && fc-cache -fv \
+  && apt-get clean \
+  && rm -rf /var/lib/apt/lists/*
+
+# Upgrade pip, install MinerU with pinned numpy/opencv from the Aliyun PyPI mirror, then purge the pip cache
+RUN python3 -m pip install --upgrade pip --index-url https://mirrors.aliyun.com/pypi/simple \
+  && python3 -m pip install "mineru[core]>=2.7.4" \
+    numpy==1.26.4 \
+    opencv-python==4.11.0.86 \
+    --index-url https://mirrors.aliyun.com/pypi/simple \
+  && python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,34 @@
+# Base image containing the vLLM inference environment, requiring amd64(x86-64) CPU + Hygon DCU.
+FROM harbor.sourcefind.cn:5443/dcu/admin/base/vllm:0.9.2-ubuntu22.04-dtk25.04.2-1226-das1.7-py3.10-20251226
+
+
+# Install Noto fonts for Chinese characters; rebuild the font cache and drop apt lists in the same layer
+RUN apt-get update && \
+  apt-get install -y \
+  fonts-noto-core \
+  fonts-noto-cjk \
+  fontconfig && \
+  fc-cache -fv && \
+  apt-get clean && \
+  rm -rf /var/lib/apt/lists/*
+
+# Install MinerU (api + gradio extras) and pinned deps; every spec with [ ] < > is quoted so the shell cannot glob or redirect on it
+RUN python3 -m pip install -U pip -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip install "mineru[api,gradio]" \
+  "matplotlib>=3.10,<4" \
+  "ultralytics>=8.3.48,<9" \
+  "doclayout_yolo==0.0.4" \
+  "ftfy>=6.3.1,<7" \
+  "shapely>=2.0.7,<3" \
+  "pyclipper>=1.3.0,<2" \
+  "omegaconf>=2.3.0,<3" \
+  numpy==1.25.0 \
+  opencv-python==4.11.0.86 \
+  -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -11,7 +11,7 @@ x-mineru-vllm: &mineru-vllm
  image: ${GLOBAL_REGISTRY:-}alexsuntop/mineru:${MINERU_VERSION:-2.7.6}
  build:
    context: .
-    dockerfile: Dockerfile
+    dockerfile: ${MINERU_DOCKERFILE_PATH:-Dockerfile}
    platforms:
      - linux/amd64
      - linux/arm64
@@ -0,0 +1,30 @@
+# Base image containing the vLLM inference environment, requiring amd64(x86-64) CPU + Enflame GCU.
+FROM crpi-vofi3w62lkohhxsp.cn-shanghai.personal.cr.aliyuncs.com/opendatalab-mineru/gcu:docker_images_topsrider_i3x_3.6.20260106_vllm0.11_pytorch2.8.0
+
+
+# Install Noto fonts via a temporary Aliyun (Ubuntu noble) source list; printf writes one entry per line regardless of which shell /bin/sh is
+RUN printf '%s\n' 'deb http://mirrors.aliyun.com/ubuntu/ noble main restricted universe multiverse' \
+  'deb http://mirrors.aliyun.com/ubuntu/ noble-updates main restricted universe multiverse' \
+  'deb http://mirrors.aliyun.com/ubuntu/ noble-backports main restricted universe multiverse' \
+  'deb http://mirrors.aliyun.com/ubuntu/ noble-security main restricted universe multiverse' > /tmp/aliyun-sources.list && \
+  apt-get -o Dir::Etc::SourceList=/tmp/aliyun-sources.list update && \
+  apt-get -o Dir::Etc::SourceList=/tmp/aliyun-sources.list install -y \
+  fonts-noto-core \
+  fonts-noto-cjk \
+  fontconfig && \
+  fc-cache -fv && \
+  apt-get clean && \
+  rm -rf /var/lib/apt/lists/* /tmp/aliyun-sources.list
+
+# Install MinerU with pinned numpy/opencv from the Aliyun PyPI mirror, then purge the pip cache
+RUN python3 -m pip install "mineru[core]>=2.7.2" \
+  numpy==1.26.4 \
+  opencv-python==4.11.0.86 \
+  -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,33 @@
+# Base image containing the vLLM inference environment, requiring amd64(x86-64) CPU + Kunlun XPU.
+FROM docker.1ms.run/wjie520/vllm_kunlun:v0.10.1.1rc1
+
+
+# Install Noto fonts for Chinese characters; rebuild the font cache and drop apt lists in the same layer
+RUN apt-get update && \
+  apt-get install -y \
+  fonts-noto-core \
+  fonts-noto-cjk \
+  fontconfig && \
+  fc-cache -fv && \
+  apt-get clean && \
+  rm -rf /var/lib/apt/lists/*
+
+# Install MinerU, then patch vllm_kunlun's qwen2_vl.py (lines 1-200 only): "self.act = act_layer()" becomes "self.act = nn.GELU()"
+RUN python3 -m pip install -U pip -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip install "mineru[api,gradio]>=2.7.6" \
+  "matplotlib>=3.10,<4" \
+  "ultralytics>=8.3.48,<9" \
+  "doclayout_yolo==0.0.4" \
+  "ftfy>=6.3.1,<7" \
+  "shapely>=2.0.7,<3" \
+  "pyclipper>=1.3.0,<2" \
+  "omegaconf>=2.3.0,<3" \
+  -i https://mirrors.aliyun.com/pypi/simple && \
+  sed -i '1,200{s/self\.act = act_layer()/self.act = nn.GELU()/;t;b};' /root/miniconda/envs/vllm_kunlun_0.10.1.1/lib/python3.10/site-packages/vllm_kunlun/models/qwen2_vl.py && \
+  python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,34 @@
+# Two base images are offered (vLLM or LMDeploy inference environment); enable exactly one as needed. Requires an amd64 (x86-64) CPU + metax GPU.
+# Base image containing the vLLM inference environment, requiring amd64(x86-64) CPU + metax GPU.
+FROM cr.metax-tech.com/public-ai-release/maca/vllm:maca.ai3.1.0.7-torch2.6-py310-ubuntu22.04-amd64
+# Base image containing the LMDeploy inference environment, requiring amd64(x86-64) CPU + metax GPU.
+# FROM crpi-vofi3w62lkohhxsp.cn-shanghai.personal.cr.aliyuncs.com/opendatalab-mineru/maca:maca.ai3.1.0.7-torch2.6-py310-ubuntu22.04-lmdeploy0.10.2-amd64
+
+# Install libgl for opencv support & Noto fonts for Chinese characters
+RUN apt-get update && \
+  apt-get install -y \
+  fonts-noto-core \
+  fonts-noto-cjk \
+  fontconfig \
+  libgl1 && \
+  fc-cache -fv && \
+  apt-get clean && \
+  rm -rf /var/lib/apt/lists/*
+
+# Relabel the installed torchvision dist-info (METADATA line 3 and the directory name) from 0.15.1 to 0.21.0 so it is reported as compatible with torch 2.6
+RUN sed -i '3s/^Version: 0.15.1+metax3\.1\.0\.4$/Version: 0.21.0+metax3.1.0.4/' /opt/conda/lib/python3.10/site-packages/torchvision-0.15.1+metax3.1.0.4.dist-info/METADATA && \
+  mv /opt/conda/lib/python3.10/site-packages/torchvision-0.15.1+metax3.1.0.4.dist-info /opt/conda/lib/python3.10/site-packages/torchvision-0.21.0+metax3.1.0.4.dist-info
+
+# Install MinerU with the conda interpreter at /opt/conda/bin/python3, using the Aliyun PyPI mirror, then purge the pip cache
+RUN /opt/conda/bin/python3 -m pip install -U pip -i https://mirrors.aliyun.com/pypi/simple && \
+  /opt/conda/bin/python3 -m pip install 'mineru[core]>=2.6.5' \
+  numpy==1.26.4 \
+  opencv-python==4.11.0.86 \
+  -i https://mirrors.aliyun.com/pypi/simple && \
+  /opt/conda/bin/python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "/opt/conda/bin/mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,42 @@
+# Two base images are offered (vLLM or LMDeploy); enable exactly one FROM/ARG pair as needed. Requires an amd64 (x86-64) CPU + Cambricon MLU.
+# Base image containing the LMDeploy inference environment, requiring amd64(x86-64) CPU + Cambricon MLU.
+FROM crpi-4crprmm5baj1v8iv.cn-hangzhou.personal.cr.aliyuncs.com/lmdeploy_dlinfer/camb:qwen2.5_vl
+ARG BACKEND=lmdeploy
+# Base image containing the vLLM inference environment, requiring amd64(x86-64) CPU + Cambricon MLU.
+# FROM crpi-vofi3w62lkohhxsp.cn-shanghai.personal.cr.aliyuncs.com/opendatalab-mineru/mlu:vllm0.8.3-torch2.6.0-torchmlu1.26.1-ubuntu22.04-py310
+# ARG BACKEND=vllm
+
+# Install Noto fonts for Chinese characters; rebuild the font cache and drop apt lists in the same layer
+RUN apt-get update && \
+  apt-get install -y \
+  fonts-noto-core \
+  fonts-noto-cjk \
+  fontconfig && \
+  fc-cache -fv && \
+  apt-get clean && \
+  rm -rf /var/lib/apt/lists/*
+
+# Install MinerU; with BACKEND=vllm the venv at /torch/venv3/pytorch_infer is activated first. Every pip call uses the Aliyun mirror.
+RUN /bin/bash -c '\
+  if [ "$BACKEND" = "vllm" ]; then \
+  source /torch/venv3/pytorch_infer/bin/activate; \
+  fi && \
+  python3 -m pip install -U pip -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip install "mineru[core]>=2.7.4" \
+  numpy==1.26.4 \
+  opencv-python==4.11.0.86 \
+  -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip install $(if [ "$BACKEND" = "lmdeploy" ]; then echo "accelerate==1.2.0"; else echo "transformers==4.50.3"; fi) -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip cache purge'
+
+# Download the models during the build (-s modelscope, -m all), inside the same venv when BACKEND=vllm
+RUN /bin/bash -c '\
+  if [ "$BACKEND" = "vllm" ]; then \
+  source /torch/venv3/pytorch_infer/bin/activate; \
+  fi && \
+  mineru-models-download -s modelscope -m all'
+
+WORKDIR /workspace
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,38 @@
+# Base image containing the vLLM inference environment, requiring amd64(x86-64) CPU + MooreThreads GPU.
+FROM registry.mthreads.com/mcconline/vllm-musa-qy2-py310:v0.8.4-release
+
+
+# Install libgl for opencv support & Noto fonts for Chinese characters
+RUN apt-get update && \
+  apt-get install -y \
+  fonts-noto-core \
+  fonts-noto-cjk \
+  fontconfig \
+  libgl1 && \
+  fc-cache -fv && \
+  apt-get clean && \
+  rm -rf /var/lib/apt/lists/*
+
+# Build torchvision v0.20.0 from source in /tmp (subshell keeps the cwd; checkout removed in this layer), then install MinerU and pinned deps
+RUN python3 -m pip install -U pip -i https://mirrors.aliyun.com/pypi/simple && \
+  git clone -b v0.20.0 --depth 1 https://gitcode.com/gh_mirrors/vi/vision.git /tmp/vision && \
+  (cd /tmp/vision && python3 setup.py install) && \
+  rm -rf /tmp/vision && \
+  python3 -m pip install "mineru[api,gradio]>=2.7.2" \
+  "matplotlib>=3.10,<4" \
+  "ultralytics>=8.3.48,<9" \
+  "doclayout_yolo==0.0.4" \
+  "ftfy>=6.3.1,<7" \
+  "shapely>=2.0.7,<3" \
+  "pyclipper>=1.3.0,<2" \
+  "omegaconf>=2.3.0,<3" \
+  numpy==1.26.4 \
+  opencv-python==4.11.0.86 \
+  -i https://mirrors.aliyun.com/pypi/simple && \
+  python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,32 @@
+# Two base images are offered (vLLM or LMDeploy); enable exactly one as needed. Requires an ARM (AArch64) CPU + Ascend NPU.
+# Default: base image with the vLLM inference environment (ARM/AArch64 CPU + Ascend NPU).
+FROM quay.m.daocloud.io/ascend/vllm-ascend:v0.11.0
+# Alternative: base image with the LMDeploy inference environment (ARM/AArch64 CPU + Ascend NPU).
+# FROM crpi-4crprmm5baj1v8iv.cn-hangzhou.personal.cr.aliyuncs.com/lmdeploy_dlinfer/ascend:mineru-a2
+
+
+# libgl/libglib for opencv plus Noto fonts for Chinese characters; font cache rebuilt and apt lists removed in the same layer
+RUN apt-get update \
+  && apt-get install --yes \
+    fontconfig \
+    fonts-noto-cjk \
+    fonts-noto-core \
+    libgl1 \
+    libglib2.0-0 \
+  && fc-cache -fv \
+  && apt-get clean \
+  && rm -rf /var/lib/apt/lists/*
+
+# Upgrade pip, install MinerU with pinned numpy/opencv from the Aliyun PyPI mirror, then purge the pip cache
+RUN python3 -m pip install --upgrade pip --index-url https://mirrors.aliyun.com/pypi/simple \
+  && python3 -m pip install "mineru[core]>=2.6.5" \
+    numpy==1.26.4 \
+    opencv-python==4.11.0.86 \
+    --index-url https://mirrors.aliyun.com/pypi/simple \
+  && python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all) with TORCH_DEVICE_BACKEND_AUTOLOAD=0 set for this command only
+RUN TORCH_DEVICE_BACKEND_AUTOLOAD=0 /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]
@@ -0,0 +1,30 @@
+# Two base images are offered (vLLM or LMDeploy inference environment); enable exactly one as needed. Requires an amd64 (x86-64) CPU + t-head PPU.
+# Default: base image with the vLLM inference environment (amd64/x86-64 CPU + t-head PPU).
+FROM crpi-vofi3w62lkohhxsp.cn-shanghai.personal.cr.aliyuncs.com/opendatalab-mineru/ppu:ppu-pytorch2.6.0-ubuntu24.04-cuda12.6-vllm0.8.5-py312
+# Alternative: base image with the LMDeploy inference environment (amd64/x86-64 CPU + t-head PPU).
+# FROM crpi-4crprmm5baj1v8iv.cn-hangzhou.personal.cr.aliyuncs.com/lmdeploy_dlinfer/ppu:mineru-ppu
+
+# libgl for opencv plus Noto fonts for Chinese characters; font cache rebuilt and apt lists removed in the same layer
+RUN apt-get update \
+  && apt-get install --yes \
+    fontconfig \
+    fonts-noto-cjk \
+    fonts-noto-core \
+    libgl1 \
+  && fc-cache -fv \
+  && apt-get clean \
+  && rm -rf /var/lib/apt/lists/*
+
+# Upgrade pip, install MinerU with pinned numpy/opencv from the Aliyun PyPI mirror, then purge the pip cache
+RUN python3 -m pip install --upgrade pip --index-url https://mirrors.aliyun.com/pypi/simple \
+  && python3 -m pip install "mineru[core]>=2.6.5" \
+    numpy==1.26.4 \
+    opencv-python==4.11.0.86 \
+    --index-url https://mirrors.aliyun.com/pypi/simple \
+  && python3 -m pip cache purge
+
+# Download the models during the build (-s modelscope, -m all)
+RUN /bin/bash -c "mineru-models-download -s modelscope -m all"
+
+# Entrypoint: export MINERU_MODEL_SOURCE=local, then exec the command the container was started with
+ENTRYPOINT ["/bin/bash", "-c", "export MINERU_MODEL_SOURCE=local && exec \"$@\"", "--"]