3 weeks ago · cb69cbce44
--- a/deploy/hps/sdk/scripts/assemble.sh
+++ b/deploy/hps/sdk/scripts/assemble.sh
@@ -8,5 +8,5 @@ docker run \
 
															     -v "$(pwd)":/workspace \
														
 
															     -w /workspace \
														
 
															     --rm \
														
 
															-    python:3.10@sha256:6ff000548a4fa34c1be02624836e75e212d4ead8227b4d4381c3ae998933a922 \
														
 
															+    python:3.10 \
														
 
															     /bin/bash scripts/_assemble.sh "$@"
														
--- a/deploy/hps/server_env/Dockerfile
+++ b/deploy/hps/server_env/Dockerfile
@@ -33,9 +33,7 @@ ENV DEBIAN_FRONTEND=noninteractive
 
															 RUN mkdir /paddlex
														
 
															-RUN apt-get update \
														
 
															-    && apt-get install -y --no-install-recommends software-properties-common \
														
 
															-    && add-apt-repository -y ppa:deadsnakes/ppa \
														
 
															+RUN echo 'deb http://archive.ubuntu.com/ubuntu jammy main universe' > /etc/apt/sources.list.d/jammy-temp.list \
														
 
															     && apt-get update \
														
 
															     && apt-get install -y --no-install-recommends python3.10 python3.10-venv \
														
 
															     && python3.10 -m venv /paddlex/py310 \
														
@@ -101,7 +99,8 @@ RUN --mount=type=bind,source=deploy/hps/server_env/requirements/${DEVICE_TYPE}.t
 
															     python -m pip install --requirement /tmp/requirements.txt --requirement /tmp/hpi_requirements.txt \
														
 
															     && if [ "${ENV_TYPE}" = 'dev' ]; then \
														
 
															         python -m pip install --requirement /tmp/dev_requirements.txt; \
														
 
															-    fi
														
 
															+    fi \
														
 
															+    && python -m pip install https://paddle-whl.bj.bcebos.com/nightly/cu126/safetensors/safetensors-0.6.2.dev0-cp38-abi3-linux_x86_64.whl
														
 
															 RUN --mount=type=bind,source=.,target=/tmp/PaddleX,rw \
														
 
															     python -m pip install --no-deps /tmp/PaddleX
														
--- a/deploy/hps/server_env/requirements/cpu.txt
+++ b/deploy/hps/server_env/requirements/cpu.txt
@@ -2,7 +2,7 @@
 
															 # This file is autogenerated by pip-compile with Python 3.10
														
 
															 # by the following command:
														
 
															 #
														
 
															-#    pip-compile --allow-unsafe --extra=base --extra=serving --no-emit-index-url --no-emit-trusted-host --output-file=requirements/cpu.txt --strip-extras ../../../setup.py paddlex-hps-server/pyproject.toml requirements/app.in requirements/cpu.in
														
 
															+#    pip-compile --allow-unsafe --cert=None --client-cert=None --extra=base --extra=serving --index-url=None --no-emit-index-url --no-emit-trusted-host --output-file=requirements/cpu.txt --pip-args=None --strip-extras ../../../setup.py paddlex-hps-server/pyproject.toml requirements/app.in requirements/cpu.in
														
 
															 #
														
 
															 aiohappyeyeballs==2.4.6
														
 
															     # via aiohttp
														
@@ -289,6 +289,8 @@ pyparsing==3.2.1
 
															     # via matplotlib
														
 
															 pypdfium2==4.30.1
														
 
															     # via paddlex (../../../setup.py)
														
 
															+python-bidi==0.6.6
														
 
															+    # via paddlex (../../../setup.py)
														
 
															 python-dateutil==2.9.0.post0
														
 
															     # via
														
 
															     #   matplotlib
														
@@ -324,6 +326,8 @@ ruamel-yaml==0.18.10
 
															     # via paddlex (../../../setup.py)
														
 
															 ruamel-yaml-clib==0.2.12
														
 
															     # via ruamel-yaml
														
 
															+safetensors==0.6.2
														
 
															+    # via paddlex (../../../setup.py)
														
 
															 scikit-image==0.24.0
														
 
															     # via paddlex (../../../setup.py)
														
 
															 scikit-learn==1.6.1
														
@@ -332,6 +336,8 @@ scipy==1.15.2
 
															     # via
														
 
															     #   scikit-image
														
 
															     #   scikit-learn
														
 
															+sentencepiece==0.2.1
														
 
															+    # via paddlex (../../../setup.py)
														
 
															 shapely==2.0.7
														
 
															     # via paddlex (../../../setup.py)
														
 
															 six==1.17.0
														
--- a/deploy/hps/server_env/requirements/cpu_dev.txt
+++ b/deploy/hps/server_env/requirements/cpu_dev.txt
@@ -2,5 +2,5 @@
 
															 # This file is autogenerated by pip-compile with Python 3.10
														
 
															 # by the following command:
														
 
															 #
														
 
															-#    pip-compile --allow-unsafe --constraint=requirements/cpu.txt --no-emit-index-url --no-emit-trusted-host --output-file=requirements/cpu_dev.txt --strip-extras requirements/cpu_dev.in
														
 
															+#    pip-compile --allow-unsafe --cert=None --client-cert=None --constraint=requirements/cpu.txt --index-url=None --no-emit-index-url --no-emit-trusted-host --output-file=requirements/cpu_dev.txt --pip-args=None --strip-extras requirements/cpu_dev.in
														
 
															 #
														
--- a/deploy/hps/server_env/requirements/cpu_hpi.txt
+++ b/deploy/hps/server_env/requirements/cpu_hpi.txt
@@ -2,7 +2,7 @@
 
															 # This file is autogenerated by pip-compile with Python 3.10
														
 
															 # by the following command:
														
 
															 #
														
 
															-#    pip-compile --allow-unsafe --constraint=requirements/cpu.txt --no-emit-index-url --no-emit-trusted-host --output-file=requirements/cpu_hpi.txt --strip-extras requirements/cpu_hpi.in
														
 
															+#    pip-compile --allow-unsafe --cert=None --client-cert=None --constraint=requirements/cpu.txt --index-url=None --no-emit-index-url --no-emit-trusted-host --output-file=requirements/cpu_hpi.txt --pip-args=None --strip-extras requirements/cpu_hpi.in
														
 
															 #
														
 
															 certifi==2025.1.31
														
 
															     # via
														
--- a/deploy/hps/server_env/requirements/gpu.txt
+++ b/deploy/hps/server_env/requirements/gpu.txt
@@ -2,7 +2,7 @@
 
															 # This file is autogenerated by pip-compile with Python 3.10
														
 
															 # by the following command:
														
 
															 #
														
 
															-#    pip-compile --allow-unsafe --extra=base --extra=serving --no-emit-index-url --no-emit-trusted-host --output-file=requirements/gpu.txt --strip-extras ../../../setup.py paddlex-hps-server/pyproject.toml requirements/app.in requirements/gpu.in
														
 
															+#    pip-compile --allow-unsafe --cert=None --client-cert=None --extra=base --extra=serving --index-url=None --no-emit-index-url --no-emit-trusted-host --output-file=requirements/gpu.txt --pip-args=None --strip-extras ../../../setup.py paddlex-hps-server/pyproject.toml requirements/app.in requirements/gpu.in
														
 
															 #
														
 
															 aiohappyeyeballs==2.4.6
														
 
															     # via aiohttp
														
@@ -289,6 +289,8 @@ pyparsing==3.2.1
 
															     # via matplotlib
														
 
															 pypdfium2==4.30.1
														
 
															     # via paddlex (../../../setup.py)
														
 
															+python-bidi==0.6.6
														
 
															+    # via paddlex (../../../setup.py)
														
 
															 python-dateutil==2.9.0.post0
														
 
															     # via
														
 
															     #   matplotlib
														
@@ -324,6 +326,8 @@ ruamel-yaml==0.18.10
 
															     # via paddlex (../../../setup.py)
														
 
															 ruamel-yaml-clib==0.2.12
														
 
															     # via ruamel-yaml
														
 
															+safetensors==0.6.2
														
 
															+    # via paddlex (../../../setup.py)
														
 
															 scikit-image==0.24.0
														
 
															     # via paddlex (../../../setup.py)
														
 
															 scikit-learn==1.6.1
														
@@ -332,6 +336,8 @@ scipy==1.15.2
 
															     # via
														
 
															     #   scikit-image
														
 
															     #   scikit-learn
														
 
															+sentencepiece==0.2.1
														
 
															+    # via paddlex (../../../setup.py)
														
 
															 shapely==2.0.7
														
 
															     # via paddlex (../../../setup.py)
														
 
															 six==1.17.0
														
--- a/deploy/hps/server_env/requirements/gpu_dev.txt
+++ b/deploy/hps/server_env/requirements/gpu_dev.txt
@@ -2,5 +2,5 @@
 
															 # This file is autogenerated by pip-compile with Python 3.10
														
 
															 # by the following command:
														
 
															 #
														
 
															-#    pip-compile --allow-unsafe --constraint=requirements/gpu.txt --no-emit-index-url --no-emit-trusted-host --output-file=requirements/gpu_dev.txt --strip-extras requirements/gpu_dev.in
														
 
															+#    pip-compile --allow-unsafe --cert=None --client-cert=None --constraint=requirements/gpu.txt --index-url=None --no-emit-index-url --no-emit-trusted-host --output-file=requirements/gpu_dev.txt --pip-args=None --strip-extras requirements/gpu_dev.in
														
 
															 #
														
--- a/deploy/hps/server_env/requirements/gpu_hpi.txt
+++ b/deploy/hps/server_env/requirements/gpu_hpi.txt
@@ -2,7 +2,7 @@
 
															 # This file is autogenerated by pip-compile with Python 3.10
														
 
															 # by the following command:
														
 
															 #
														
 
															-#    pip-compile --allow-unsafe --constraint=requirements/gpu.txt --no-emit-index-url --no-emit-trusted-host --output-file=requirements/gpu_hpi.txt --strip-extras requirements/gpu_hpi.in
														
 
															+#    pip-compile --allow-unsafe --cert=None --client-cert=None --constraint=requirements/gpu.txt --index-url=None --no-emit-index-url --no-emit-trusted-host --output-file=requirements/gpu_hpi.txt --pip-args=None --strip-extras requirements/gpu_hpi.in
														
 
															 #
														
 
															 certifi==2025.1.31
														
 
															     # via
														
--- a/docs/pipeline_usage/tutorials/ocr_pipelines/PaddleOCR-VL.md
+++ b/docs/pipeline_usage/tutorials/ocr_pipelines/PaddleOCR-VL.md
@@ -78,8 +78,8 @@ comments: true
 
															 </thead>
														
 
															 <tbody>
														
 
															 <tr>
														
 
															-<td>PP-DocLayoutV2-L</td>
														
 
															-<td><a href="https://paddle-model-ecology.bj.bcebos.com/paddlex/official_inference_model/paddle3.0.0/PP-DocLayoutV2-L_infer.tar">推理模型</a>/<a href="https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayoutV2-L_pretrained.pdparams">训练模型</a></td>
														
 
															+<td>PP-DocLayoutV2</td>
														
 
															+<td><a href="https://paddle-model-ecology.bj.bcebos.com/paddlex/official_inference_model/paddle3.0.0/PP-DocLayoutV2_infer.tar">推理模型</a>/<a href="https://paddle-model-ecology.bj.bcebos.com/paddlex/official_pretrained_model/PP-DocLayoutV2_pretrained.pdparams">训练模型</a></td>
														
 
															 <td>-</td>
														
 
															 <td>- / -</td>
														
 
															 <td>- / -</td>
														
@@ -287,6 +287,7 @@ comments: true
 
															     * 由于我们没有收集NPU和XPU的设备内存数据，因此表中相应位置的数据标记为N/A。
														
 
															 ## 2. 快速开始
														
 
															+
														
 
															 PaddleX 所提供的模型产线均可以快速体验效果，你可以在本地使用命令行或 Python 体验通用通用版面解析v3产线的效果。
														
 
															 在本地使用通用版面解析v3产线前，请确保您已经按照[PaddleX本地安装教程](../../../installation/installation.md)完成了PaddleX的wheel包安装。如果您希望选择性安装依赖，请参考安装教程中的相关说明。该产线对应的依赖分组为 `ocr`。此外，为了使用飞桨框架读取 safetensors 格式模型，请执行如下命令安装 safetensors：
														
@@ -907,6 +908,20 @@ docker run \
 
															     paddlex_genai_server --model_name PaddleOCR-VL-0.9B --host 0.0.0.0 --port 8118 --backend vllm
														
 
															 ```
														
 
															+若您使用的是  NVIDIA 50 系显卡 (Compute Capacity >= 12)，需要在启动服务前安装指定版本的 FlashAttention:
														
 
															+
														
 
															+```
														
 
															+docker run \
														
 
															+    -it \
														
 
															+    --rm \
														
 
															+    --gpus all \
														
 
															+    --network host \
														
 
															+    ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddlex-genai-vllm-server \
														
 
															+    /bin/bash
														
 
															+python -m pip install flash-attn==2.8.3
														
 
															+paddlex_genai_server --model_name PaddleOCR-VL-0.9B --backend vllm --port 8118
														
 
															+```
														
 
															+
														
 
															 #### 3.1.2 通过 PaddleX CLI 和启动
														
 
															 由于推理加速框架可能与飞桨框架存在依赖冲突，建议在虚拟环境中安装。示例如下：
														
@@ -917,13 +932,19 @@ python -m venv .venv
 
															 # 激活环境
														
 
															 source .venv/bin/activate
														
 
															 # 安装 PaddleX
														
 
															-python -m pip install "paddlex[ocr]"
														
 
															+python -m pip install paddlex
														
 
															 # 安装 vLLM 服务器插件
														
 
															 paddlex --install genai-vllm-server
														
 
															 # 安装 SGLang 服务器插件
														
 
															 # paddlex --install genai-sglang-server
														
 
															 ```
														
 
															+若您使用的是  NVIDIA 50 系显卡 (Compute Capacity >= 12)，需要在启动服务前安装指定版本的 FlashAttention:
														
 
															+
														
 
															+```
														
 
															+python -m pip install flash-attn==2.8.3
														
 
															+```
														
 
															+
														
 
															 安装完成后，可通过 `paddlex_genai_server` 命令启动服务：
														
 
															 ```bash
														
@@ -1146,6 +1167,12 @@ PaddleX 会将来自单张或多张输入图像中的子图分组并对服务器
 
															 <td>否</td>
														
 
															 </tr>
														
 
															 <tr>
														
 
															+<td><code>useDocOrientationClassify</code></td>
														
 
															+<td><code>boolean</code> | <code>null</code></td>
														
 
															+<td>请参阅产线对象中 <code>predict</code> 方法的 <code>use_doc_orientation_classify</code> 参数相关说明。</td>
														
 
															+<td>否</td>
														
 
															+</tr>
														
 
															+<tr>
														
 
															 <td><code>useDocUnwarping</code></td>
														
 
															 <td><code>boolean</code> | <code>null</code></td>
														
 
															 <td>请参阅产线对象中 <code>predict</code> 方法的 <code>use_doc_unwarping</code> 参数相关说明。</td>
														
--- a/paddlex/.version
+++ b/paddlex/.version
@@ -1 +1 @@
 
															-3.3.3
														
 
															+3.3.4
														
--- a/paddlex/inference/models/common/vlm/transformers/model_utils.py
+++ b/paddlex/inference/models/common/vlm/transformers/model_utils.py
@@ -1607,6 +1607,8 @@ class PretrainedModel(
 
															                 except NotImplementedError:
														
 
															                     if convert_from_hf:
														
 
															                         raise ValueError("`convert_from_hf=True` is not supported")
														
 
															+                    else:
														
 
															+                        transpose_weight_keys = None
														
 
															                 state_dict = load_state_dict(
														
 
															                     shard_file,
														
 
															                     tp_actions if pre_tensor_parallel_split else None,
														
@@ -1937,6 +1939,8 @@ class PretrainedModel(
 
															                 except NotImplementedError:
														
 
															                     if convert_from_hf:
														
 
															                         raise ValueError("`convert_from_hf=True` is not supported")
														
 
															+                    else:
														
 
															+                        transpose_weight_keys = None
														
 
															                 state_dict = load_state_dict(
														
 
															                     resolved_archive_file,
														
 
															                     convert_from_hf=convert_from_hf,
														
--- a/paddlex/inference/utils/hpi_model_info_collection.json
+++ b/paddlex/inference/utils/hpi_model_info_collection.json
@@ -1465,6 +1465,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     },
														
 
															     "paddle31": {
														
@@ -2946,6 +2949,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     },
														
 
															     "paddle311": {
														
@@ -4428,6 +4434,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     }
														
 
															   },
														
@@ -5849,6 +5858,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     },
														
 
															     "paddle31": {
														
@@ -7288,6 +7300,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     },
														
 
															     "paddle311": {
														
@@ -8726,6 +8741,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     }
														
 
															   },
														
@@ -9774,6 +9792,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     },
														
 
															     "paddle31": {
														
@@ -10835,6 +10856,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     },
														
 
															     "paddle311": {
														
@@ -11880,6 +11904,9 @@
 
															       ],
														
 
															       "YOWO": [
														
 
															         "paddle"
														
 
															+      ],
														
 
															+      "PP-DocLayoutV2": [
														
 
															+        "paddle"
														
 
															       ]
														
 
															     }
														
 
															   }
														
--- a/paddlex/inference/utils/official_models.py
+++ b/paddlex/inference/utils/official_models.py
@@ -433,11 +433,12 @@ class _BaseModelHoster(ABC):
 
															             )
														
 
															             self._download(model_name, model_dir)
														
 
															-        return (
														
 
															-            model_dir / "PaddleOCR-VL-0.9B"
														
 
															-            if model_name == "PaddleOCR-VL"
														
 
															-            else model_dir
														
 
															-        )
														
 
															+        if model_name == "PaddleOCR-VL":
														
 
															+            vl_model_dir = model_dir / "PaddleOCR-VL-0.9B"
														
 
															+            if vl_model_dir.exists() and vl_model_dir.is_dir():
														
 
															+                return vl_model_dir
														
 
															+
														
 
															+        return model_dir
														
 
															     @abstractmethod
														
 
															     def _download(self):
														
@@ -584,17 +585,19 @@ Otherwise, only local models can be used."""
 
															         for idx, hoster in enumerate(hosters):
														
 
															             if model_name in hoster.model_list:
														
 
															                 try:
														
 
															-                    return hoster.get_model(model_name)
														
 
															-                except Exception as e:
														
 
															-                    logging.warning(
														
 
															-                        f"Encounter exception when download model from {hoster.alias}: \n{e}."
														
 
															+                    model_path = hoster.get_model(model_name)
														
 
															+                    logging.debug(
														
 
															+                        f"`{model_name}` model files has been download from model source: `{hoster.alias}`!"
														
 
															                     )
														
 
															+                    return model_path
														
 
															+
														
 
															+                except Exception as e:
														
 
															                     if len(hosters) <= 1:
														
 
															                         raise Exception(
														
 
															-                            f"No model source is available! Please check network or use local model files!"
														
 
															+                            f"Encounter exception when download model from {hoster.alias}. No model source is available! Please check network or use local model files!"
														
 
															                         )
														
 
															                     logging.warning(
														
 
															-                        f"PaddleX would try to download from other model sources."
														
 
															+                        f"Encountering exception when download model from {hoster.alias}: \n{e}, will try to download from other model sources: `hosters[idx + 1].alias`."
														
 
															                     )
														
 
															                     return self._download_from_hoster(hosters[idx + 1 :], model_name)
														
--- a/paddlex/paddlex_cli.py
+++ b/paddlex/paddlex_cli.py
@@ -370,14 +370,7 @@ def install(args):
 
															             if "vllm" in plugin_type or "sglang" in plugin_type:
														
 
															                 try:
														
 
															                     install_packages(["wheel"], constraints="required")
														
 
															-                    if "vllm" in plugin_type:
														
 
															-                        install_packages(
														
 
															-                            ["flash-attn == 2.8.3"], constraints="required"
														
 
															-                        )
														
 
															-                    elif "sglang" in plugin_type:
														
 
															-                        install_packages(
														
 
															-                            ["flash-attn == 2.8.2"], constraints="required"
														
 
															-                        )
														
 
															+                    install_packages(["flash-attn == 2.8.2"], constraints="required")
														
 
															                 except Exception:
														
 
															                     logging.error("Installation failed", exc_info=True)
														
 
															                     sys.exit(1)
														
--- a/setup.py
+++ b/setup.py
@@ -38,10 +38,10 @@ BASE_DEP_SPECS = {
 
															     "imagesize": "",
														
 
															     "Jinja2": "",
														
 
															     "joblib": "",
														
 
															-    "langchain": ">= 0.2",
														
 
															-    "langchain-community": ">= 0.2",
														
 
															+    "langchain": ">= 0.2, < 1.0",
														
 
															+    "langchain-community": ">= 0.2, < 1.0",
														
 
															     "langchain-core": "",
														
 
															-    "langchain-openai": ">= 0.1",
														
 
															+    "langchain-openai": ">= 0.1, < 1.0",
														
 
															     "lxml": "",
														
 
															     "matplotlib": "",
														
 
															     "modelscope": ">=1.28.0",