hai 8 meses · f551f0a0ea
--- a/docs/index.md
+++ b/docs/index.md
--- a/docs/installation/installation.md
+++ b/docs/installation/installation.md
@@ -3,7 +3,7 @@ comments: true
 
				 ---
			
 
				 
			
 
				 # PaddleX本地安装教程
			
 
				-> ❗安装 PaddleX 前请先确保您有基础的 <b>Python 运行环境</b>（注：当前支持Python 3.8 ～ Python 3.10下运行，更多Python版本适配中）。
			
 
				+> ❗安装 PaddleX 前请先确保您有基础的 <b>Python 运行环境</b>（注：当前支持Python 3.8 ～ Python 3.12下运行）。
			
 
				 
			
 
				 ## 1. 快速安装
			
 
				 欢迎您使用飞桨低代码开发工具PaddleX，在我们正式开始本地安装之前，请首先明确您的开发需求，并根据您的需求选择合适的安装模式。
			
@@ -61,8 +61,8 @@ PaddleX支持的插件如下，请您根据开发需求，确定所需的一个
 
				 </tr>
			
 
				 <tr>
			
 
				 <td>通用OCR</td>
			
 
				-<td>文本检测<br>文本识别</td>
			
 
				-<td><code>PaddleOCR</code></td>
			
 
				+<td>文档图像方向分类<br>文本图像矫正<br>文本检测<br>文本行方向分类<br>文本识别</td>
			
 
				+<td><code>PaddleOCR</code><br><code>PaddleClas</code></td>
			
 
				 </tr>
			
 
				 <tr>
			
 
				 <td>通用表格识别</td>
			
@@ -131,7 +131,7 @@ paddlex --install PaddleXXX  # 例如PaddleOCR
 
				 
			
 
				 当您使用自定义方式安装时，需要先安装飞桨 PaddlePaddle 框架，随后获取 PaddleX 源码，最后选择PaddleX的安装模式。
			
 
				 
			
 
				-> ❗ 注：目前 PaddleX 仅支持 11.8 和 12.3 版本的 CUDA，请确保已安装的 Nvidia 驱动支持的上述 CUDA 版本。
			
 
				+> ❗ 无需关注物理机上的 CUDA 版本，只需关注显卡驱动程序版本。
			
 
				 
			
 
				 ### 2.1 基于Docker获取PaddleX
			
 
				 参考下述命令，使用 PaddleX 官方 Docker 镜像，创建一个名为 `paddlex` 的容器，并将当前工作目录映射到容器内的 `/paddle` 目录。
			
@@ -143,10 +143,10 @@ paddlex --install PaddleXXX  # 例如PaddleOCR
 
				 docker run --name paddlex -v $PWD:/paddle --shm-size=8g --network=host -it ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlex/paddlex:paddlex3.0.0rc0-paddlepaddle3.0.0rc0-cpu /bin/bash
			
 
				 
			
 
				 # 对于 GPU 用户
			
 
				-# 对于 CUDA11.8 用户
			
 
				+# GPU 版本，需显卡驱动程序版本 ≥450.80.02（Linux）或 ≥452.39（Windows）
			
 
				 docker run --gpus all --name paddlex -v $PWD:/paddle --shm-size=8g --network=host -it ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlex/paddlex:paddlex3.0.0rc0-paddlepaddle3.0.0rc0-gpu-cuda11.8-cudnn8.6-trt8.5 /bin/bash
			
 
				 
			
 
				-# 对于 CUDA12.3 用户
			
 
				+# GPU 版本，需显卡驱动程序版本 ≥545.23.06（Linux）或 ≥545.84（Windows）
			
 
				 docker run --gpus all --name paddlex -v $PWD:/paddle --shm-size=8g --network=host -it ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlex/paddlex:paddlex3.0.0rc0-paddlepaddle3.0.0rc0-gpu-cuda12.3-cudnn9.0-trt8.6 /bin/bash
			
 
				 ```
			
 
				 
			
--- a/docs/installation/paddlepaddle_install.md
+++ b/docs/installation/paddlepaddle_install.md
@@ -18,10 +18,10 @@ comments: true
 
				 docker run --name paddlex -v $PWD:/paddle --shm-size=8G --network=host -it ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddle:3.0.0rc0 /bin/bash
			
 
				 
			
 
				 # 对于 gpu 用户:
			
 
				-# CUDA11.8 用户
			
 
				+# GPU 版本，需显卡驱动程序版本 ≥450.80.02（Linux）或 ≥452.39（Windows）
			
 
				 docker run --gpus all --name paddlex -v $PWD:/paddle --shm-size=8G --network=host -it ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddle:3.0.0rc0-gpu-cuda11.8-cudnn8.6-trt8.5 /bin/bash
			
 
				 
			
 
				-# CUDA12.3 用户
			
 
				+# GPU 版本，需显卡驱动程序版本 ≥545.23.06（Linux）或 ≥545.84（Windows）
			
 
				 docker run --gpus all --name paddlex -v $PWD:/paddle --shm-size=8G --network=host -it ccr-2vdh3abv-pub.cnc.bj.baidubce.com/paddlepaddle/paddle:3.0.0rc0-gpu-cuda12.3-cudnn9.0-trt8.6 /bin/bash
			
 
				 ```
			
 
				 
			
@@ -57,7 +57,7 @@ python -m pip install paddlepaddle-gpu==3.0.0rc0 -i https://www.paddlepaddle.org
 
				 # gpu，该命令仅适用于 CUDA 版本为 12.3 的机器环境
			
 
				 python -m pip install paddlepaddle-gpu==3.0.0rc0 -i https://www.paddlepaddle.org.cn/packages/stable/cu123/
			
 
				 ```
			
 
				-> ❗ <b>注</b>：更多飞桨 Wheel 版本请参考[飞桨官网](https://www.paddlepaddle.org.cn/install/quick?docurl=/documentation/docs/zh/install/pip/linux-pip.html)。
			
 
				+> ❗ <b>注</b>：无需关注物理机上的 CUDA 版本，只需关注显卡驱动程序版本。更多飞桨 Wheel 版本请参考[飞桨官网](https://www.paddlepaddle.org.cn/install/quick?docurl=/documentation/docs/zh/install/pip/linux-pip.html)。
			
 
				 
			
 
				 <b>关于其他硬件安装飞桨，请参考</b>[PaddleX多硬件使用指南](../other_devices_support/multi_devices_use_guide.md)<b>。</b>
			
 
				 
			
--- a/docs/pipeline_usage/tutorials/cv_pipelines/human_keypoint_detection.md
+++ b/docs/pipeline_usage/tutorials/cv_pipelines/human_keypoint_detection.md
@@ -73,23 +73,43 @@ PaddleX 的人体关键点检测产线是一个 Top-Down 方案，由行人检
 
				 </tr>
			
 
				 </table>
			
 
				 
			
 
				-**测试环境说明：**
			
 
				+<b>测试环境说明：</b>
			
 
				 
			
 
				-- **性能测试环境**
			
 
				-  - **测试数据集**：
			
 
				+- <b>性能测试环境</b>
			
 
				+  - <b>测试数据集</b>：
			
 
				     - 行人检测模型：CrowdHuman数据集。
			
 
				     - 人体关键点检测模型：COCO数据集 AP(0.5:0.95)，所依赖的检测框为ground truth标注得到。
			
 
				-  - **硬件配置**：
			
 
				+  - <b>硬件配置</b>：
			
 
				     - GPU：NVIDIA Tesla T4
			
 
				     - CPU：Intel Xeon Gold 6271C @ 2.60GHz
			
 
				     - 其他环境：Ubuntu 20.04 / cuDNN 8.6 / TensorRT 8.5.2.2
			
 
				 
			
 
				-- **推理模式说明**
			
 
				-
			
 
				-| 模式        | GPU配置                          | CPU配置          | 加速技术组合                                |
			
 
				-|-------------|----------------------------------|------------------|---------------------------------------------|
			
 
				-| 常规模式    | FP32精度 / 无TRT加速             | FP32精度 / 8线程       | PaddleInference                             |
			
 
				-| 高性能模式  | 选择先验精度类型和加速策略的最优组合         | FP32精度 / 8线程       | 选择先验最优后端（Paddle/OpenVINO/TRT等） |
			
 
				+- <b>推理模式说明</b>
			
 
				+
			
 
				+<table border="1">
			
 
				+    <thead>
			
 
				+        <tr>
			
 
				+            <th>模式</th>
			
 
				+            <th>GPU配置</th>
			
 
				+            <th>CPU配置</th>
			
 
				+            <th>加速技术组合</th>
			
 
				+        </tr>
			
 
				+    </thead>
			
 
				+    <tbody>
			
 
				+        <tr>
			
 
				+            <td>常规模式</td>
			
 
				+            <td>FP32精度 / 无TRT加速</td>
			
 
				+            <td>FP32精度 / 8线程</td>
			
 
				+            <td>PaddleInference</td>
			
 
				+        </tr>
			
 
				+        <tr>
			
 
				+            <td>高性能模式</td>
			
 
				+            <td>选择先验精度类型和加速策略的最优组合</td>
			
 
				+            <td>FP32精度 / 8线程</td>
			
 
				+            <td>选择先验最优后端（Paddle/OpenVINO/TRT等）</td>
			
 
				+        </tr>
			
 
				+    </tbody>
			
 
				+</table>
			
 
				 
			
 
				 </details>
			
 
				 
			
--- a/docs/pipeline_usage/tutorials/ocr_pipelines/layout_parsing_v2.md
+++ b/docs/pipeline_usage/tutorials/ocr_pipelines/layout_parsing_v2.md
--- a/docs/pipeline_usage/tutorials/ocr_pipelines/table_recognition.md
+++ b/docs/pipeline_usage/tutorials/ocr_pipelines/table_recognition.md
@@ -605,6 +605,7 @@ paddlex --pipeline table_recognition \
 
				        ...,
			
 
				        [448, ..., 121]], dtype=int16)}}]}}
			
 
				 ```
			
 
				+
			
 
				 运行结果参数说明可以参考[2.2 Python脚本方式](#22-python脚本方式集成)中的结果解释。
			
 
				 
			
 
				 可视化结果保存在`save_path`下，其中表格识别的可视化结果如下：
			
--- a/docs/pipeline_usage/tutorials/ocr_pipelines/table_recognition_v2.md
+++ b/docs/pipeline_usage/tutorials/ocr_pipelines/table_recognition_v2.md
@@ -96,7 +96,7 @@ comments: true
 
				 <th>检测Hmean（%）</th>
			
 
				 <th>GPU推理耗时（ms）<br/>[常规模式 / 高性能模式]</th>
			
 
				 <th>CPU推理耗时（ms）<br/>[常规模式 / 高性能模式]</th>
			
 
				-<th>模型存储大小（M)</th>
			
 
				+<th>模型存储大小（M）</th>
			
 
				 <th>介绍</th>
			
 
				 </tr>
			
 
				 </thead>
			
@@ -561,7 +561,7 @@ devanagari_PP-OCRv3_mobile_rec_infer.tar">推理模型</a>/<a href="https://padd
 
				 <tr>
			
 
				 <th>模型</th><th>模型下载链接</th>
			
 
				 <th>MS-SSIM （%）</th>
			
 
				-<th>模型存储大小（M)</th>
			
 
				+<th>模型存储大小（M）</th>
			
 
				 <th>介绍</th>
			
 
				 </tr>
			
 
				 </thead>
			
@@ -583,7 +583,7 @@ devanagari_PP-OCRv3_mobile_rec_infer.tar">推理模型</a>/<a href="https://padd
 
				 <th>Top-1 Acc（%）</th>
			
 
				 <th>GPU推理耗时（ms）<br/>[常规模式 / 高性能模式]</th>
			
 
				 <th>CPU推理耗时（ms）<br/>[常规模式 / 高性能模式]</th>
			
 
				-<th>模型存储大小（M)</th>
			
 
				+<th>模型存储大小（M）</th>
			
 
				 <th>介绍</th>
			
 
				 </tr>
			
 
				 </thead>
			
@@ -1470,7 +1470,7 @@ SubPipelines:
 
				 
			
 
				       TextRecognition:
			
 
				         module_name: text_recognition
			
 
				-        model_name: PP-OCRv4_server_rec
			
 
				+        model_name: PP-OCRv4_server_rec_doc
			
 
				         model_dir: null # 替换为微调后文本识别的模型权重路径
			
 
				         batch_size: 1
			
 
				         score_thresh: 0
			
--- a/mkdocs.yml
+++ b/mkdocs.yml
@@ -1,9 +1,8 @@
 
				 site_name: PaddleX 文档 #站点名称
			
 
				 site_url: https://paddlepaddle.github.io/PaddleX/
			
 
				 docs_dir: docs # 文档路径
			
 
				-
			
 
				+ 
			
 
				 repo_url: https://github.com/PaddlePaddle/PaddleX #仓库地址
			
 
				-
			
 
				 edit_uri: edit/develop/docs/ #修改文件的路径
			
 
				 theme:
			
 
				   name: material
			
@@ -102,9 +101,12 @@ plugins:
 
				             OCR: OCR
			
 
				             通用OCR产线: OCR
			
 
				             通用表格识别产线: General Table Recognition
			
 
				+            通用表格识别v2产线: General Table Recognition V2
			
 
				             通用版面解析产线: General Layout Parsing
			
 
				+            通用版面解析v2产线: General Layout Parsing V2
			
 
				             公式识别产线: Formula Recognition
			
 
				             印章文本识别产线: Seal Recognition
			
 
				+            文档图像预处理产线: Document Image Preprocessing
			
 
				             计算机视觉: Computer Vision
			
 
				             通用图像分类: General Image Classification
			
 
				             通用目标检测: General Object Detection
			
@@ -131,6 +133,14 @@ plugins:
 
				             文本识别模块: Text Recognition
			
 
				             版面区域检测模块: Layout Parsing
			
 
				             表格结构识别模块: Table Structure Recognition
			
 
				+            表格单元格检测模块: Table Cell Detection
			
 
				+            表格分类模块: Table Classification
			
 
				+            文本行方向分类: Text Line Orientation Classification
			
 
				+            人体关键点检测模块: Human Keypoint Detection
			
 
				+            开放词汇目标检测模块: Open-Vocabulary Object Detection
			
 
				+            开放词汇目标分割模块: Open-Vocabulary Segmentation
			
 
				+            多语种语音识别模块: Multilingual Speech Recognition
			
 
				+            BEV融合3D检测模块: 3D Multimodal Fusion Detection
			
 
				             文档图像方向分类: Document Image Orientation Classification
			
 
				             文本图像矫正模块: Text Image Unwarping
			
 
				             公式识别模块: Formula Recognition
			
@@ -148,14 +158,25 @@ plugins:
 
				             主体检测模块: Main Body Detection
			
 
				             行人检测模块: Human Detection
			
 
				             车辆检测模块: Vehicle Detection
			
 
				+            3D多模态融合检测: 3D Multimodal Fusion Detection
			
 
				+            人体关键点检测: Human Keypoint Detection
			
 
				+            开放词汇检测: Open Vocabulary Detection
			
 
				+            开放词汇分割: Open Vocabulary Segmentation
			
 
				+            旋转目标检测: Rotated Object Detection
			
 
				             图像分割: Image Segmentation
			
 
				             语义分割模块: Semantic Segmentation
			
 
				             实例分割模块: Instance Segmentation
			
 
				+            人脸特征模块: Face Feature
			
 
				             图像异常检测模块: Image Anomaly Detection
			
 
				             时序分析: Time Series Analysis
			
 
				             时序预测模块: Time Series Forecasting
			
 
				             时序异常检测模块: Time Series Anomaly Detection
			
 
				             时序分类模块: Time Series Classification
			
 
				+            语音处理: Speech
			
 
				+            多语种语音识别: Multilingual Speech Recognition
			
 
				+            视频分析: Video
			
 
				+            通用视频分类: General Video Classification
			
 
				+            通用视频检测: General Video Detection
			
 
				             说明文件: Instructions
			
 
				             PaddleX单模型Python脚本使用说明: PaddleX Module Python API Usage
			
 
				             PaddleX通用模型配置文件参数说明: PaddleX Common Module Config Parameters
			
@@ -187,6 +208,8 @@ plugins:
 
				             时序异常检测任务模块: Time Series Anomaly Detection Task
			
 
				             时序分类任务模块: Time Series Classification Task
			
 
				             时序预测任务模块: Time Series Forecasting Task                 
			
 
				+            语音识别: Speech Recognition
			
 
				+            3D检测: 3D Detection
			
 
				             产线列表: Pipeline List
			
 
				             PaddleX产线列表(CPU/GPU): PaddleX Pipeline List (CPU/GPU)
			
 
				             PaddleX产线列表(DCU): PaddleX Pipeline List (DCU)
			
@@ -306,9 +329,12 @@ nav:
 
				        - OCR:
			
 
				          - 通用OCR产线: pipeline_usage/tutorials/ocr_pipelines/OCR.md
			
 
				          - 通用表格识别产线: pipeline_usage/tutorials/ocr_pipelines/table_recognition.md
			
 
				-         - 通用版面解析产线: pipeline_usage/tutorials/ocr_pipelines/layout_parsing.md
			
 
				+         - 通用表格识别v2产线: pipeline_usage/tutorials/ocr_pipelines/table_recognition_v2.md
			
 
				+         - 通用版面解析产线: pipeline_usage/tutorials/ocr_pipelines/layout_parsing.md
			
 
				+         - 通用版面解析v2产线: pipeline_usage/tutorials/ocr_pipelines/layout_parsing_v2.md
			
 
				          - 公式识别产线: pipeline_usage/tutorials/ocr_pipelines/formula_recognition.md
			
 
				          - 印章文本识别产线: pipeline_usage/tutorials/ocr_pipelines/seal_recognition.md
			
 
				+         - 文档图像预处理产线: pipeline_usage/tutorials/ocr_pipelines/doc_preprocessor.md
			
 
				        - 计算机视觉:
			
 
				          - 通用图像分类: pipeline_usage/tutorials/cv_pipelines/image_classification.md
			
 
				          - 通用目标检测: pipeline_usage/tutorials/cv_pipelines/object_detection.md
			
@@ -317,6 +343,11 @@ nav:
 
				          - 图像多标签分类: pipeline_usage/tutorials/cv_pipelines/image_multi_label_classification.md
			
 
				          - 小目标检测: pipeline_usage/tutorials/cv_pipelines/small_object_detection.md
			
 
				          - 图像异常检测: pipeline_usage/tutorials/cv_pipelines/image_anomaly_detection.md
			
 
				+         - 3D多模态融合检测: pipeline_usage/tutorials/cv_pipelines/3d_bev_detection.md
			
 
				+         - 人体关键点检测: pipeline_usage/tutorials/cv_pipelines/human_keypoint_detection.md
			
 
				+         - 开放词汇检测: pipeline_usage/tutorials/cv_pipelines/open_vocabulary_detection.md
			
 
				+         - 开放词汇分割: pipeline_usage/tutorials/cv_pipelines/open_vocabulary_segmentation.md
			
 
				+         - 旋转目标检测: pipeline_usage/tutorials/cv_pipelines/rotated_object_detection.md
			
 
				          - 通用图像识别: pipeline_usage/tutorials/cv_pipelines/general_image_recognition.md
			
 
				          - 行人属性识别: pipeline_usage/tutorials/cv_pipelines/pedestrian_attribute_recognition.md
			
 
				          - 车辆属性识别: pipeline_usage/tutorials/cv_pipelines/vehicle_attribute_recognition.md
			
@@ -325,6 +356,11 @@ nav:
 
				          - 时序预测产线: pipeline_usage/tutorials/time_series_pipelines/time_series_forecasting.md
			
 
				          - 时序异常检测产线: pipeline_usage/tutorials/time_series_pipelines/time_series_anomaly_detection.md
			
 
				          - 时序分类产线: pipeline_usage/tutorials/time_series_pipelines/time_series_classification.md 
			
 
				+       - 语音处理: 
			
 
				+         - 多语种语音识别: pipeline_usage/tutorials/speech_pipelines/multilingual_speech_recognition.md
			
 
				+       - 视频分析:
			
 
				+         - 通用视频分类: pipeline_usage/tutorials/video_pipelines/video_classification.md
			
 
				+         - 通用视频检测: pipeline_usage/tutorials/video_pipelines/video_detection.md
			
 
				        - 说明文件: 
			
 
				          - PaddleX产线命令行使用说明: pipeline_usage/instructions/pipeline_CLI_usage.md
			
 
				          - PaddleX产线Python脚本使用说明: pipeline_usage/instructions/pipeline_python_API.md
			
@@ -335,8 +371,11 @@ nav:
 
				          - 文本识别模块: module_usage/tutorials/ocr_modules/text_recognition.md
			
 
				          - 版面区域检测模块: module_usage/tutorials/ocr_modules/layout_detection.md
			
 
				          - 表格结构识别模块: module_usage/tutorials/ocr_modules/table_structure_recognition.md
			
 
				+         - 表格单元格检测模块: module_usage/tutorials/ocr_modules/table_cells_detection.md
			
 
				+         - 表格分类模块: module_usage/tutorials/ocr_modules/table_classification.md
			
 
				          - 文档图像方向分类: module_usage/tutorials/ocr_modules/doc_img_orientation_classification.md
			
 
				          - 文本图像矫正模块: module_usage/tutorials/ocr_modules/text_image_unwarping.md
			
 
				+         - 文本行方向分类: module_usage/tutorials/ocr_modules/textline_orientation_classification.md
			
 
				          - 公式识别模块: module_usage/tutorials/ocr_modules/formula_recognition.md
			
 
				        - 图像分类:
			
 
				          - 图像分类模块: module_usage/tutorials/cv_modules/image_classification.md
			
@@ -353,18 +392,21 @@ nav:
 
				          - 主体检测模块: module_usage/tutorials/cv_modules/mainbody_detection.md
			
 
				          - 行人检测模块: module_usage/tutorials/cv_modules/human_detection.md
			
 
				          - 车辆检测模块: module_usage/tutorials/cv_modules/vehicle_detection.md
			
 
				+         - 人体关键点检测模块: module_usage/tutorials/cv_modules/human_keypoint_detection.md
			
 
				+         - 开放词汇目标检测模块: module_usage/tutorials/cv_modules/open_vocabulary_detection.md
			
 
				        - 图像分割:
			
 
				          - 语义分割模块: module_usage/tutorials/cv_modules/semantic_segmentation.md
			
 
				          - 实例分割模块: module_usage/tutorials/cv_modules/instance_segmentation.md
			
 
				-         - 图像异常检测模块: module_usage/tutorials/cv_modules/anomaly_detection.md  
			
 
				+         - 图像异常检测模块: module_usage/tutorials/cv_modules/anomaly_detection.md 
			
 
				+         - 开放词汇目标分割模块: module_usage/tutorials/cv_modules/open_vocabulary_segmentation.md 
			
 
				        - 时序分析:
			
 
				          - 时序预测模块: module_usage/tutorials/time_series_modules/time_series_forecasting.md
			
 
				          - 时序异常检测模块: module_usage/tutorials/time_series_modules/time_series_anomaly_detection.md
			
 
				          - 时序分类模块: module_usage/tutorials/time_series_modules/time_series_classification.md  
			
 
				        - 语音识别:
			
 
				          - 多语种语音识别模块: module_usage/tutorials/speech_modules/multilingual_speech_recognition.md
			
 
				-       - 3D检测:
			
 
				-        - BEV融合3D检测模块: module_usage/tutorials/cv_modules/3d_bev_detection.md
			
 
				+       - 3D检测: 
			
 
				+         - BEV融合3D检测模块: module_usage/tutorials/cv_modules/3d_bev_detection.md
			
 
				        - 说明文件:
			
 
				          - PaddleX单模型Python脚本使用说明: module_usage/instructions/model_python_API.md
			
 
				          - PaddleX通用模型配置文件参数说明: module_usage/instructions/config_parameters_common.md