Parcourir la source

fix(vl_recognition): 更新VLM表格识别配置,切换为MinerU模块并修正服务地址

zhch158_admin il y a 2 semaines
Parent
commit
78706b705c

+ 6 - 3
ocr_tools/universal_doc_parser/config/bank_statement_yusys_v3.yaml

@@ -111,12 +111,15 @@ table_recognition_wired:
 # VLM 表格识别配置(当分类为 'wireless' 时使用)
 vl_recognition:
   # 可选: "mineru" (MinerU VLM) 或 "paddle" (PaddleOCR-VL)
-  module: "paddle"
-  model_name: "PaddleOCR-VL-0.9B"
+  module: "mineru"
+  # 以下两行为 PaddleOCR-VL 的备用配置;切换回 paddle 时取消注释,并同步修改 server_url
+  # module: "paddle"
+  # model_name: "PaddleOCR-VL-0.9B"
   
   # 后端配置
   backend: "http-client"  # 可选: "http-client", "vllm-engine", "transformers"
-  server_url: "http://10.192.72.11:20016"  # PaddleOCR-VL 服务地址
+  server_url: "http://10.192.72.11:20006"  # MinerU-VL 服务地址
+  # server_url: "http://10.192.72.11:20016"  # PaddleOCR-VL 服务地址
   
   # 图片尺寸限制(避免序列长度超限)
   max_image_size: 4096