# PP-StructureV3.yaml (6.1 KB)

  # Top-level settings of the PP-StructureV3 pipeline.
  pipeline_name: PP-StructureV3

  # NOTE(review): several sections further down set their own batch_size;
  # how this top-level value interacts with them is decided by the consumer.
  batch_size: 8

  # Feature switches.
  # NOTE(review): each use_* flag presumably enables the correspondingly
  # named section under SubModules / SubPipelines - confirm with the loader.
  use_doc_preprocessor: False
  use_seal_recognition: False
  use_table_recognition: True
  use_formula_recognition: True
  use_chart_recognition: False
  use_region_detection: True
  format_block_content: False
  # Model modules configured directly under this pipeline. Each entry names
  # a module type (module_name) and the model to load (model_name).
  SubModules:
    LayoutDetection:
      module_name: layout_detection
      model_name: PP-DocLayout_plus-L
      model_dir: null
      batch_size: 8
      # Per-class thresholds keyed by integer class id; the trailing comment
      # on each entry names the class.
      threshold:
        0: 0.3  # paragraph_title
        1: 0.5  # image
        2: 0.4  # text
        3: 0.5  # number
        4: 0.5  # abstract
        5: 0.5  # content
        6: 0.5  # figure_table_chart_title
        7: 0.3  # formula
        8: 0.5  # table
        9: 0.5  # reference
        10: 0.5  # doc_title
        11: 0.5  # footnote
        12: 0.5  # header
        13: 0.5  # algorithm
        14: 0.5  # footer
        15: 0.45  # seal
        16: 0.5  # chart
        17: 0.5  # formula_number
        18: 0.5  # aside_text
        19: 0.5  # reference_content
      layout_nms: True
      layout_unclip_ratio: [1.0, 1.0]
      # Per-class box-merge mode, keyed by the same class ids as `threshold`.
      layout_merge_bboxes_mode:
        0: "large"  # paragraph_title
        1: "large"  # image
        2: "union"  # text
        3: "union"  # number
        4: "union"  # abstract
        5: "union"  # content
        6: "union"  # figure_table_chart_title
        7: "large"  # formula
        8: "union"  # table
        9: "union"  # reference
        10: "union"  # doc_title
        11: "union"  # footnote
        12: "union"  # header
        13: "union"  # algorithm
        14: "union"  # footer
        15: "union"  # seal
        16: "large"  # chart
        17: "union"  # formula_number
        18: "union"  # aside_text
        19: "union"  # reference_content

    ChartRecognition:
      module_name: chart_recognition
      model_name: PP-Chart2Table
      model_dir: null
      batch_size: 1

    # Uses the same module type as LayoutDetection with a different model.
    RegionDetection:
      module_name: layout_detection
      model_name: PP-DocBlockLayout
      model_dir: null
      layout_nms: True
      # A single mode given as a scalar instead of a per-class mapping.
      layout_merge_bboxes_mode: "small"
  # Nested pipelines. Each entry has its own pipeline_name and carries its
  # models under SubModules (and, where present, further SubPipelines).
  SubPipelines:
    DocPreprocessor:
      pipeline_name: doc_preprocessor
      batch_size: 8
      use_doc_orientation_classify: True
      use_doc_unwarping: True
      SubModules:
        DocOrientationClassify:
          module_name: doc_text_orientation
          model_name: PP-LCNet_x1_0_doc_ori
          model_dir: null
          batch_size: 8
        DocUnwarping:
          module_name: image_unwarping
          model_name: UVDoc
          model_dir: null

    GeneralOCR:
      pipeline_name: OCR
      batch_size: 8
      text_type: general
      use_doc_preprocessor: False
      use_textline_orientation: True
      SubModules:
        TextDetection:
          module_name: text_detection
          model_name: PP-OCRv5_server_det
          model_dir: null
          limit_side_len: 736
          limit_type: min
          max_side_limit: 4000
          thresh: 0.3
          box_thresh: 0.6
          unclip_ratio: 1.5
        TextLineOrientation:
          module_name: textline_orientation
          model_name: PP-LCNet_x1_0_textline_ori
          model_dir: null
          batch_size: 8
        TextRecognition:
          module_name: text_recognition
          model_name: PP-OCRv5_server_rec
          model_dir: null
          batch_size: 8
          score_thresh: 0.0

    TableRecognition:
      pipeline_name: table_recognition_v2
      use_layout_detection: False
      use_doc_preprocessor: False
      use_ocr_model: False
      SubModules:
        TableClassification:
          module_name: table_classification
          model_name: PP-LCNet_x1_0_table_cls
          model_dir: null
        WiredTableStructureRecognition:
          module_name: table_structure_recognition
          model_name: SLANeXt_wired
          model_dir: null
        WirelessTableStructureRecognition:
          module_name: table_structure_recognition
          model_name: SLANet_plus
          model_dir: null
        WiredTableCellsDetection:
          module_name: table_cells_detection
          model_name: RT-DETR-L_wired_table_cell_det
          model_dir: null
        WirelessTableCellsDetection:
          module_name: table_cells_detection
          model_name: RT-DETR-L_wireless_table_cell_det
          model_dir: null
        TableOrientationClassify:
          module_name: doc_text_orientation
          model_name: PP-LCNet_x1_0_doc_ori
          model_dir: null
      SubPipelines:
        # Same models as the GeneralOCR entry one level up, but box_thresh
        # is 0.4 here (0.6 there) and no pipeline-level batch_size is set.
        GeneralOCR:
          pipeline_name: OCR
          text_type: general
          use_doc_preprocessor: False
          use_textline_orientation: True
          SubModules:
            TextDetection:
              module_name: text_detection
              model_name: PP-OCRv5_server_det
              model_dir: null
              limit_side_len: 736
              limit_type: min
              max_side_limit: 4000
              thresh: 0.3
              box_thresh: 0.4
              unclip_ratio: 1.5
            TextLineOrientation:
              module_name: textline_orientation
              model_name: PP-LCNet_x1_0_textline_ori
              model_dir: null
              batch_size: 8
            TextRecognition:
              module_name: text_recognition
              model_name: PP-OCRv5_server_rec
              model_dir: null
              batch_size: 8
              score_thresh: 0.0

    SealRecognition:
      pipeline_name: seal_recognition
      batch_size: 8
      use_layout_detection: False
      use_doc_preprocessor: False
      SubPipelines:
        # OCR pipeline with text_type "seal": a seal-specific detection
        # model, no text-line orientation step, and the same recognition
        # model as GeneralOCR.
        SealOCR:
          pipeline_name: OCR
          batch_size: 8
          text_type: seal
          use_doc_preprocessor: False
          use_textline_orientation: False
          SubModules:
            TextDetection:
              module_name: seal_text_detection
              model_name: PP-OCRv4_server_seal_det
              model_dir: null
              limit_side_len: 736
              limit_type: min
              max_side_limit: 4000
              thresh: 0.2
              box_thresh: 0.6
              unclip_ratio: 0.5
            TextRecognition:
              module_name: text_recognition
              model_name: PP-OCRv5_server_rec
              model_dir: null
              batch_size: 8
              score_thresh: 0

    FormulaRecognition:
      pipeline_name: formula_recognition
      batch_size: 8
      use_layout_detection: False
      use_doc_preprocessor: False
      SubModules:
        FormulaRecognition:
          module_name: formula_recognition
          model_name: PP-FormulaNet_plus-L
          model_dir: null
          batch_size: 8