# PP-StructureV3-original.yaml (6.0 KB)
#
# Pipeline configuration for PP-StructureV3.
#
# NOTE(review): this file was recovered from a rendered listing in which
# every line carried an "N." list-number prefix and all indentation had been
# flattened. The nesting below is reconstructed from the key names (repeated
# module_name/model_name groups, SubModules/SubPipelines headers, integer
# class-id keys) -- confirm against the upstream config before relying on it.
# Keys and values themselves are unchanged.
---
# Pipeline name and batch size.
pipeline_name: PP-StructureV3
batch_size: 8

# Switches for the optional stages. Each one has a same-named entry under
# SubModules or SubPipelines below (presumably enabling/disabling it).
use_doc_preprocessor: True
use_seal_recognition: True
use_table_recognition: True
use_formula_recognition: True
use_chart_recognition: True
use_region_detection: True

# Single-model stages.
SubModules:
  LayoutDetection:
    module_name: layout_detection
    model_name: PP-DocLayout_plus-L
    model_dir: null
    batch_size: 8
    # Threshold per layout class id; the trailing comment names the class.
    threshold:
      0: 0.3  # paragraph_title
      1: 0.5  # image
      2: 0.4  # text
      3: 0.5  # number
      4: 0.5  # abstract
      5: 0.5  # content
      6: 0.5  # figure_table_chart_title
      7: 0.3  # formula
      8: 0.5  # table
      9: 0.5  # reference
      10: 0.5  # doc_title
      11: 0.5  # footnote
      12: 0.5  # header
      13: 0.5  # algorithm
      14: 0.5  # footer
      15: 0.45  # seal
      16: 0.5  # chart
      17: 0.5  # formula_number
      18: 0.5  # aside_text
      19: 0.5  # reference_content
    layout_nms: True
    layout_unclip_ratio: [1.0, 1.0]
    # Box-merge mode per layout class id ("large" or "union"), using the
    # same class ids as `threshold` above.
    layout_merge_bboxes_mode:
      0: "large"  # paragraph_title
      1: "large"  # image
      2: "union"  # text
      3: "union"  # number
      4: "union"  # abstract
      5: "union"  # content
      6: "union"  # figure_table_chart_title
      7: "large"  # formula
      8: "union"  # table
      9: "union"  # reference
      10: "union"  # doc_title
      11: "union"  # footnote
      12: "union"  # header
      13: "union"  # algorithm
      14: "union"  # footer
      15: "union"  # seal
      16: "large"  # chart
      17: "union"  # formula_number
      18: "union"  # aside_text
      19: "union"  # reference_content

  ChartRecognition:
    module_name: chart_recognition
    model_name: PP-Chart2Table
    model_dir: null
    batch_size: 1

  # Same module_name as LayoutDetection, but with a different model and a
  # single scalar merge mode instead of a per-class mapping.
  RegionDetection:
    module_name: layout_detection
    model_name: PP-DocBlockLayout
    model_dir: null
    layout_nms: True
    layout_merge_bboxes_mode: "small"

# Nested pipelines, each with its own SubModules and/or SubPipelines.
SubPipelines:
  DocPreprocessor:
    pipeline_name: doc_preprocessor
    batch_size: 8
    use_doc_orientation_classify: True
    use_doc_unwarping: True
    SubModules:
      DocOrientationClassify:
        module_name: doc_text_orientation
        model_name: PP-LCNet_x1_0_doc_ori
        model_dir: null
        batch_size: 8
      DocUnwarping:
        module_name: image_unwarping
        model_name: UVDoc
        model_dir: null

  GeneralOCR:
    pipeline_name: OCR
    batch_size: 8
    text_type: general
    use_doc_preprocessor: False
    use_textline_orientation: True
    SubModules:
      TextDetection:
        module_name: text_detection
        model_name: PP-OCRv5_server_det
        model_dir: null
        limit_side_len: 736
        limit_type: min
        max_side_limit: 4000
        thresh: 0.3
        box_thresh: 0.6
        unclip_ratio: 1.5
      TextLineOrientation:
        module_name: textline_orientation
        model_name: PP-LCNet_x1_0_textline_ori
        model_dir: null
        batch_size: 8
      TextRecognition:
        module_name: text_recognition
        model_name: PP-OCRv5_server_rec
        model_dir: null
        batch_size: 8
        score_thresh: 0.0

  TableRecognition:
    pipeline_name: table_recognition_v2
    use_layout_detection: False
    use_doc_preprocessor: False
    use_ocr_model: False
    SubModules:
      TableClassification:
        module_name: table_classification
        model_name: PP-LCNet_x1_0_table_cls
        model_dir: null
      WiredTableStructureRecognition:
        module_name: table_structure_recognition
        model_name: SLANeXt_wired
        model_dir: null
      WirelessTableStructureRecognition:
        module_name: table_structure_recognition
        model_name: SLANet_plus
        model_dir: null
      WiredTableCellsDetection:
        module_name: table_cells_detection
        model_name: RT-DETR-L_wired_table_cell_det
        model_dir: null
      WirelessTableCellsDetection:
        module_name: table_cells_detection
        model_name: RT-DETR-L_wireless_table_cell_det
        model_dir: null
      TableOrientationClassify:
        module_name: doc_text_orientation
        model_name: PP-LCNet_x1_0_doc_ori
        model_dir: null
    SubPipelines:
      # OCR pipeline nested under TableRecognition. Compared with the
      # GeneralOCR entry above it has no batch_size key and uses
      # box_thresh 0.4 instead of 0.6; all other values are the same.
      GeneralOCR:
        pipeline_name: OCR
        text_type: general
        use_doc_preprocessor: False
        use_textline_orientation: True
        SubModules:
          TextDetection:
            module_name: text_detection
            model_name: PP-OCRv5_server_det
            model_dir: null
            limit_side_len: 736
            limit_type: min
            max_side_limit: 4000
            thresh: 0.3
            box_thresh: 0.4
            unclip_ratio: 1.5
          TextLineOrientation:
            module_name: textline_orientation
            model_name: PP-LCNet_x1_0_textline_ori
            model_dir: null
            batch_size: 8
          TextRecognition:
            module_name: text_recognition
            model_name: PP-OCRv5_server_rec
            model_dir: null
            batch_size: 8
            score_thresh: 0.0

  SealRecognition:
    pipeline_name: seal_recognition
    batch_size: 8
    use_layout_detection: False
    use_doc_preprocessor: False
    SubPipelines:
      # OCR pipeline with text_type "seal". use_textline_orientation is
      # False and no TextLineOrientation module is listed.
      SealOCR:
        pipeline_name: OCR
        batch_size: 8
        text_type: seal
        use_doc_preprocessor: False
        use_textline_orientation: False
        SubModules:
          TextDetection:
            module_name: seal_text_detection
            model_name: PP-OCRv4_server_seal_det
            model_dir: null
            limit_side_len: 736
            limit_type: min
            max_side_limit: 4000
            thresh: 0.2
            box_thresh: 0.6
            unclip_ratio: 0.5
          TextRecognition:
            module_name: text_recognition
            model_name: PP-OCRv5_server_rec
            model_dir: null
            batch_size: 8
            # NOTE(review): written as integer 0 here; the other
            # score_thresh values in this file are written 0.0.
            score_thresh: 0

  FormulaRecognition:
    pipeline_name: formula_recognition
    batch_size: 8
    use_layout_detection: False
    use_doc_preprocessor: False
    SubModules:
      FormulaRecognition:
        module_name: formula_recognition
        model_name: PP-FormulaNet_plus-L
        model_dir: null
        batch_size: 8