# table_recognition_v2.yaml
# Configuration for the `table_recognition_v2` pipeline.
#
# NOTE(review): the nesting below was reconstructed from a flattened listing
# in which indentation had been lost and display line numbers were fused into
# every line. Key order and values are unchanged; confirm the hierarchy
# against the consuming loader before relying on it.
---
pipeline_name: table_recognition_v2

# Top-level switches. Presumably these enable the DocPreprocessor
# sub-pipeline, the LayoutDetection module and the GeneralOCR sub-pipeline
# respectively — TODO confirm against the consumer.
use_doc_preprocessor: true
use_layout_detection: true
use_ocr_model: true

# Modules used directly by this pipeline. Every entry carries the same three
# keys: module_name, model_name and model_dir (null in all entries here).
SubModules:
  LayoutDetection:
    module_name: layout_detection
    model_name: PP-DocLayout-L
    model_dir: null

  # Uses the same module and model as
  # SubPipelines.DocPreprocessor.SubModules.DocOrientationClassify.
  TableOrientationClassify:
    module_name: doc_text_orientation
    model_name: PP-LCNet_x1_0_doc_ori
    model_dir: null

  TableClassification:
    module_name: table_classification
    model_name: PP-LCNet_x1_0_table_cls
    model_dir: null

  # The wired and wireless structure-recognition entries share one
  # module_name and differ only in model_name.
  WiredTableStructureRecognition:
    module_name: table_structure_recognition
    model_name: SLANeXt_wired
    model_dir: null

  WirelessTableStructureRecognition:
    module_name: table_structure_recognition
    model_name: SLANeXt_wireless
    model_dir: null

  # Same pattern for cell detection: one module_name, two models.
  WiredTableCellsDetection:
    module_name: table_cells_detection
    model_name: RT-DETR-L_wired_table_cell_det
    model_dir: null

  WirelessTableCellsDetection:
    module_name: table_cells_detection
    model_name: RT-DETR-L_wireless_table_cell_det
    model_dir: null

# Nested pipelines; each has its own pipeline_name, switches and SubModules.
SubPipelines:
  DocPreprocessor:
    pipeline_name: doc_preprocessor
    use_doc_orientation_classify: true
    use_doc_unwarping: true
    SubModules:
      DocOrientationClassify:
        module_name: doc_text_orientation
        model_name: PP-LCNet_x1_0_doc_ori
        model_dir: null

      DocUnwarping:
        module_name: image_unwarping
        model_name: UVDoc
        model_dir: null

  GeneralOCR:
    pipeline_name: OCR
    text_type: general
    # Both switches are off for the OCR sub-pipeline, while the top-level
    # use_doc_preprocessor above is on.
    use_doc_preprocessor: false
    use_textline_orientation: false
    SubModules:
      TextDetection:
        module_name: text_detection
        model_name: PP-OCRv4_server_det
        model_dir: null
        # Detection tuning values, copied verbatim from the original listing.
        # NOTE(review): units and exact semantics are not visible here —
        # check the text_detection module documentation.
        limit_side_len: 960
        limit_type: max
        max_side_limit: 4000
        thresh: 0.3
        box_thresh: 0.4
        unclip_ratio: 1.5

      TextRecognition:
        module_name: text_recognition
        model_name: PP-OCRv4_server_rec_doc
        model_dir: null
        batch_size: 1
        score_thresh: 0