# PaddleOCR-VL.yaml
  # Top-level pipeline settings.
  pipeline_name: PaddleOCR-VL

  batch_size: 64
  use_queues: true

  # Feature toggles. A DocPreprocessor sub-pipeline is configured under
  # SubPipelines below while use_doc_preprocessor is false here; presumably
  # this flag gates it -- confirm against the pipeline loader.
  use_doc_preprocessor: false
  use_layout_detection: true
  use_chart_recognition: false
  format_block_content: false

  SubModules:
    LayoutDetection:
      module_name: layout_detection
      model_name: PP-DocLayoutV2
      model_dir: null
      batch_size: 8
      # Per-class values keyed by integer class id (0-24); the trailing
      # comment on each entry is the class label.
      # NOTE(review): ids 8/9, 12/13 and 22/23 carry the same label in the
      # original comments; presumably they are distinct classes -- confirm
      # against the PP-DocLayoutV2 label list.
      threshold:
        0: 0.5  # abstract
        1: 0.5  # algorithm
        2: 0.5  # aside_text
        3: 0.5  # chart
        4: 0.5  # content
        5: 0.4  # display_formula
        6: 0.4  # doc_title
        7: 0.5  # figure_title
        8: 0.5  # footer
        9: 0.5  # footer
        10: 0.5  # footnote
        11: 0.5  # formula_number
        12: 0.5  # header
        13: 0.5  # header
        14: 0.5  # image
        15: 0.4  # inline_formula
        16: 0.5  # number
        17: 0.4  # paragraph_title
        18: 0.5  # reference
        19: 0.5  # reference_content
        20: 0.45  # seal
        21: 0.5  # table
        22: 0.4  # text
        23: 0.4  # text
        24: 0.5  # vision_footnote
      layout_nms: true
      layout_unclip_ratio: [1.0, 1.0]
      # Per-class merge mode, keyed by the same class ids as threshold above.
      # Only the values "union" and "large" are used in this file.
      layout_merge_bboxes_mode:
        0: "union"  # abstract
        1: "union"  # algorithm
        2: "union"  # aside_text
        3: "large"  # chart
        4: "union"  # content
        5: "large"  # display_formula
        6: "large"  # doc_title
        7: "union"  # figure_title
        8: "union"  # footer
        9: "union"  # footer
        10: "union"  # footnote
        11: "union"  # formula_number
        12: "union"  # header
        13: "union"  # header
        14: "union"  # image
        15: "large"  # inline_formula
        16: "union"  # number
        17: "large"  # paragraph_title
        18: "union"  # reference
        19: "union"  # reference_content
        20: "union"  # seal
        21: "union"  # table
        22: "union"  # text
        23: "union"  # text
        24: "union"  # vision_footnote
    VLRecognition:
      module_name: vl_recognition
      model_name: PaddleOCR-VL-0.9B
      model_dir: null
      batch_size: 2048
      genai_config:
        backend: native

  SubPipelines:
    DocPreprocessor:
      pipeline_name: doc_preprocessor
      batch_size: 8
      use_doc_orientation_classify: true
      use_doc_unwarping: true
      SubModules:
        DocOrientationClassify:
          module_name: doc_text_orientation
          model_name: PP-LCNet_x1_0_doc_ori
          model_dir: null
          batch_size: 8
        # No batch_size is given for DocUnwarping in the original.
        DocUnwarping:
          module_name: image_unwarping
          model_name: UVDoc
          model_dir: null