# PaddleOCR-VL-Client-RT-DETR-H_layout_17cls.yaml
#
# PaddleOCR-VL pipeline configuration. Layout detection is configured with
# the RT-DETR-H_layout_17cls model; VL recognition is configured with the
# vllm-server backend at the server_url given under genai_config.
---
pipeline_name: PaddleOCR-VL

# Pipeline-level batch size; each sub-module below sets its own batch_size.
batch_size: 64

use_queues: true

# Feature switches for the optional pipeline stages.
use_doc_preprocessor: false
use_layout_detection: true
use_chart_recognition: false
format_block_content: false

SubModules:
  LayoutDetection:
    module_name: layout_detection
    model_name: RT-DETR-H_layout_17cls
    model_dir: null
    batch_size: 8
    # Per-class score threshold, keyed by class ID.
    # NOTE(review): model_name says "17cls" but 25 class IDs (0-24) are
    # configured here; the label comments may have been carried over from a
    # 25-class layout model. Confirm the ID -> label mapping against the
    # label list shipped with the model.
    # NOTE(review): IDs 8/9, 12/13 and 22/23 carry identical labels in the
    # comments below - TODO confirm which sub-classes they actually denote.
    threshold:
      0: 0.5  # abstract
      1: 0.5  # algorithm
      2: 0.5  # aside_text
      3: 0.5  # chart
      4: 0.5  # content
      5: 0.4  # display_formula
      6: 0.4  # doc_title
      7: 0.5  # figure_title
      8: 0.5  # footer
      9: 0.5  # footer
      10: 0.5  # footnote
      11: 0.5  # formula_number
      12: 0.5  # header
      13: 0.5  # header
      14: 0.5  # image
      15: 0.4  # inline_formula
      16: 0.5  # number
      17: 0.4  # paragraph_title
      18: 0.5  # reference
      19: 0.5  # reference_content
      20: 0.45  # seal
      21: 0.5  # table
      22: 0.4  # text
      23: 0.4  # text
      24: 0.5  # vision_footnote
    layout_nms: true
    layout_unclip_ratio: [1.0, 1.0]
    # Per-class box merge mode, keyed by the same class IDs as `threshold`.
    layout_merge_bboxes_mode:
      0: "union"  # abstract
      1: "union"  # algorithm
      2: "union"  # aside_text
      3: "large"  # chart
      4: "union"  # content
      5: "large"  # display_formula
      6: "large"  # doc_title
      7: "union"  # figure_title
      8: "union"  # footer
      9: "union"  # footer
      10: "union"  # footnote
      11: "union"  # formula_number
      12: "union"  # header
      13: "union"  # header
      14: "union"  # image
      15: "large"  # inline_formula
      16: "union"  # number
      17: "large"  # paragraph_title
      18: "union"  # reference
      19: "union"  # reference_content
      20: "union"  # seal
      21: "union"  # table
      22: "union"  # text
      23: "union"  # text
      24: "union"  # vision_footnote

  VLRecognition:
    module_name: vl_recognition
    model_name: PaddleOCR-VL-0.9B
    model_dir: null
    batch_size: 2048
    genai_config:
      backend: vllm-server
      # NOTE(review): hard-coded private address - presumably specific to
      # one deployment; confirm before reusing this file elsewhere.
      server_url: http://10.192.72.11:8110/v1

SubPipelines:
  # NOTE(review): use_doc_preprocessor is false above, so this sub-pipeline
  # is presumably not run with the current settings - confirm.
  DocPreprocessor:
    pipeline_name: doc_preprocessor
    batch_size: 8
    use_doc_orientation_classify: true
    use_doc_unwarping: true
    SubModules:
      DocOrientationClassify:
        module_name: doc_text_orientation
        model_name: PP-LCNet_x1_0_doc_ori
        model_dir: null
        batch_size: 8
      DocUnwarping:
        module_name: image_unwarping
        model_name: UVDoc
        model_dir: null