Browse Source

update PP-StructureV3 config (#3993)

changdazhou 6 months ago
parent
commit
f16f22d6b7
1 changed file with 27 additions and 56 deletions
  1. 27 56
      paddlex/configs/pipelines/PP-StructureV3.yaml

+ 27 - 56
paddlex/configs/pipelines/PP-StructureV3.yaml

@@ -7,7 +7,7 @@ use_doc_preprocessor: True
 use_seal_recognition: True
 use_table_recognition: True
 use_formula_recognition: True
-use_chart_recognition: False
+use_chart_recognition: True
 use_region_detection: True
 
 SubModules:
@@ -19,52 +19,26 @@ SubModules:
     threshold: 
       0: 0.3  # paragraph_title
       1: 0.5  # image
-      2: 0.5  # text
+      2: 0.4  # text
       3: 0.5  # number
       4: 0.5  # abstract
       5: 0.5  # content
-      6: 0.5  # figure_title
+      6: 0.5  # figure_table_chart_title
       7: 0.3  # formula
       8: 0.5  # table
-      9: 0.5  # table_title
-      10: 0.5 # reference
-      11: 0.5 # doc_title
-      12: 0.5 # footnote
-      13: 0.5 # header
-      14: 0.5 # algorithm
-      15: 0.5 # footer
-      16: 0.3 # seal
-      17: 0.5 # chart_title
-      18: 0.5 # chart
-      19: 0.5 # formula_number
-      20: 0.5 # header_image
-      21: 0.5 # footer_image
-      22: 0.5 # aside_text
+      9: 0.5  # reference
+      10: 0.5 # doc_title
+      11: 0.5 # footnote
+      12: 0.5 # header
+      13: 0.5 # algorithm
+      14: 0.5 # footer
+      15: 0.45 # seal
+      16: 0.5 # chart
+      17: 0.5 # formula_number
+      18: 0.5 # aside_text
+      19: 0.5 # reference_content
     layout_nms: True
-    layout_unclip_ratio:
-      0: [1.0, 1.0]  # paragraph_title
-      1: [1.0, 1.0]  # image
-      2: [1.0, 1.0]  # text
-      3: [1.0, 1.0]  # number
-      4: [1.0, 1.0]  # abstract
-      5: [1.0, 1.0]  # content
-      6: [1.0, 1.0]  # figure_title
-      7: [1.0, 1.0]  # formula
-      8: [1.0, 1.0]  # table
-      9: [1.0, 1.0]  # table_title
-      10: [1.0, 1.0] # reference
-      11: [1.0, 1.0] # doc_title
-      12: [1.0, 1.0] # footnote
-      13: [1.0, 1.0] # header
-      14: [1.0, 1.0] # algorithm
-      15: [1.0, 1.0] # footer
-      16: [1.0, 1.0] # seal
-      17: [1.0, 1.0] # chart_title
-      18: [1.0, 1.0] # chart
-      19: [1.0, 1.0] # formula_number
-      20: [1.0, 1.0] # header_image
-      21: [1.0, 1.0] # footer_image
-      22: [1.0, 1.0] # aside_text
+    layout_unclip_ratio: [1.0, 1.0] 
     layout_merge_bboxes_mode: 
       0: "large"  # paragraph_title
       1: "large"  # image
@@ -72,23 +46,20 @@ SubModules:
       3: "union"  # number
       4: "union"  # abstract
       5: "union"  # content
-      6: "union"  # figure_title
+      6: "union"  # figure_table_chart_title
       7: "large"  # formula
       8: "union"  # table
-      9: "union"  # table_title
-      10: "union" # reference
-      11: "union" # doc_title
-      12: "union" # footnote
-      13: "union" # header
-      14: "union" # algorithm
-      15: "union" # footer
-      16: "union" # seal
-      17: "union" # chart_title
-      18: "large" # chart
-      19: "union" # formula_number
-      20: "union" # header_image
-      21: "union" # footer_image
-      22: "union" # aside_text
+      9: "union"  # reference
+      10: "union" # doc_title
+      11: "union" # footnote
+      12: "union" # header
+      13: "union" # algorithm
+      14: "union" # footer
+      15: "union" # seal
+      16: "large" # chart
+      17: "union" # formula_number
+      18: "union" # aside_text
+      19: "union" # reference_content
   ChartRecognition:
     module_name: chart_recognition
     model_name: PP-Chart2Table