|
@@ -106,6 +106,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
self.use_doc_preprocessor = False
|
|
self.use_doc_preprocessor = False
|
|
|
self.use_table_recognition = config.get("use_table_recognition", True)
|
|
self.use_table_recognition = config.get("use_table_recognition", True)
|
|
|
self.use_seal_recognition = config.get("use_seal_recognition", True)
|
|
self.use_seal_recognition = config.get("use_seal_recognition", True)
|
|
|
|
|
+ self.format_block_content = config.get("format_block_content", False)
|
|
|
self.use_region_detection = config.get(
|
|
self.use_region_detection = config.get(
|
|
|
"use_region_detection",
|
|
"use_region_detection",
|
|
|
True,
|
|
True,
|
|
@@ -848,6 +849,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
use_formula_recognition: Union[bool, None],
|
|
use_formula_recognition: Union[bool, None],
|
|
|
use_chart_recognition: Union[bool, None],
|
|
use_chart_recognition: Union[bool, None],
|
|
|
use_region_detection: Union[bool, None],
|
|
use_region_detection: Union[bool, None],
|
|
|
|
|
+ format_block_content: Union[bool, None],
|
|
|
) -> dict:
|
|
) -> dict:
|
|
|
"""
|
|
"""
|
|
|
Get the model settings based on the provided parameters or default values.
|
|
Get the model settings based on the provided parameters or default values.
|
|
@@ -858,6 +860,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
use_seal_recognition (Union[bool, None]): Enables seal recognition if True. Defaults to system setting if None.
|
|
use_seal_recognition (Union[bool, None]): Enables seal recognition if True. Defaults to system setting if None.
|
|
|
use_table_recognition (Union[bool, None]): Enables table recognition if True. Defaults to system setting if None.
|
|
use_table_recognition (Union[bool, None]): Enables table recognition if True. Defaults to system setting if None.
|
|
|
use_formula_recognition (Union[bool, None]): Enables formula recognition if True. Defaults to system setting if None.
|
|
use_formula_recognition (Union[bool, None]): Enables formula recognition if True. Defaults to system setting if None.
|
|
|
|
|
+ format_block_content (Union[bool, None]): Enables block content formatting if True. Defaults to system setting if None.
|
|
|
|
|
|
|
|
Returns:
|
|
Returns:
|
|
|
dict: A dictionary containing the model settings.
|
|
dict: A dictionary containing the model settings.
|
|
@@ -886,6 +889,9 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
if use_chart_recognition is None:
|
|
if use_chart_recognition is None:
|
|
|
use_chart_recognition = self.use_chart_recognition
|
|
use_chart_recognition = self.use_chart_recognition
|
|
|
|
|
|
|
|
|
|
+ if format_block_content is None:
|
|
|
|
|
+ format_block_content = self.format_block_content
|
|
|
|
|
+
|
|
|
return dict(
|
|
return dict(
|
|
|
use_doc_preprocessor=use_doc_preprocessor,
|
|
use_doc_preprocessor=use_doc_preprocessor,
|
|
|
use_seal_recognition=use_seal_recognition,
|
|
use_seal_recognition=use_seal_recognition,
|
|
@@ -893,6 +899,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
use_formula_recognition=use_formula_recognition,
|
|
use_formula_recognition=use_formula_recognition,
|
|
|
use_chart_recognition=use_chart_recognition,
|
|
use_chart_recognition=use_chart_recognition,
|
|
|
use_region_detection=use_region_detection,
|
|
use_region_detection=use_region_detection,
|
|
|
|
|
+ format_block_content=format_block_content,
|
|
|
)
|
|
)
|
|
|
|
|
|
|
|
def predict(
|
|
def predict(
|
|
@@ -906,6 +913,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
use_formula_recognition: Union[bool, None] = None,
|
|
use_formula_recognition: Union[bool, None] = None,
|
|
|
use_chart_recognition: Union[bool, None] = None,
|
|
use_chart_recognition: Union[bool, None] = None,
|
|
|
use_region_detection: Union[bool, None] = None,
|
|
use_region_detection: Union[bool, None] = None,
|
|
|
|
|
+ format_block_content: Union[bool, None] = None,
|
|
|
layout_threshold: Optional[Union[float, dict]] = None,
|
|
layout_threshold: Optional[Union[float, dict]] = None,
|
|
|
layout_nms: Optional[bool] = None,
|
|
layout_nms: Optional[bool] = None,
|
|
|
layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
|
|
layout_unclip_ratio: Optional[Union[float, Tuple[float, float], dict]] = None,
|
|
@@ -943,6 +951,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
use_table_recognition (Optional[bool]): Whether to use table recognition.
|
|
use_table_recognition (Optional[bool]): Whether to use table recognition.
|
|
|
use_formula_recognition (Optional[bool]): Whether to use formula recognition.
|
|
use_formula_recognition (Optional[bool]): Whether to use formula recognition.
|
|
|
use_region_detection (Optional[bool]): Whether to use region detection.
|
|
use_region_detection (Optional[bool]): Whether to use region detection.
|
|
|
|
|
+ format_block_content (Optional[bool]): Whether to format block content.
|
|
|
layout_threshold (Optional[float]): The threshold value to filter out low-confidence predictions. Default is None.
|
|
layout_threshold (Optional[float]): The threshold value to filter out low-confidence predictions. Default is None.
|
|
|
layout_nms (bool, optional): Whether to use layout-aware NMS. Defaults to False.
|
|
layout_nms (bool, optional): Whether to use layout-aware NMS. Defaults to False.
|
|
|
layout_unclip_ratio (Optional[Union[float, Tuple[float, float]]], optional): The ratio of unclipping the bounding box.
|
|
layout_unclip_ratio (Optional[Union[float, Tuple[float, float]]], optional): The ratio of unclipping the bounding box.
|
|
@@ -982,6 +991,7 @@ class _LayoutParsingPipelineV2(BasePipeline):
|
|
|
use_formula_recognition,
|
|
use_formula_recognition,
|
|
|
use_chart_recognition,
|
|
use_chart_recognition,
|
|
|
use_region_detection,
|
|
use_region_detection,
|
|
|
|
|
+ format_block_content,
|
|
|
)
|
|
)
|
|
|
|
|
|
|
|
if not self.check_model_settings_valid(model_settings):
|
|
if not self.check_model_settings_valid(model_settings):
|