瀏覽代碼

fix: add content existence checks for inline and interline equations in pipeline_middle_json_mkcontent.py

myhloli 4 月之前
父節點
當前提交
46bfb77488
共有 1 個文件被更改,包括 4 次插入和 2 次删除
  1. 4 2
      mineru/backend/pipeline/pipeline_middle_json_mkcontent.py

+ 4 - 2
mineru/backend/pipeline/pipeline_middle_json_mkcontent.py

@@ -157,9 +157,11 @@ def merge_para_with_text(para_block):
             if span_type == ContentType.TEXT:
                 content = escape_special_markdown_char(span['content'])
             elif span_type == ContentType.INLINE_EQUATION:
-                content = f"{inline_left_delimiter}{span['content']}{inline_right_delimiter}"
+                if span.get('content', ''):
+                    content = f"{inline_left_delimiter}{span['content']}{inline_right_delimiter}"
             elif span_type == ContentType.INTERLINE_EQUATION:
-                content = f"\n{display_left_delimiter}\n{span['content']}\n{display_right_delimiter}\n"
+                if span.get('content', ''):
+                    content = f"\n{display_left_delimiter}\n{span['content']}\n{display_right_delimiter}\n"
 
             content = content.strip()