Selaa lähdekoodia

Merge pull request #2975 from myhloli/dev

fix: add Noto fonts installation for Chinese character support in Dockerfile
Xiaomeng Zhao 4 kuukautta sitten
vanhempi
commit
59b4dd1905

+ 7 - 2
docker/china/Dockerfile

@@ -1,8 +1,13 @@
 # Use the official sglang image
 FROM lmsysorg/sglang:v0.4.8.post1-cu126
 
-# Install libgl for opencv support
-RUN apt-get update && apt-get install -y libgl1 && apt-get clean && rm -rf /var/lib/apt/lists/*
+# Install libgl for opencv support & Noto fonts for Chinese characters
+RUN apt-get update && \
+    apt-get install -y fonts-noto-core fonts-noto-cjk && \
+    apt-get install -y libgl1 && \
+    apt-get clean && \
+    fc-cache -fv && \
+    rm -rf /var/lib/apt/lists/*
 
 # Install mineru latest
 RUN python3 -m pip install -U 'mineru[core]' -i https://mirrors.aliyun.com/pypi/simple --break-system-packages

+ 6 - 1
docker/global/Dockerfile

@@ -2,7 +2,12 @@
 FROM lmsysorg/sglang:v0.4.8.post1-cu126
 
 # Install libgl for opencv support
-RUN apt-get update && apt-get install -y libgl1 && apt-get clean && rm -rf /var/lib/apt/lists/*
+RUN apt-get update && \
+    apt-get install -y fonts-noto-core fonts-noto-cjk && \
+    apt-get install -y libgl1 && \
+    apt-get clean && \
+    fc-cache -fv && \
+    rm -rf /var/lib/apt/lists/*
 
 # Install mineru latest
 RUN python3 -m pip install -U 'mineru[core]' --break-system-packages

+ 1 - 0
mineru/backend/pipeline/model_json_to_middle_json.py

@@ -89,6 +89,7 @@ def page_model_info_to_page_info(page_model_info, image_dict, page, image_writer
                 "type": ContentType.INTERLINE_EQUATION,
                 'score': block['score'],
                 "bbox": block['bbox'],
+                "content": "",
             })
 
         all_bboxes, all_discarded_blocks, footnote_blocks = prepare_block_bboxes(