|
|
@@ -35,7 +35,7 @@ class MinerUVLLMProcessor:
|
|
|
server_url: str = "http://127.0.0.1:8121",
|
|
|
timeout: int = 300,
|
|
|
normalize_numbers: bool = False,
|
|
|
- debug: bool = False):
|
|
|
+ log_level: str = "INFO"):
|
|
|
"""
|
|
|
初始化处理器
|
|
|
|
|
|
@@ -43,12 +43,12 @@ class MinerUVLLMProcessor:
|
|
|
server_url: vLLM 服务器地址
|
|
|
timeout: 请求超时时间
|
|
|
normalize_numbers: 是否标准化数字
|
|
|
- debug: 是否启用调试模式
|
|
|
+ log_level: 日志级别(DEBUG, INFO, WARNING, ERROR),当为 DEBUG 时会打印详细错误信息和保存中间结果
|
|
|
"""
|
|
|
self.server_url = server_url.rstrip('/')
|
|
|
self.timeout = timeout
|
|
|
self.normalize_numbers = normalize_numbers
|
|
|
- self.debug = debug
|
|
|
+ self.log_level = log_level
|
|
|
self.backend = "http-client" # 固定使用 http-client 后端
|
|
|
|
|
|
logger.info(f"MinerU vLLM Processor 初始化完成:")
|
|
|
@@ -56,7 +56,7 @@ class MinerUVLLMProcessor:
|
|
|
logger.info(f" - 后端: vlm-{self.backend}")
|
|
|
logger.info(f" - 超时: {timeout}s")
|
|
|
logger.info(f" - 数字标准化: {normalize_numbers}")
|
|
|
- logger.info(f" - 调试模式: {debug}")
|
|
|
+ logger.info(f" - 日志级别: {log_level}")
|
|
|
|
|
|
def do_parse_single_file(self,
|
|
|
input_file: str,
|
|
|
@@ -130,7 +130,7 @@ class MinerUVLLMProcessor:
|
|
|
|
|
|
except Exception as e:
|
|
|
logger.error(f"Failed to process {file_path}: {e}")
|
|
|
- if self.debug:
|
|
|
+ if self.log_level == "DEBUG":
|
|
|
traceback.print_exc()
|
|
|
return {
|
|
|
"success": False,
|
|
|
@@ -227,8 +227,8 @@ class MinerUVLLMProcessor:
|
|
|
except Exception as e:
|
|
|
logger.warning(f"Failed to draw layout bbox: {e}")
|
|
|
|
|
|
- # 调试模式下保存额外信息
|
|
|
- if self.debug:
|
|
|
+ # DEBUG 模式下保存额外信息(中间结果)
|
|
|
+ if self.log_level == "DEBUG":
|
|
|
# 保存 middle.json
|
|
|
middle_json_str = json.dumps(middle_json, ensure_ascii=False, indent=2)
|
|
|
if self.normalize_numbers:
|
|
|
@@ -247,7 +247,7 @@ class MinerUVLLMProcessor:
|
|
|
|
|
|
except Exception as e:
|
|
|
logger.error(f"Error in _process_output: {e}")
|
|
|
- if self.debug:
|
|
|
+ if self.log_level == "DEBUG":
|
|
|
traceback.print_exc()
|
|
|
|
|
|
return saved_files
|
|
|
@@ -367,7 +367,7 @@ class MinerUVLLMProcessor:
|
|
|
result_info["error"] = str(e)
|
|
|
result_info["success"] = False
|
|
|
logger.error(f"Error processing {image_name}: {e}")
|
|
|
- if self.debug:
|
|
|
+ if self.log_level == "DEBUG":
|
|
|
traceback.print_exc()
|
|
|
|
|
|
finally:
|