Przeglądaj źródła

fix(glmocr_vl_adapter): 更新模型参数以提高识别性能，调整最大令牌数、温度、top_p 和 top_k 值

zhch158_admin 6 dni temu
rodzic
commit
6d0491be49

+ 4 - 4
ocr_tools/universal_doc_parser/config/bank_statement_glm_vl.yaml

@@ -70,10 +70,10 @@ vl_recognition:
     retry_backoff_max_seconds: 8.0
     retry_jitter_ratio: 0.2
     retry_status_codes: [429, 500, 502, 503, 504]
-    max_tokens: 4096
-    temperature: 0.8
-    top_p: 0.9
-    top_k: 50
+    max_tokens: 16384
+    temperature: 0.1
+    top_p: 0.0001
+    top_k: 1
     repetition_penalty: 1.1
   
   # 场景特定配置

+ 4 - 4
ocr_tools/universal_doc_parser/config/bank_statement_yusys_v4.yaml

@@ -170,10 +170,10 @@ vl_recognition:
     retry_backoff_max_seconds: 8.0
     retry_jitter_ratio: 0.2
     retry_status_codes: [429, 500, 502, 503, 504]
-    max_tokens: 4096
-    temperature: 0.8
-    top_p: 0.9
-    top_k: 50
+    max_tokens: 16384
+    temperature: 0.1
+    top_p: 0.0001
+    top_k: 1
     repetition_penalty: 1.1
   
   # 场景特定配置

+ 4 - 4
ocr_tools/universal_doc_parser/models/adapters/glmocr_vl_adapter.py

@@ -83,10 +83,10 @@ class GLMOCRVLRecognizer(BaseVLRecognizer):
         self.retry_max_attempts = model_params.get('retry_max_attempts', 2)
         
         # 生成参数
-        self.max_tokens = model_params.get('max_tokens', 4096)
-        self.temperature = model_params.get('temperature', 0.8)
-        self.top_p = model_params.get('top_p', 0.9)
-        self.top_k = model_params.get('top_k', 50)
+        self.max_tokens = model_params.get('max_tokens', 16384)
+        self.temperature = model_params.get('temperature', 0.1)
+        self.top_p = model_params.get('top_p', 0.00001)
+        self.top_k = model_params.get('top_k', 1)
         self.repetition_penalty = model_params.get('repetition_penalty', 1.1)
         
         logger.info(f"GLM-OCR VL Recognizer configured with max_image_size={self.max_image_size}")