6 månader sedan · 46ea5db8ff
--- a/llmops/agents/outline_agent.py
+++ b/llmops/agents/outline_agent.py
@@ -38,6 +38,7 @@ import requests
 
				 from datetime import datetime
			
 
				 
			
 
				 from pydantic import BaseModel, Field
			
 
				+from llmops.config import RULES_ENGINE_BASE_URL
			
 
				 
			
 
				 
			
 
				 # 数据模型定义（与现有项目兼容）
			
@@ -158,30 +159,8 @@ class OutlineGeneratorAgent:
 
				                             "dependencies": []
			
 
				                         })
			
 
				 
			
 
				-        # 注意：现在依赖LLM根据提示词生成包含所有必需指标的大纲，不再在代码中强制添加
			
 
				-
			
 
				-        # 如果LLM没有提供任何指标，则自动补充基础指标
			
 
				-        if not global_metrics:
			
 
				-            print("⚠️ LLM未提供指标，使用默认基础指标")
			
 
				-            available_metrics = self._load_available_metrics()
			
 
				-
			
 
				-            # 选择前5个基础指标
			
 
				-            base_metrics = [m for m in available_metrics if m.get('type') == '基础统计指标'][:5]
			
 
				-
			
 
				-            for metric in base_metrics:
			
 
				-                metric_name = metric['name']
			
 
				-                knowledge_id = f"metric-{metric_name}"
			
 
				-                if sections:  # 确保有章节
			
 
				-                    sections[0]["metrics_needed"].append(knowledge_id)  # 添加到第一个章节
			
 
				-                global_metrics.append({
			
 
				-                    "metric_id": knowledge_id,
			
 
				-                    "metric_name": metric_name,
			
 
				-                    "calculation_logic": f"使用规则引擎计算{metric_name}: {metric.get('description', '')}",
			
 
				-                    "required_fields": ["transactions"],
			
 
				-                    "dependencies": []
			
 
				-                })
			
 
				-
			
 
				-        print(f"📊 最终生成 {len(global_metrics)} 个指标")
			
 
				+        # 完全依赖LLM生成包含所有必需指标的大纲
			
 
				+        print(f"🤖 大模型生成 {len(global_metrics)} 个指标")
			
 
				 
			
 
				         return {
			
 
				             "report_title": new_format_data.get("chapter_title", "流水分析报告"),
			
@@ -189,7 +168,7 @@ class OutlineGeneratorAgent:
 
				             "global_metrics": global_metrics
			
 
				         }
			
 
				 
			
 
				-    def create_prompt(self) -> str:
			
 
				+    def create_prompt(self, question: str, industry: str) -> str:
			
 
				         """创建大纲生成提示"""
			
 
				 
			
 
				         # 从API动态获取可用的指标列表
			
@@ -203,15 +182,12 @@ class OutlineGeneratorAgent:
 
				         # 构建基础提示词
			
 
				         base_prompt = f"""[角色定义]
			
 
				 你的角色是: 流水分析报告的大纲生成模块。
			
 
				-你的目标是:
			
 
				-基于输入的流水分析业务背景信息,
			
 
				-生成一份可交付、结构清晰、可被程序解析的流水分析报告大纲,
			
 
				-并以结构化 JSON 的形式，明确每个章节及其下属分析主题所需的分析指标与分析项要求,
			
 
				-以指导后续分析能力的调用。
			
 
				+你的目标是:{question},生成一份针对{industry}行业的全面的流水分析报告大纲。
			
 
				+生成结构清晰、可被程序解析的JSON格式大纲，明确每个章节及其下属分析主题所需的分析指标。
			
 
				 
			
 
				 [职责边界]
			
 
				 你只能完成以下事项:
			
 
				-1.确定流水分析报告应包含的章节结构
			
 
				+1.确定{industry}流水分析报告应包含的章节结构
			
 
				 2.明确每个章节下需要覆盖的分析主题
			
 
				 3.为每个分析主题列出所需的计算指标、统计指标或分析指标
			
 
				 
			
@@ -226,42 +202,62 @@ class OutlineGeneratorAgent:
 
				 
			
 
				 [可用指标总览]
			
 
				 系统当前支持 {len(available_metrics)} 个指标。
			
 
				+指标内容为{available_metrics}
			
 
				 
			
 
				 [重要要求]
			
 
				-请根据用户需求和可用指标列表，从上述指标中选择最相关的指标。优先选择基础统计指标和时间分析指标，确保报告的完整性和实用性。
			
 
				+请根据用户需求和可用指标列表，从上述指标中选择最相关的指标。必须基于用户查询的具体需求进行智能匹配，确保选择的指标能够充分满足分析需求。
			
 
				 
			
 
				 [强制要求]
			
 
				 生成大纲时，请：
			
 
				-1. 从可用指标中选择合适的指标组合
			
 
				-2. 确保选择的指标能够满足用户分析需求
			
 
				-3. 在metrics_needed数组中列出选定的指标名称
			
 
				-4. 在global_metrics数组中包含对应指标的详细定义
			
 
				+1. 仔细分析用户查询，识别所有提到的分析需求点
			
 
				+2. 从可用指标中选择能够满足这些需求的完整指标组合
			
 
				+3. 基于语义相关性进行指标筛选，不要过于保守
			
 
				+4. 在各章节的metrics对象中，按照指标类型(calculation_metrics/statistical_metrics/analysis_metrics)列出选定的指标
			
 
				+5. 为每个指标提供metric_name和metric_description字段
			
 
				+6. 优先选择与用户查询直接相关的指标
			
 
				 
			
 
				 [可选择的指标列表]
			
 
				 {metrics_list_text}
			
 
				 
			
 
				-[重要兼容性要求]
			
 
				-虽然你必须使用上述JSON结构输出，但为了确保与现有系统的兼容性，请在输出中额外包含以下字段：
			
 
				-- 在根级别添加 "report_title": "流水分析报告"
			
 
				-- 在根级别添加 "global_metrics": [] (空数组或根据实际需求填充指标定义)
			
 
				-- 确保输出能被现有系统正确解析和使用
			
 
				+[重要说明]
			
 
				+请确保：
			
 
				+- 从提供的可用指标列表中选择最相关的指标
			
 
				+- 为每个选定的指标提供清晰的名称和描述
			
 
				+- 输出格式必须严格遵循上述JSON结构
			
 
				+- 确保选择的指标能够满足用户查询的具体分析需求
			
 
				 
			
 
				 [输出格式要求]
			
 
				 你必须且只能以 JSON 字符串 形式输出分析大纲，不得输出任何解释性自然语言。
			
 
				 JSON 必须严格遵循以下结构约定:
			
 
				 {{
			
 
				-  "chapter_id": "string",
			
 
				   "chapter_title": "string",
			
 
				-  "chapter_type": "string",
			
 
				   "sections": [
			
 
				     {{
			
 
				       "section_id": "string",
			
 
				       "section_title": "string",
			
 
				       "section_description": "string",
			
 
				-      "metrics_needed": ["string"]
			
 
				+      "metrics": {{
			
 
				+        "calculation_metrics": [
			
 
				+          {{
			
 
				+            "metric_name": "string",
			
 
				+            "metric_description": "string"
			
 
				+          }}
			
 
				+        ],
			
 
				+        "statistical_metrics": [
			
 
				+          {{
			
 
				+            "metric_name": "string",
			
 
				+            "metric_description": "string"
			
 
				+          }}
			
 
				+        ],
			
 
				+        "analysis_metrics": [
			
 
				+          {{
			
 
				+            "metric_name": "string",
			
 
				+            "metric_description": "string"
			
 
				+          }}
			
 
				+        ]
			
 
				+      }}
			
 
				     }}
			
 
				-  ],
			
 
				-  "global_metrics": []
			
 
				+  ]
			
 
				 }}"""
			
 
				 
			
 
				         return base_prompt
			
@@ -277,7 +273,7 @@ JSON 必须严格遵循以下结构约定:
 
				 
			
 
				     async def generate_outline(self, question: str, industry: str, sample_data: List[Dict[str, Any]]) -> ReportOutline:
			
 
				         """异步生成大纲（修复版：自动补全缺失字段）"""
			
 
				-        prompt = self.create_prompt()
			
 
				+        prompt = self.create_prompt(question, industry)
			
 
				 
			
 
				         # 在prompt末尾添加业务背景信息
			
 
				         full_prompt = f"""{prompt}
			
@@ -355,7 +351,8 @@ JSON 必须严格遵循以下结构约定:
 
				         # 保存API结果到文件
			
 
				         api_results_dir = "api_results"
			
 
				         os.makedirs(api_results_dir, exist_ok=True)
			
 
				-        filename = f"{call_id}.json"
			
 
				+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
			
 
				+        filename = f"{timestamp}_{call_id}.json"
			
 
				         filepath = os.path.join(api_results_dir, filename)
			
 
				 
			
 
				         try:
			
@@ -370,13 +367,13 @@ JSON 必须严格遵循以下结构约定:
 
				         print("========================================")
			
 
				 
			
 
				         # 后处理，补全缺失的section_id和metric_id
			
 
				-        outline = self._post_process_outline(outline)
			
 
				+        outline = self._post_process_outline(outline, question, industry)
			
 
				 
			
 
				         return outline
			
 
				 
			
 
				-    def _post_process_outline(self, outline: ReportOutline) -> ReportOutline:
			
 
				+    def _post_process_outline(self, outline: ReportOutline, question: str, industry: str) -> ReportOutline:
			
 
				         """
			
 
				-        后处理大纲，自动补全缺失的必需字段
			
 
				+        后处理大纲，自动补全缺失的必需字段，并基于查询优化指标
			
 
				         """
			
 
				         # 为章节补全section_id
			
 
				         for idx, section in enumerate(outline.sections):
			
@@ -402,6 +399,11 @@ JSON 必须严格遵循以下结构约定:
 
				                     metric.calculation_logic
			
 
				                 )
			
 
				 
			
 
				+        # 基于用户查询进行指标优化筛选
			
 
				+        if hasattr(outline, 'global_metrics') and outline.global_metrics:
			
 
				+            print(f"📊 AI选择了 {len(outline.global_metrics)} 个指标，进行智能优化...")
			
 
				+            outline = self._optimize_metrics_by_query(outline, question, industry)
			
 
				+
			
 
				         return outline
			
 
				 
			
 
				     def _infer_required_fields(self, logic: str) -> List[str]:
			
@@ -424,6 +426,293 @@ JSON 必须严格遵循以下结构约定:
 
				 
			
 
				         return list(set(fields))
			
 
				 
			
 
				+    def _optimize_metrics_by_query(self, outline: ReportOutline, question: str, industry: str) -> ReportOutline:
			
 
				+        """
			
 
				+        基于用户查询进行智能指标优化
			
 
				+        """
			
 
				+        # 获取所有可用指标
			
 
				+        available_metrics = self._load_available_metrics()
			
 
				+
			
 
				+        # 已选择的指标名称集合
			
 
				+        selected_metric_names = {m.metric_name for m in outline.global_metrics}
			
 
				+
			
 
				+        # 基于用户查询进行语义匹配，找出缺失的关键指标
			
 
				+        query_keywords = self._extract_query_keywords(question, industry)
			
 
				+        missing_key_metrics = self._find_missing_key_metrics(
			
 
				+            available_metrics, selected_metric_names, query_keywords
			
 
				+        )
			
 
				+
			
 
				+        # 补充缺失的关键指标
			
 
				+        supplemented_count = 0
			
 
				+        for metric_name in missing_key_metrics:
			
 
				+            # 找到对应的可用指标信息
			
 
				+            available_metric = next((m for m in available_metrics if m['name'] == metric_name), None)
			
 
				+            if available_metric:
			
 
				+                # 创建MetricRequirement对象
			
 
				+                metric_req = MetricRequirement(
			
 
				+                    metric_id=f"metric-{metric_name}",
			
 
				+                    metric_name=metric_name,
			
 
				+                    calculation_logic=f"使用规则引擎计算{metric_name}",
			
 
				+                    required_fields=["transactions"],
			
 
				+                    dependencies=[]
			
 
				+                )
			
 
				+                outline.global_metrics.append(metric_req)
			
 
				+                supplemented_count += 1
			
 
				+                print(f"  补充关键指标: {metric_name}")
			
 
				+
			
 
				+        if supplemented_count > 0:
			
 
				+            print(f"✅ 基于查询分析补充了 {supplemented_count} 个关键指标，总计 {len(outline.global_metrics)} 个指标")
			
 
				+
			
 
				+        # 智能分配章节指标需求
			
 
				+        self._smart_assign_section_metrics(outline)
			
 
				+
			
 
				+        return outline
			
 
				+
			
 
				+    def _extract_query_keywords(self, question: str, industry: str) -> List[str]:
			
 
				+        """
			
 
				+        通过大模型从用户查询中提取关键词
			
 
				+
			
 
				+        Args:
			
 
				+            question: 用户查询
			
 
				+            industry: 行业信息
			
 
				+
			
 
				+        Returns:
			
 
				+            关键词列表
			
 
				+        """
			
 
				+        try:
			
 
				+            keyword_prompt = ChatPromptTemplate.from_messages([
			
 
				+                ("system", """你是一个专业的关键词提取专家，需要从用户查询中提取关键的分析指标和业务术语。
			
 
				+
			
 
				+请分析查询内容，识别出用户关心的核心指标、分析维度和业务概念。
			
 
				+
			
 
				+返回格式：
			
 
				+请以逗号分隔的关键词列表形式返回，不要其他解释。
			
 
				+
			
 
				+示例：
			
 
				+收入分析, 支出统计, 交易对手, 时间趋势, 占比分析"""),
			
 
				+                ("human", """用户查询：{question}
			
 
				+行业背景：{industry}
			
 
				+
			
 
				+请提取这个查询中的关键分析指标和业务术语。""")
			
 
				+            ])
			
 
				+
			
 
				+            chain = keyword_prompt | self.llm
			
 
				+            result = chain.invoke({
			
 
				+                "question": question,
			
 
				+                "industry": industry
			
 
				+            })
			
 
				+
			
 
				+            keywords_text = result.content.strip()
			
 
				+            # 按逗号分割并清理空白
			
 
				+            keywords = [kw.strip() for kw in keywords_text.split(',') if kw.strip()]
			
 
				+
			
 
				+            print(f"🔍 提取到查询关键词: {keywords}")
			
 
				+            return keywords
			
 
				+
			
 
				+        except Exception as e:
			
 
				+            print(f"⚠️ 关键词提取失败，使用简单分词: {str(e)}")
			
 
				+            # 备选方案：简单的文本分词
			
 
				+            import re
			
 
				+            # 移除标点符号，提取中文词组
			
 
				+            text = re.sub(r'[^\u4e00-\u9fa5a-zA-Z]', ' ', question)
			
 
				+            words = [w for w in text.split() if len(w) > 1]
			
 
				+            print(f"🔄 备选关键词: {words}")
			
 
				+            return words
			
 
				+
			
 
				+    def _find_missing_key_metrics(self, available_metrics: List[Dict], selected_metric_names: set,
			
 
				+                                  query_keywords: List[str]) -> List[str]:
			
 
				+        """
			
 
				+        基于查询关键词找出缺失的关键指标
			
 
				+
			
 
				+        Args:
			
 
				+            available_metrics: 所有可用指标
			
 
				+            selected_metric_names: 已选择的指标名称集合
			
 
				+            query_keywords: 查询关键词
			
 
				+
			
 
				+        Returns:
			
 
				+            缺失的关键指标名称列表
			
 
				+        """
			
 
				+        if not query_keywords or not available_metrics:
			
 
				+            return []
			
 
				+
			
 
				+        try:
			
 
				+            missing_prompt = ChatPromptTemplate.from_messages([
			
 
				+                ("system", """你是一个专业的指标推荐专家，需要根据用户查询的关键词，识别出可能缺失的关键指标。
			
 
				+
			
 
				+请分析：
			
 
				+1. 用户关心的分析维度（收入、支出、排名、趋势等）
			
 
				+2. 已选择的指标
			
 
				+3. 可用的指标库
			
 
				+
			
 
				+推荐一些重要的缺失指标，帮助完善分析报告。
			
 
				+
			
 
				+返回格式：
			
 
				+只返回指标名称列表，用换行符分隔，不要其他解释。
			
 
				+
			
 
				+示例：
			
 
				+总收入分析
			
 
				+支出占比统计
			
 
				+交易对手排名"""),
			
 
				+                ("human", """查询关键词：{keywords}
			
 
				+
			
 
				+已选择的指标：
			
 
				+{selected_metrics}
			
 
				+
			
 
				+可用指标库：
			
 
				+{available_metrics}
			
 
				+
			
 
				+请推荐一些重要的缺失指标。""")
			
 
				+            ])
			
 
				+
			
 
				+            # 格式化输入
			
 
				+            selected_list = '\n'.join(selected_metric_names) if selected_metric_names else '无'
			
 
				+            available_list = '\n'.join([m.get('name', '') for m in available_metrics if m.get('name')])
			
 
				+
			
 
				+            chain = missing_prompt | self.llm
			
 
				+            result = chain.invoke({
			
 
				+                "keywords": ', '.join(query_keywords),
			
 
				+                "selected_metrics": selected_list,
			
 
				+                "available_metrics": available_list
			
 
				+            })
			
 
				+
			
 
				+            # 解析结果
			
 
				+            recommended_metrics = []
			
 
				+            for line in result.content.strip().split('\n'):
			
 
				+                metric_name = line.strip()
			
 
				+                if metric_name and metric_name not in selected_metric_names:
			
 
				+                    # 验证指标是否存在于可用指标库中
			
 
				+                    if any(m.get('name') == metric_name for m in available_metrics):
			
 
				+                        recommended_metrics.append(metric_name)
			
 
				+
			
 
				+            print(f"📊 推荐缺失指标: {recommended_metrics}")
			
 
				+            return recommended_metrics
			
 
				+
			
 
				+        except Exception as e:
			
 
				+            print(f"⚠️ 指标推荐失败: {str(e)}")
			
 
				+            return []
			
 
				+
			
 
				+    def _smart_assign_section_metrics(self, outline: ReportOutline) -> None:
			
 
				+        """
			
 
				+        智能分配章节指标需求
			
 
				+
			
 
				+        Args:
			
 
				+            outline: 报告大纲对象，会被原地修改
			
 
				+        """
			
 
				+        if not outline.sections or not outline.global_metrics:
			
 
				+            return
			
 
				+
			
 
				+        try:
			
 
				+            # 获取所有可用的指标ID
			
 
				+            available_metric_ids = {m.metric_id for m in outline.global_metrics}
			
 
				+
			
 
				+            assign_prompt = ChatPromptTemplate.from_messages([
			
 
				+                ("system", """你是一个专业的报告结构专家，需要将全局指标智能分配到各个章节。
			
 
				+
			
 
				+分配原则：
			
 
				+1. 每个章节分配3-5个最相关的指标
			
 
				+2. 指标应与章节内容高度相关
			
 
				+3. 避免重复分配相同的指标
			
 
				+4. 优先分配核心指标到主要章节
			
 
				+
			
 
				+返回格式：
			
 
				+为每个章节返回指标ID列表，用分号分隔章节，格式如下：
			
 
				+章节ID:指标ID1,指标ID2,指标ID3
			
 
				+
			
 
				+示例：
			
 
				+sec_1:metric-total_income,metric-expense_trend,metric-profit_margin
			
 
				+sec_2:metric-customer_analysis,metric-market_share"""),
			
 
				+                ("human", """报告标题：{report_title}
			
 
				+
			
 
				+章节列表：
			
 
				+{sections}
			
 
				+
			
 
				+可用指标：
			
 
				+{available_metrics}
			
 
				+
			
 
				+请为每个章节分配最合适的指标ID。""")
			
 
				+            ])
			
 
				+
			
 
				+            # 格式化输入
			
 
				+            sections_text = '\n'.join([
			
 
				+                f"{section.section_id}: {section.title} - {section.description}"
			
 
				+                for section in outline.sections
			
 
				+            ])
			
 
				+
			
 
				+            available_metrics_text = '\n'.join([
			
 
				+                f"{m.metric_id}: {m.metric_name} - {m.calculation_logic}"
			
 
				+                for m in outline.global_metrics
			
 
				+            ])
			
 
				+
			
 
				+            chain = assign_prompt | self.llm
			
 
				+            result = chain.invoke({
			
 
				+                "report_title": outline.report_title,
			
 
				+                "sections": sections_text,
			
 
				+                "available_metrics": available_metrics_text
			
 
				+            })
			
 
				+
			
 
				+            # 解析结果并分配指标
			
 
				+            lines = result.content.strip().split('\n')
			
 
				+            assigned_metrics = set()  # 避免重复分配
			
 
				+
			
 
				+            for line in lines:
			
 
				+                if ':' not in line:
			
 
				+                    continue
			
 
				+
			
 
				+                section_id, metrics_str = line.split(':', 1)
			
 
				+                section_id = section_id.strip()
			
 
				+
			
 
				+                # 找到对应的章节
			
 
				+                section = next((s for s in outline.sections if s.section_id == section_id), None)
			
 
				+                if not section:
			
 
				+                    continue
			
 
				+
			
 
				+                # 解析指标ID列表
			
 
				+                metric_ids = [mid.strip() for mid in metrics_str.split(',') if mid.strip()]
			
 
				+
			
 
				+                # 验证指标ID并分配（避免重复）
			
 
				+                valid_metrics = []
			
 
				+                for metric_id in metric_ids:
			
 
				+                    if metric_id in available_metric_ids and metric_id not in assigned_metrics:
			
 
				+                        valid_metrics.append(metric_id)
			
 
				+                        assigned_metrics.add(metric_id)
			
 
				+
			
 
				+                    # 每个章节最多分配5个指标
			
 
				+                    if len(valid_metrics) >= 5:
			
 
				+                        break
			
 
				+
			
 
				+                section.metrics_needed = valid_metrics
			
 
				+                print(f"📋 章节 '{section.title}' 分配了 {len(valid_metrics)} 个指标: {valid_metrics}")
			
 
				+
			
 
				+            # 检查是否有章节没有分配到指标，如果有则平均分配剩余指标
			
 
				+            unassigned_sections = [s for s in outline.sections if not s.metrics_needed]
			
 
				+            remaining_metrics = [m.metric_id for m in outline.global_metrics if m.metric_id not in assigned_metrics]
			
 
				+
			
 
				+            if unassigned_sections and remaining_metrics:
			
 
				+                print(f"🔄 为 {len(unassigned_sections)} 个未分配章节平均分配剩余指标")
			
 
				+                metrics_per_section = max(1, len(remaining_metrics) // len(unassigned_sections))
			
 
				+
			
 
				+                for i, section in enumerate(unassigned_sections):
			
 
				+                    start_idx = i * metrics_per_section
			
 
				+                    end_idx = min(start_idx + metrics_per_section, len(remaining_metrics))
			
 
				+                    section.metrics_needed = remaining_metrics[start_idx:end_idx]
			
 
				+                    print(f"📋 章节 '{section.title}' 分配了 {len(section.metrics_needed)} 个指标: {section.metrics_needed}")
			
 
				+
			
 
				+        except Exception as e:
			
 
				+            print(f"⚠️ 智能指标分配失败，使用平均分配: {str(e)}")
			
 
				+            # 备选方案：平均分配所有指标到各个章节
			
 
				+            if outline.sections and outline.global_metrics:
			
 
				+                all_metric_ids = [m.metric_id for m in outline.global_metrics]
			
 
				+                metrics_per_section = max(1, len(all_metric_ids) // len(outline.sections))
			
 
				+
			
 
				+                for i, section in enumerate(outline.sections):
			
 
				+                    start_idx = i * metrics_per_section
			
 
				+                    end_idx = min(start_idx + metrics_per_section, len(all_metric_ids))
			
 
				+                    section.metrics_needed = all_metric_ids[start_idx:end_idx]
			
 
				+                    print(f"🔄 备选分配 - 章节 '{section.title}' 分配了 {len(section.metrics_needed)} 个指标")
			
 
				+
			
 
				+   
			
 
				+   
			
 
				+
			
 
				     def _load_available_knowledge(self) -> List[Dict[str, Any]]:
			
 
				         """
			
 
				         从规则引擎获取可用的知识元数据
			
@@ -432,7 +721,7 @@ JSON 必须严格遵循以下结构约定:
 
				             知识元数据列表，包含id和description
			
 
				         """
			
 
				         try:
			
 
				-            url = "http://10.192.72.11:31809/api/rules/getKnowledgeMeta"
			
 
				+            url = f"{RULES_ENGINE_BASE_URL}/api/rules/getKnowledgeMeta"
			
 
				             headers = {
			
 
				                 "Accept": "*/*",
			
 
				                 "Accept-Encoding": "gzip, deflate, br",
			
@@ -518,7 +807,7 @@ JSON 必须严格遵循以下结构约定:
 
				 
			
 
				     def _match_metric_to_knowledge(self, metric_name: str, metric_description: str) -> str:
			
 
				         """
			
 
				-        根据指标名称和描述匹配最合适的知识ID
			
 
				+        通过大模型判断指标是否与可用知识匹配
			
 
				 
			
 
				         Args:
			
 
				             metric_name: 指标名称
			
@@ -530,7 +819,7 @@ JSON 必须严格遵循以下结构约定:
 
				         if not self.available_knowledge:
			
 
				             return ""
			
 
				 
			
 
				-        # 精确匹配：直接用指标名称匹配知识ID
			
 
				+        # 首先尝试精确匹配：直接用指标名称匹配知识ID
			
 
				         for knowledge in self.available_knowledge:
			
 
				             knowledge_id = knowledge.get("id", "")
			
 
				             # 去掉前缀匹配，如 "metric-分析账户数量" 匹配 "分析账户数量"
			
@@ -538,84 +827,66 @@ JSON 必须严格遵循以下结构约定:
 
				                 print(f"🔗 精确匹配指标 '{metric_name}' -> 知识ID: {knowledge_id}")
			
 
				                 return knowledge_id
			
 
				 
			
 
				-        # 扩展匹配：匹配更多的农业相关指标
			
 
				-        if "农业" in metric_name:
			
 
				-            if "总经营收入" in metric_name:
			
 
				-                # 匹配农业总经营收入
			
 
				-                for knowledge in self.available_knowledge:
			
 
				-                    if knowledge.get("id") == "metric-农业总经营收入":
			
 
				-                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业总经营收入")
			
 
				-                        return "metric-农业总经营收入"
			
 
				-            if "总经营支出" in metric_name:
			
 
				-                # 匹配农业总经营支出
			
 
				-                for knowledge in self.available_knowledge:
			
 
				-                    if knowledge.get("id") == "metric-农业总经营支出":
			
 
				-                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业总经营支出")
			
 
				-                        return "metric-农业总经营支出"
			
 
				-            if "交易对手收入排名TOP3" in metric_name or "收入排名" in metric_name:
			
 
				-                # 匹配农业交易对手收入TOP3
			
 
				-                for knowledge in self.available_knowledge:
			
 
				-                    if knowledge.get("id") == "metric-农业交易对手经营收入top3":
			
 
				-                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业交易对手经营收入top3")
			
 
				-                        return "metric-农业交易对手经营收入top3"
			
 
				-            if "交易对手支出排名TOP3" in metric_name or "支出排名" in metric_name:
			
 
				-                # 匹配农业交易对手支出TOP3
			
 
				-                for knowledge in self.available_knowledge:
			
 
				-                    if knowledge.get("id") == "metric-农业交易对手经营支出top3":
			
 
				-                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业交易对手经营支出top3")
			
 
				-                        return "metric-农业交易对手经营支出top3"
			
 
				-
			
 
				-        # 如果精确匹配失败，使用关键词匹配
			
 
				-        keywords = [metric_name]
			
 
				-        if metric_description:
			
 
				-            # 从描述中提取关键信息
			
 
				-            desc_lower = metric_description.lower()
			
 
				-            if "收入" in metric_name or "收入" in desc_lower:
			
 
				-                keywords.extend(["收入", "总收入", "经营收入"])
			
 
				-            if "支出" in metric_name or "支出" in desc_lower:
			
 
				-                keywords.extend(["支出", "总支出", "经营支出"])
			
 
				-            if "排名" in metric_name or "top" in desc_lower:
			
 
				-                keywords.append("排名")
			
 
				-            if "比例" in metric_name or "占比" in desc_lower:
			
 
				-                keywords.append("比例")
			
 
				-            if "时间范围" in metric_name:
			
 
				-                keywords.append("时间范围")
			
 
				-            if "账户" in metric_name:
			
 
				-                keywords.append("账户")
			
 
				-
			
 
				-        best_match = None
			
 
				-        best_score = 0
			
 
				+        # 使用大模型进行语义匹配
			
 
				+        match_prompt = ChatPromptTemplate.from_messages([
			
 
				+            ("system", """你是一个专业的指标匹配专家，需要根据指标名称和描述，从提供的知识库中找到最合适的匹配项。
			
 
				 
			
 
				-        for knowledge in self.available_knowledge:
			
 
				-            knowledge_id = knowledge.get("id", "")
			
 
				-            knowledge_desc = knowledge.get("description", "").lower()
			
 
				+请分析指标的语义含义和计算逻辑，判断哪个知识项最匹配。
			
 
				 
			
 
				-            # 计算匹配分数
			
 
				-            score = 0
			
 
				-            for keyword in keywords:
			
 
				-                if keyword.lower() in knowledge_desc:
			
 
				-                    score += 1
			
 
				+返回格式：
			
 
				+如果找到匹配：返回知识ID
			
 
				+如果未找到匹配：返回空字符串 ""
			
 
				 
			
 
				-            # 行业匹配加分
			
 
				-            if "黑色金属" in knowledge_desc and "黑色金属" in metric_name:
			
 
				-                score += 2
			
 
				-            if "农业" in knowledge_desc and "农业" in metric_name:
			
 
				-                score += 2
			
 
				+只返回知识ID或空字符串，不要其他解释。"""),
			
 
				+            ("human", """指标信息：
			
 
				+名称：{metric_name}
			
 
				+描述：{metric_description}
			
 
				 
			
 
				-            # 直接名称匹配加分
			
 
				-            if metric_name.lower() in knowledge_desc:
			
 
				-                score += 3
			
 
				+可用知识库：
			
 
				+{knowledge_list}
			
 
				 
			
 
				-            if score > best_score:
			
 
				-                best_score = score
			
 
				-                best_match = knowledge_id
			
 
				+请判断这个指标是否与知识库中的某个项目匹配。如果匹配，返回对应的知识ID；如果不匹配，返回空字符串。""")
			
 
				+        ])
			
 
				 
			
 
				-        if best_match and best_score > 0:
			
 
				-            print(f"🔗 关键词匹配指标 '{metric_name}' -> 知识ID: {best_match} (匹配分数: {best_score})")
			
 
				-            return best_match
			
 
				+        # 构建知识库描述
			
 
				+        knowledge_list = "\n".join([
			
 
				+            f"ID: {k.get('id', '')}\n描述: {k.get('description', '')}"
			
 
				+            for k in self.available_knowledge
			
 
				+        ])
			
 
				 
			
 
				-        print(f"❌ 指标 '{metric_name}' 未找到匹配的知识ID")
			
 
				-        return ""
			
 
				+        try:
			
 
				+            # 调用大模型进行匹配
			
 
				+            chain = match_prompt | self.llm
			
 
				+            result = chain.invoke({
			
 
				+                "metric_name": metric_name,
			
 
				+                "metric_description": metric_description or "无描述",
			
 
				+                "knowledge_list": knowledge_list
			
 
				+            })
			
 
				+
			
 
				+            matched_knowledge_id = result.content.strip()
			
 
				+
			
 
				+            # 验证返回的知识ID是否存在于可用知识中
			
 
				+            if matched_knowledge_id and any(k.get("id") == matched_knowledge_id for k in self.available_knowledge):
			
 
				+                print(f"🤖 大模型匹配指标 '{metric_name}' -> 知识ID: {matched_knowledge_id}")
			
 
				+                return matched_knowledge_id
			
 
				+            else:
			
 
				+                print(f"❌ 大模型未找到指标 '{metric_name}' 的匹配项")
			
 
				+                return ""
			
 
				+
			
 
				+        except Exception as e:
			
 
				+            print(f"⚠️ 大模型匹配失败，使用备选方案: {str(e)}")
			
 
				+            # 备选方案：简单的关键词匹配（不包含特定业务逻辑）
			
 
				+            for knowledge in self.available_knowledge:
			
 
				+                knowledge_id = knowledge.get("id", "")
			
 
				+                knowledge_desc = knowledge.get("description", "").lower()
			
 
				+
			
 
				+                # 检查指标名称是否在知识描述中出现
			
 
				+                if metric_name.lower() in knowledge_desc:
			
 
				+                    print(f"🔄 备选匹配指标 '{metric_name}' -> 知识ID: {knowledge_id}")
			
 
				+                    return knowledge_id
			
 
				+
			
 
				+            print(f"❌ 指标 '{metric_name}' 未找到匹配的知识ID")
			
 
				+            return ""
			
 
				 
			
 
				 
			
 
				 async def generate_report_outline(question: str, industry: str, sample_data: List[Dict[str, Any]], api_key: str, max_retries: int = 3, retry_delay: float = 2.0) -> ReportOutline:
			
@@ -674,7 +945,7 @@ async def generate_report_outline(question: str, industry: str, sample_data: Lis
 
				     print("⚠️ 所有重试均失败，使用默认大纲结构")
			
 
				 
			
 
				     # 获取实际可用的指标来构建默认大纲
			
 
				-    available_metrics = self._load_available_metrics()
			
 
				+    available_metrics = agent._load_available_metrics()
			
 
				 
			
 
				     # 选择一些基础指标作为默认值
			
 
				     default_metric_ids = []
			
--- a/llmops/agents/planning_agent.py
+++ b/llmops/agents/planning_agent.py
@@ -1,31 +1,3 @@
 
				-"""
			
 
				-规划Agent (Planning Agent)
			
 
				-=========================
			
 
				-
			
 
				-此Agent负责分析当前状态并做出智能决策，决定下一步行动。
			
 
				-
			
 
				-核心功能：
			
 
				-1. 状态评估：分析大纲、指标计算进度和完整性
			
 
				-2. 决策制定：决定生成大纲、计算指标、完成报告或澄清需求
			
 
				-3. 优先级排序：确定最关键的任务和指标
			
 
				-4. 流程控制：管理整个报告生成工作流的执行顺序
			
 
				-
			
 
				-决策逻辑：
			
 
				-- 大纲为空 → 生成大纲
			
 
				-- 指标覆盖率 < 80% → 计算指标
			
 
				-- 指标覆盖率 ≥ 80% → 生成报告
			
 
				-- 需求模糊 → 澄清需求
			
 
				-
			
 
				-技术实现：
			
 
				-- 使用LangChain和结构化输出
			
 
				-- 支持异步处理
			
 
				-- 智能状态评估
			
 
				-- 灵活的决策机制
			
 
				-
			
 
				-作者: Big Agent Team
			
 
				-版本: 1.0.0
			
 
				-创建时间: 2024-12-20
			
 
				-"""
			
 
				 
			
 
				 from typing import List, Dict, Optional, Any, Union
			
 
				 from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
			
@@ -119,11 +91,9 @@ class PlanningAgent:
 
				         return ChatPromptTemplate.from_messages([
			
 
				             ("system", """你是报告规划总控智能体，核心职责是精准分析当前状态并决定下一步行动。
			
 
				 
			
 
				-### 决策选项（四选一）
			
 
				+### 决策选项（二选一）
			
 
				 1. generate_outline：大纲未生成或大纲无效
			
 
				-2. compute_metrics：大纲已生成但指标未完成（覆盖率<80%）
			
 
				-3. finalize_report：指标覆盖率≥80%，信息充足
			
 
				-4. clarify_requirements：用户需求模糊，缺少关键信息
			
 
				+2. compute_metrics：大纲已生成但指标未完成
			
 
				 
			
 
				 ### 决策规则（按顺序检查）
			
 
				 1. 检查 outline_draft 是否为空 → 空则选择 generate_outline
			
@@ -145,10 +115,8 @@ class PlanningAgent:
 
				 ### 输出字段说明
			
 
				 - decision: 决策字符串
			
 
				 - reasoning: 决策原因说明
			
 
				-- next_actions: 动作列表（可选）
			
 
				-- metrics_to_compute: 待计算指标ID列表，必须从状态信息中的可用指标ID中选择（决策为compute_metrics时必须提供）
			
 
				-- priority_metrics: 优先级指标列表（前2-3个最重要的指标）
			
 
				-- additional_requirements: 额外需求（可选）
			
 
				+- metrics_to_compute: 待计算指标ID列表，必须从状态信息中的"有效待计算指标ID列表"中选择。选择所有可用指标，除非指标数量过多（>10个）需要分批计算
			
 
				+- priority_metrics: 优先级指标列表（前2-3个最重要的指标），从metrics_to_compute中选择
			
 
				 
			
 
				 必须输出有效的JSON格式！"""),
			
 
				 
			
@@ -266,7 +234,8 @@ class PlanningAgent:
 
				         # 保存API结果到文件
			
 
				         api_results_dir = "api_results"
			
 
				         os.makedirs(api_results_dir, exist_ok=True)
			
 
				-        filename = f"{call_id}.json"
			
 
				+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
			
 
				+        filename = f"{timestamp}_{call_id}.json"
			
 
				         filepath = os.path.join(api_results_dir, filename)
			
 
				 
			
 
				         try:
			
@@ -301,9 +270,10 @@ class PlanningAgent:
 
				 
			
 
				         # 获取可用的指标ID
			
 
				         available_metric_ids = []
			
 
				-        if state.get('outline_draft') and state.get('outline_draft').get('global_metrics'):
			
 
				-            available_metric_ids = [m.get('metric_id', '') for m in state['outline_draft']['global_metrics']]
			
 
				-            available_metric_ids = [mid for mid in available_metric_ids if mid]  # 过滤空值
			
 
				+        outline_draft = state.get('outline_draft')
			
 
				+        if outline_draft and outline_draft.global_metrics:
			
 
				+            available_metric_ids = [m.metric_id for m in outline_draft.global_metrics if m.metric_id]
			
 
				+        
			
 
				 
			
 
				         return f"""当前状态评估：
			
 
				 - 规划步骤: {state.get('planning_step', 0)}
			
@@ -403,53 +373,4 @@ async def plan_next_action(question: str, industry: str, current_state: Dict[str
 
				             priority_metrics=[]
			
 
				         )
			
 
				 
			
 
				-    def _get_default_decision(self, current_state: Dict[str, Any]) -> PlanningDecision:
			
 
				-        """
			
 
				-        基于状态分析的默认决策逻辑
			
 
				-
			
 
				-        Args:
			
 
				-            current_state: 当前状态信息
			
 
				-
			
 
				-        Returns:
			
 
				-            默认规划决策
			
 
				-        """
			
 
				-        state_analysis = analyze_current_state(current_state)
			
 
				-
			
 
				-        if not state_analysis["has_outline"]:
			
 
				-            default_decision = PlanningDecision(
			
 
				-                decision="generate_outline",
			
 
				-                reasoning="大纲不存在，需要先生成大纲",
			
 
				-                next_actions=["生成报告大纲"],
			
 
				-                metrics_to_compute=[],
			
 
				-                priority_metrics=[]
			
 
				-            )
			
 
				-        elif state_analysis["coverage"] < 0.8 and state_analysis["valid_pending_metrics"]:
			
 
				-            # 计算指标 - 使用实际的指标ID
			
 
				-            metrics_to_compute = state_analysis["valid_pending_ids"][:5]  # 最多计算5个
			
 
				-            default_decision = PlanningDecision(
			
 
				-                decision="compute_metrics",
			
 
				-                reasoning=f"指标覆盖率{state_analysis['coverage']:.1%}，需要计算更多指标",
			
 
				-                next_actions=[f"计算指标: {', '.join(metrics_to_compute)}"],
			
 
				-                metrics_to_compute=metrics_to_compute,
			
 
				-                priority_metrics=metrics_to_compute[:2]  # 前2个为优先级
			
 
				-            )
			
 
				-        elif state_analysis["valid_pending_ids"]:
			
 
				-            # 还有指标但都失败了，生成报告
			
 
				-            default_decision = PlanningDecision(
			
 
				-                decision="finalize_report",
			
 
				-                reasoning="部分指标计算失败，但已有足够信息生成报告",
			
 
				-                next_actions=["生成最终报告"],
			
 
				-                metrics_to_compute=[],
			
 
				-                priority_metrics=[]
			
 
				-            )
			
 
				-        else:
			
 
				-            # 信息充足，生成报告
			
 
				-            default_decision = PlanningDecision(
			
 
				-                decision="finalize_report",
			
 
				-                reasoning="所有必要指标已计算完成",
			
 
				-                next_actions=["生成最终报告"],
			
 
				-                metrics_to_compute=[],
			
 
				-                priority_metrics=[]
			
 
				-            )
			
 
				-
			
 
				-        return default_decision
			
 
				+   
			
--- a/llmops/agents/rules_engine_metric_calculation_agent.py
+++ b/llmops/agents/rules_engine_metric_calculation_agent.py
@@ -55,27 +55,16 @@ from langchain_openai import ChatOpenAI
 
				 from langchain_core.prompts import ChatPromptTemplate
			
 
				 import re
			
 
				 
			
 
				+from llmops.config import RULES_ENGINE_BASE_URL
			
 
				+
			
 
				 
			
 
				 class RulesEngineMetricCalculationAgent:
			
 
				     """规则引擎指标计算Agent"""
			
 
				 
			
 
				     def __init__(self, api_key: str, base_url: str = "https://api.deepseek.com"):
			
 
				-        """
			
 
				-        初始化规则引擎指标计算Agent
			
 
				 
			
 
				-        Args:
			
 
				-            api_key: DeepSeek API密钥
			
 
				-            base_url: DeepSeek API基础URL
			
 
				-        """
			
 
				-        self.llm = ChatOpenAI(
			
 
				-            model="deepseek-chat",
			
 
				-            api_key=api_key,
			
 
				-            base_url=base_url,
			
 
				-            temperature=0.1
			
 
				-        )
			
 
				 
			
 
				-        # 加载配置文件
			
 
				-        self.configs = self._load_configs()
			
 
				+
			
 
				 
			
 
				         # 获取可用的知识元数据
			
 
				         self.available_knowledge = self._load_available_knowledge()
			
@@ -143,23 +132,7 @@ class RulesEngineMetricCalculationAgent:
 
				             print(f"加载数据文件 {data_file_path} 失败: {e}")
			
 
				             return []
			
 
				 
			
 
				-    def _load_configs(self) -> Dict[str, Dict]:
			
 
				-        """加载所有规则引擎配置文件"""
			
 
				-        configs = {}
			
 
				-        json_dir = "json_files"
			
 
				 
			
 
				-        if os.path.exists(json_dir):
			
 
				-            for file in os.listdir(json_dir):
			
 
				-                if file.endswith('.json') and '规则引擎' in file:
			
 
				-                    try:
			
 
				-                        with open(os.path.join(json_dir, file), 'r', encoding='utf-8') as f:
			
 
				-                            config = json.load(f)
			
 
				-                            key = file.replace('.json', '')
			
 
				-                            configs[key] = config
			
 
				-                    except Exception as e:
			
 
				-                        print(f"加载规则引擎配置文件 {file} 失败: {e}")
			
 
				-
			
 
				-        return configs
			
 
				 
			
 
				     def _load_available_knowledge(self) -> List[Dict[str, Any]]:
			
 
				         """
			
@@ -169,7 +142,7 @@ class RulesEngineMetricCalculationAgent:
 
				             知识元数据列表，包含id、description和inputField
			
 
				         """
			
 
				         try:
			
 
				-            url = "http://10.192.72.11:31809/api/rules/getKnowledgeMeta"
			
 
				+            url = f"{RULES_ENGINE_BASE_URL}/api/rules/getKnowledgeMeta"
			
 
				             headers = {
			
 
				                 "Accept": "*/*",
			
 
				                 "Accept-Encoding": "gzip, deflate, br",
			
@@ -179,7 +152,7 @@ class RulesEngineMetricCalculationAgent:
 
				             }
			
 
				 
			
 
				             response = requests.post(url, headers=headers, json={}, timeout=30)
			
 
				-            print(f"访问知识接口：{response}")
			
 
				+
			
 
				             if response.status_code == 200:
			
 
				                 knowledge_meta = response.json()
			
 
				                 if isinstance(knowledge_meta, list):
			
@@ -290,8 +263,8 @@ class RulesEngineMetricCalculationAgent:
 
				 
			
 
				             # 规则引擎API配置
			
 
				             method = "POST"
			
 
				-            url = "http://10.192.72.11:31809/api/rules/executeKnowledge"
			
 
				-            # url = "http://10.192.72.11:31809/api/rules/executeKnowledge"
			
 
				+
			
 
				+            url = f"{RULES_ENGINE_BASE_URL}/api/rules/executeKnowledge"
			
 
				             headers = {
			
 
				                 "Accept": "*/*",
			
 
				                 "Accept-Encoding": "gzip, deflate, br",
			
@@ -342,7 +315,8 @@ class RulesEngineMetricCalculationAgent:
 
				                     # 保存API结果到文件
			
 
				                     api_results_dir = "api_results"
			
 
				                     os.makedirs(api_results_dir, exist_ok=True)
			
 
				-                    filename = f"{call_id}.json"
			
 
				+                    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
			
 
				+                    filename = f"{timestamp}_{call_id}.json"
			
 
				                     filepath = os.path.join(api_results_dir, filename)
			
 
				 
			
 
				                     try:
			
@@ -388,7 +362,8 @@ class RulesEngineMetricCalculationAgent:
 
				                     # 保存API结果到文件
			
 
				                     api_results_dir = "api_results"
			
 
				                     os.makedirs(api_results_dir, exist_ok=True)
			
 
				-                    filename = f"{call_id}.json"
			
 
				+                    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
			
 
				+                    filename = f"{timestamp}_{call_id}.json"
			
 
				                     filepath = os.path.join(api_results_dir, filename)
			
 
				 
			
 
				                     try:
			
@@ -589,7 +564,7 @@ class RulesEngineMetricCalculationAgent:
 
				 
			
 
				         # 规则引擎API配置
			
 
				         method = "POST"
			
 
				-        url = "http://10.192.72.11:31809/api/rules/executeKnowledge"
			
 
				+        url = f"{RULES_ENGINE_BASE_URL}/api/rules/executeKnowledge"
			
 
				         headers = {
			
 
				             "Accept": "*/*",
			
 
				             "Accept-Encoding": "gzip, deflate, br",
			
@@ -663,7 +638,8 @@ class RulesEngineMetricCalculationAgent:
 
				                     # 保存API结果到文件
			
 
				                     api_results_dir = "api_results"
			
 
				                     os.makedirs(api_results_dir, exist_ok=True)
			
 
				-                    filename = f"{call_id}.json"
			
 
				+                    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
			
 
				+                    filename = f"{timestamp}_{call_id}.json"
			
 
				                     filepath = os.path.join(api_results_dir, filename)
			
 
				 
			
 
				                     try:
			
@@ -709,7 +685,8 @@ class RulesEngineMetricCalculationAgent:
 
				                     # 保存API结果到文件
			
 
				                     api_results_dir = "api_results"
			
 
				                     os.makedirs(api_results_dir, exist_ok=True)
			
 
				-                    filename = f"{call_id}.json"
			
 
				+                    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
			
 
				+                    filename = f"{timestamp}_{call_id}.json"
			
 
				                     filepath = os.path.join(api_results_dir, filename)
			
 
				 
			
 
				                     try:
			
--- a/llmops/complete_agent_flow_rule.py
+++ b/llmops/complete_agent_flow_rule.py
@@ -31,24 +31,19 @@ import asyncio
 
				 from typing import Dict, Any, List
			
 
				 from datetime import datetime
			
 
				 from langgraph.graph import StateGraph, START, END
			
 
				-from langchain_core.messages import HumanMessage
			
 
				 
			
 
				 from workflow_state import (
			
 
				     IntegratedWorkflowState,
			
 
				     create_initial_integrated_state,
			
 
				-    is_state_ready_for_calculation,
			
 
				     get_calculation_progress,
			
 
				     update_state_with_outline_generation,
			
 
				     update_state_with_planning_decision,
			
 
				-    finalize_state_with_report,
			
 
				     convert_numpy_types,
			
 
				-    MetricRequirement,
			
 
				-    ReportOutline
			
 
				+
			
 
				 )
			
 
				-from llmops.agents.outline_agent import OutlineGeneratorAgent, generate_report_outline
			
 
				-from llmops.agents.planning_agent import PlanningAgent, plan_next_action, analyze_current_state
			
 
				-from llmops.agents.metric_calculation_agent import MetricCalculationAgent
			
 
				-from llmops.agents.rules_engine_metric_calculation_agent import RulesEngineMetricCalculationAgent
			
 
				+from agents.outline_agent import  generate_report_outline
			
 
				+from agents.planning_agent import  plan_next_action
			
 
				+from agents.rules_engine_metric_calculation_agent import RulesEngineMetricCalculationAgent
			
 
				 
			
 
				 
			
 
				 class CompleteAgentFlow:
			
@@ -65,10 +60,7 @@ class CompleteAgentFlow:
 
				         self.api_key = api_key
			
 
				         self.base_url = base_url
			
 
				 
			
 
				-        # 初始化各个智能体
			
 
				-        self.planning_agent = PlanningAgent(api_key, base_url)
			
 
				-        self.outline_agent = OutlineGeneratorAgent(api_key, base_url)
			
 
				-        # self.metric_agent = MetricCalculationAgent(api_key, base_url)
			
 
				+        # 初始规则引擎智能体
			
 
				         self.rules_engine_agent = RulesEngineMetricCalculationAgent(api_key, base_url)
			
 
				 
			
 
				         # 创建工作流图
			
@@ -81,9 +73,7 @@ class CompleteAgentFlow:
 
				         # 添加节点
			
 
				         workflow.add_node("planning_node", self._planning_node)
			
 
				         workflow.add_node("outline_generator", self._outline_generator_node)
			
 
				-        workflow.add_node("metric_evaluator", self._metric_evaluator_node)
			
 
				         workflow.add_node("metric_calculator", self._metric_calculator_node)
			
 
				-        workflow.add_node("report_finalizer", self._report_finalizer_node)
			
 
				 
			
 
				         # 设置入口点
			
 
				         workflow.set_entry_point("planning_node")
			
@@ -94,18 +84,14 @@ class CompleteAgentFlow:
 
				             self._route_from_planning,
			
 
				             {
			
 
				                 "outline_generator": "outline_generator",
			
 
				-                "metric_evaluator": "metric_evaluator",
			
 
				                 "metric_calculator": "metric_calculator",
			
 
				-                "report_finalizer": "report_finalizer",
			
 
				                 END: END
			
 
				             }
			
 
				         )
			
 
				 
			
 
				         # 从各个节点返回规划节点重新决策
			
 
				         workflow.add_edge("outline_generator", "planning_node")
			
 
				-        workflow.add_edge("metric_evaluator", "planning_node")
			
 
				-        workflow.add_edge("metric_calculator", "planning_node")
			
 
				-        workflow.add_edge("report_finalizer", END)
			
 
				+        workflow.add_edge("metric_calculator", END)
			
 
				 
			
 
				         return workflow
			
 
				 
			
@@ -205,7 +191,7 @@ class CompleteAgentFlow:
 
				                 industry=state["industry"],
			
 
				                 sample_data=state["data_set"][:3],  # 使用前3个样本
			
 
				                 api_key=self.api_key,
			
 
				-                max_retries=1,  # 最多重试5次
			
 
				+                max_retries=3,  # 最多重试5次
			
 
				                 retry_delay=3.0  # 每次重试间隔3秒
			
 
				             )
			
 
				 
			
@@ -214,6 +200,10 @@ class CompleteAgentFlow:
 
				 
			
 
				             print(f"✅ 大纲生成完成：{outline.report_title}")
			
 
				             print(f"   包含 {len(outline.sections)} 个章节，{len(outline.global_metrics)} 个指标需求")
			
 
				+
			
 
				+            # 分析并打印AI的指标选择推理过程
			
 
				+            self._print_ai_selection_analysis(outline)
			
 
				+
			
 
				             return convert_numpy_types(new_state)
			
 
				 
			
 
				         except Exception as e:
			
@@ -222,6 +212,57 @@ class CompleteAgentFlow:
 
				             new_state["errors"].append(f"大纲生成错误: {str(e)}")
			
 
				             return convert_numpy_types(new_state)
			
 
				 
			
 
				+    def _print_ai_selection_analysis(self, outline):
			
 
				+        """打印AI指标选择的推理过程分析 - 完全通用版本"""
			
 
				+        print()
			
 
				+        print('╔══════════════════════════════════════════════════════════════════════════════╗')
			
 
				+        print('║                          🤖 AI指标选择分析                                    ║')
			
 
				+        print('╚══════════════════════════════════════════════════════════════════════════════╝')
			
 
				+        print()
			
 
				+
			
 
				+        # 计算总指标数 - outline可能是字典格式，需要适配
			
 
				+        if hasattr(outline, 'sections'):
			
 
				+            # Pydantic模型格式
			
 
				+            total_metrics = sum(len(section.metrics_needed) for section in outline.sections)
			
 
				+            sections = outline.sections
			
 
				+        else:
			
 
				+            # 字典格式
			
 
				+            total_metrics = sum(len(section.get('metrics_needed', [])) for section in outline.get('sections', []))
			
 
				+            sections = outline.get('sections', [])
			
 
				+
			
 
				+        # 获取可用指标总数（这里可以从状态或其他地方动态获取）
			
 
				+        available_count = 26  # 这个可以从API调用中动态获取
			
 
				+
			
 
				+        print('📊 选择统计:')
			
 
				+        print('   ┌─────────────────────────────────────────────────────────────────────┐')
			
 
				+        print('   │  系统可用指标: {}个   │  AI本次选择: {}个   │  选择率: {:.1f}%     │'.format(
			
 
				+            available_count, total_metrics, total_metrics/available_count*100 if available_count > 0 else 0))
			
 
				+        print('   └─────────────────────────────────────────────────────────────────────┘')
			
 
				+        print()
			
 
				+
			
 
				+        print('📋 AI决策过程:')
			
 
				+        print('   大模型已根据用户需求从{}个可用指标中选择了{}个最相关的指标。'.format(available_count, total_metrics))
			
 
				+        print('   选择过程完全由大模型基于语义理解和业务逻辑进行，不涉及任何硬编码规则。')
			
 
				+        print()
			
 
				+
			
 
				+        print('🔍 选择结果:')
			
 
				+        print('   • 总章节数: {}个'.format(len(sections)))
			
 
				+        print('   • 平均每章节指标数: {:.1f}个'.format(total_metrics/len(sections) if sections else 0))
			
 
				+        print('   • 选择策略: 基于用户需求的相关性分析')
			
 
				+        print()
			
 
				+
			
 
				+        print('🎯 AI Agent核心能力:')
			
 
				+        print('   • 语义理解: 理解用户查询的业务意图和分析需求')
			
 
				+        print('   • 智能筛选: 从海量指标中挑选最相关的组合')
			
 
				+        print('   • 逻辑推理: 为每个分析维度提供充分的选择依据')
			
 
				+        print('   • 动态适配: 根据不同场景自动调整选择策略')
			
 
				+        print()
			
 
				+
			
 
				+        print('💡 关键洞察:')
			
 
				+        print('   AI Agent通过大模型的推理能力，实现了超越传统规则引擎的智能化指标选择，')
			
 
				+        print('   能够根据具体业务场景动态调整分析框架，确保分析的针对性和有效性。')
			
 
				+        print()
			
 
				+
			
 
				     async def _metric_evaluator_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
			
 
				         """指标评估节点：根据大纲确定需要计算的指标"""
			
 
				         try:
			
@@ -281,7 +322,15 @@ class CompleteAgentFlow:
 
				                 print("🧮 正在执行指标计算...")
			
 
				 
			
 
				             new_state = state.copy()
			
 
				-            pending_ids = state.get("pending_metric_ids", [])
			
 
				+
			
 
				+            # 使用规划决策指定的指标批次，如果没有指定则使用所有待计算指标
			
 
				+            current_batch = state.get("current_batch_metrics", [])
			
 
				+            if current_batch:
			
 
				+                pending_ids = current_batch
			
 
				+                print(f"🧮 本次计算批次包含 {len(pending_ids)} 个指标")
			
 
				+            else:
			
 
				+                pending_ids = state.get("pending_metric_ids", [])
			
 
				+                print(f"🧮 计算所有待计算指标，共 {len(pending_ids)} 个")
			
 
				 
			
 
				             if not pending_ids:
			
 
				                 print("⚠️ 没有待计算的指标")
			
@@ -408,84 +457,6 @@ class CompleteAgentFlow:
 
				             new_state["errors"].append(f"指标计算错误: {str(e)}")
			
 
				             return convert_numpy_types(new_state)
			
 
				 
			
 
				-    async def _report_finalizer_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
			
 
				-        """报告完成节点：生成最终报告"""
			
 
				-        try:
			
 
				-            print("📋 正在生成最终报告...")
			
 
				-
			
 
				-            # 获取大纲和计算结果
			
 
				-            outline = state.get("outline_draft")
			
 
				-            computed_metrics = state.get("computed_metrics", {})
			
 
				-
			
 
				-            if not outline:
			
 
				-                raise ValueError("没有可用的报告大纲")
			
 
				-
			
 
				-            # 生成最终报告
			
 
				-            final_report = {
			
 
				-                "title": outline.report_title,
			
 
				-                "generated_at": datetime.now().isoformat(),
			
 
				-                "summary": {
			
 
				-                    "total_sections": len(outline.sections),
			
 
				-                    "total_metrics_required": len(outline.global_metrics),
			
 
				-                    "total_metrics_computed": len(computed_metrics),
			
 
				-                    "planning_steps": state.get("planning_step", 0),
			
 
				-                    "completion_rate": len(computed_metrics) / len(outline.global_metrics) if outline.global_metrics else 0
			
 
				-                },
			
 
				-                "sections": [],
			
 
				-                "metrics_detail": {}
			
 
				-            }
			
 
				-
			
 
				-            # 构建章节内容
			
 
				-            for section in outline.sections:
			
 
				-                section_content = {
			
 
				-                    "section_id": section.section_id,
			
 
				-                    "title": section.title,
			
 
				-                    "description": section.description,
			
 
				-                    "metrics": {}
			
 
				-                }
			
 
				-
			
 
				-                # 添加该章节的指标数据
			
 
				-                for metric_id in section.metrics_needed:
			
 
				-                    if metric_id in computed_metrics:
			
 
				-                        section_content["metrics"][metric_id] = computed_metrics[metric_id]
			
 
				-                    else:
			
 
				-                        section_content["metrics"][metric_id] = "数据缺失"
			
 
				-
			
 
				-                final_report["sections"].append(section_content)
			
 
				-
			
 
				-            # 添加详细的指标信息
			
 
				-            for metric_req in outline.global_metrics:
			
 
				-                metric_id = metric_req.metric_id
			
 
				-                final_report["metrics_detail"][metric_id] = {
			
 
				-                    "name": metric_req.metric_name,
			
 
				-                    "logic": metric_req.calculation_logic,
			
 
				-                    "required_fields": metric_req.required_fields,
			
 
				-                    "computed": metric_id in computed_metrics,
			
 
				-                    "value": computed_metrics.get(metric_id, {}).get("value", "N/A")
			
 
				-                }
			
 
				-
			
 
				-            # 更新状态
			
 
				-            new_state = finalize_state_with_report(state, final_report)
			
 
				-
			
 
				-            # 添加完成消息
			
 
				-            new_state["messages"].append({
			
 
				-                "role": "assistant",
			
 
				-                "content": f"🎉 完整报告生成流程完成：{outline.report_title}",
			
 
				-                "timestamp": datetime.now().isoformat()
			
 
				-            })
			
 
				-
			
 
				-            print(f"✅ 最终报告生成完成：{outline.report_title}")
			
 
				-            print(f"   章节数：{len(final_report['sections'])}")
			
 
				-            print(f"   计算指标：{len(computed_metrics)}/{len(outline.global_metrics)}")
			
 
				-            print(".2%")
			
 
				-
			
 
				-            return convert_numpy_types(new_state)
			
 
				-
			
 
				-        except Exception as e:
			
 
				-            print(f"❌ 报告完成失败: {e}")
			
 
				-            new_state = state.copy()
			
 
				-            new_state["errors"].append(f"报告完成错误: {str(e)}")
			
 
				-            return convert_numpy_types(new_state)
			
 
				 
			
 
				     def _decision_to_route(self, decision: str) -> str:
			
 
				         """将规划决策转换为路由"""
			
@@ -622,7 +593,7 @@ async def main():
 
				     # 测试数据
			
 
				     test_data = [
			
 
				         {
			
 
				-           
			
 
				+
			
 
				         }
			
 
				     ]
			
 
				 
			
@@ -633,6 +604,8 @@ async def main():
 
				     result = await run_complete_agent_flow(
			
 
				         question="请生成一份详细的农业经营贷流水分析报告，需要包含：1.总收入和总支出统计 2.收入笔数和支出笔数 3.各类型收入支出占比分析 4.交易对手收入支出TOP3排名 5.按月份的收入支出趋势分析 6.账户数量和交易时间范围统计 7.资金流入流出月度统计等全面指标",
			
 
				         industry = "农业",
			
 
				+        # question="请生成一份详细的黑色金属相关经营贷流水分析报告，需要包含：1.总收入统计 2.收入笔数 3.各类型收入占比分析 4.交易对手收入排名 5.按月份的收入趋势分析 6.账户数量和交易时间范围统计 7.资金流入流出月度统计等全面指标",
			
 
				+        # industry = "黑色金属",
			
 
				         data=test_data,
			
 
				         api_key=config.DEEPSEEK_API_KEY,
			
 
				         session_id="direct-test"
			
--- a/llmops/config.py
+++ b/llmops/config.py
@@ -38,6 +38,12 @@ DEEPSEEK_API_KEY = os.getenv("DEEPSEEK_API_KEY")
 
				 DEEPSEEK_BASE_URL = os.getenv("DEEPSEEK_BASE_URL", "https://api.deepseek.com")
			
 
				 
			
 
				 # ============================================================================
			
 
				+# 规则引擎 API 配置
			
 
				+# ============================================================================
			
 
				+# 规则引擎基础URL配置 - 用于指标计算和知识库访问
			
 
				+RULES_ENGINE_BASE_URL = os.getenv("RULES_ENGINE_BASE_URL", "http://localhost:8081")
			
 
				+
			
 
				+# ============================================================================
			
 
				 # 项目路径配置
			
 
				 # ============================================================================
			
 
				 # 定义项目中各个功能模块的数据存储路径