SHA1
--- a/.env
+++ b/.env
@@ -0,0 +1 @@
 
															+DEEPSEEK_API_KEY=sk-438668d443224063adbb1d295fe44a9f
														
--- a/llmops/agents/metric_calculation_agent.py
+++ b/llmops/agents/metric_calculation_agent.py
@@ -0,0 +1,670 @@
 
															+"""
														
 
															+指标计算Agent (Metric Calculation Agent)
														
 
															+====================================
														
 
															+
														
 
															+此Agent负责根据意图识别结果执行具体的指标计算任务。
														
 
															+
														
 
															+核心功能：
														
 
															+1. 配置文件加载：读取和解析JSON格式的指标计算配置文件
														
 
															+2. API调用管理：根据配置文件调用相应的计算API
														
 
															+3. 结果处理：处理API返回的数据，提取关键指标
														
 
															+4. 错误处理：处理API调用失败、网络异常等错误情况
														
 
															+5. 结果验证：验证计算结果的合理性和完整性
														
 
															+
														
 
															+工作流程：
														
 
															+1. 接收意图识别结果和用户参数
														
 
															+2. 加载对应的指标计算配置文件
														
 
															+3. 构造API请求参数
														
 
															+4. 调用远程计算服务
														
 
															+5. 解析和验证返回结果
														
 
															+6. 返回结构化的计算结果
														
 
															+
														
 
															+技术实现：
														
 
															+- 支持动态加载JSON配置文件
														
 
															+- 使用requests库进行HTTP API调用
														
 
															+- 集成LangChain用于复杂计算逻辑（可选）
														
 
															+- 完善的错误处理和超时机制
														
 
															+- 支持多种计算方法（标准、高级、自定义）
														
 
															+
														
 
															+配置文件结构：
														
 
															+- api_config: API端点和认证信息
														
 
															+- param_mapping: 参数映射规则
														
 
															+- input_schema: 输入数据验证规则
														
 
															+- output_schema: 输出数据结构定义
														
 
															+- calculation_logic: 计算逻辑描述
														
 
															+
														
 
															+作者: Big Agent Team
														
 
															+版本: 1.0.0
														
 
															+创建时间: 2024-12-18
														
 
															+"""
														
 
															+
														
 
															+import os
														
 
															+import json
														
 
															+import requests
														
 
															+from datetime import datetime
														
 
															+from typing import Dict, List, Any, Optional
														
 
															+from langchain_openai import ChatOpenAI
														
 
															+from langchain_core.prompts import ChatPromptTemplate
														
 
															+import re
														
 
															+
														
 
															+
														
 
															+class MetricCalculationAgent:
														
 
															+    """远程指标计算Agent"""
														
 
															+
														
 
															+    def __init__(self, api_key: str, base_url: str = "https://api.deepseek.com"):
														
 
															+        """
														
 
															+        初始化指标计算Agent
														
 
															+
														
 
															+        Args:
														
 
															+            api_key: DeepSeek API密钥
														
 
															+            base_url: DeepSeek API基础URL
														
 
															+        """
														
 
															+        self.llm = ChatOpenAI(
														
 
															+            model="deepseek-chat",
														
 
															+            api_key=api_key,
														
 
															+            base_url=base_url,
														
 
															+            temperature=0.1
														
 
															+        )
														
 
															+
														
 
															+        # 加载配置文件
														
 
															+        self.configs = self._load_configs()
														
 
															+
														
 
															+        # 加载数据文件映射
														
 
															+        self.data_files = self._load_data_files()
														
 
															+
														
 
															+        # 初始化API调用跟踪
														
 
															+        self.api_calls = []
														
 
															+
														
 
															+    def _load_data_files(self) -> Dict[str, str]:
														
 
															+        """加载数据文件映射"""
														
 
															+        data_files = {}
														
 
															+        data_dir = "data_files"
														
 
															+
														
 
															+        if os.path.exists(data_dir):
														
 
															+            for file in os.listdir(data_dir):
														
 
															+                if file.endswith('.json'):
														
 
															+                    try:
														
 
															+                        # 提取文件名中的关键词，用于匹配配置文件
														
 
															+                        key = file.replace('原始数据-流水分析-', '').replace('.json', '')
														
 
															+                        data_files[key] = os.path.join(data_dir, file)
														
 
															+                    except Exception as e:
														
 
															+                        print(f"处理数据文件 {file} 失败: {e}")
														
 
															+
														
 
															+        return data_files
														
 
															+
														
 
															+    def _select_data_file(self, config_name: str) -> Optional[str]:
														
 
															+        """
														
 
															+        根据配置文件名选择对应的数据文件
														
 
															+
														
 
															+        Args:
														
 
															+            config_name: 配置文件名
														
 
															+
														
 
															+        Returns:
														
 
															+            数据文件路径，如果找不到则返回None
														
 
															+        """
														
 
															+        # 配置文件名模式：指标计算-{category}-{metric}.json
														
 
															+        # 数据文件名模式：原始数据-流水分析-{category}.json
														
 
															+
														
 
															+        # 从配置文件名中提取类别信息
														
 
															+        match = re.search(r'指标计算-(.+?)-', config_name)
														
 
															+        if match:
														
 
															+            category = match.group(1)
														
 
															+
														
 
															+            # 优先选择原始数据文件
														
 
															+            # 1. 首先查找完全匹配的原始数据文件
														
 
															+            if category in self.data_files:
														
 
															+                file_path = self.data_files[category]
														
 
															+                if '原始数据' in file_path:
														
 
															+                    return file_path
														
 
															+
														
 
															+            # 2. 如果没有完全匹配，查找包含类别的原始数据文件
														
 
															+            for key, file_path in self.data_files.items():
														
 
															+                if category in key and '原始数据' in file_path:
														
 
															+                    return file_path
														
 
															+
														
 
															+        # 如果找不到匹配的文件，返回默认的农业原始数据文件（如果存在）
														
 
															+        if '农业' in self.data_files:
														
 
															+            return self.data_files['农业']
														
 
															+
														
 
															+        return None
														
 
															+
														
 
															+    def _load_table_data(self, data_file_path: str) -> List[Dict]:
														
 
															+        """加载数据文件中的表格数据"""
														
 
															+        try:
														
 
															+            with open(data_file_path, 'r', encoding='utf-8') as f:
														
 
															+                data = json.load(f)
														
 
															+                return data if isinstance(data, list) else []
														
 
															+        except Exception as e:
														
 
															+            print(f"加载数据文件 {data_file_path} 失败: {e}")
														
 
															+            return []
														
 
															+
														
 
															+    def _load_configs(self) -> Dict[str, Dict]:
														
 
															+        """加载所有配置文件"""
														
 
															+        configs = {}
														
 
															+        json_dir = "json_files"
														
 
															+
														
 
															+        if os.path.exists(json_dir):
														
 
															+            for file in os.listdir(json_dir):
														
 
															+                if file.endswith('.json'):
														
 
															+                    try:
														
 
															+                        with open(os.path.join(json_dir, file), 'r', encoding='utf-8') as f:
														
 
															+                            config = json.load(f)
														
 
															+                            key = file.replace('.json', '')
														
 
															+                            configs[key] = config
														
 
															+                    except Exception as e:
														
 
															+                        print(f"加载配置文件 {file} 失败: {e}")
														
 
															+
														
 
															+        return configs
														
 
															+
														
 
															+    async def calculate_metrics(self, intent_result: Dict[str, Any]) -> Dict[str, Any]:
														
 
															+        """
														
 
															+        根据意图识别结果进行指标计算
														
 
															+
														
 
															+        Args:
														
 
															+            intent_result: 意图识别结果
														
 
															+
														
 
															+        Returns:
														
 
															+            指标计算结果
														
 
															+        """
														
 
															+        try:
														
 
															+            results = []
														
 
															+            target_configs = intent_result.get("target_configs", [])
														
 
															+
														
 
															+            if not target_configs:
														
 
															+                return {
														
 
															+                    "success": False,
														
 
															+                    "message": "没有找到需要调用的配置文件",
														
 
															+                    "results": []
														
 
															+                }
														
 
															+
														
 
															+            for config_name in target_configs:
														
 
															+                if config_name in self.configs:
														
 
															+                    config = self.configs[config_name]
														
 
															+                    result = await self._call_metric_api(config, intent_result, config_name)
														
 
															+                    results.append({
														
 
															+                        "config_name": config_name,
														
 
															+                        "result": result
														
 
															+                    })
														
 
															+                else:
														
 
															+                    results.append({
														
 
															+                        "config_name": config_name,
														
 
															+                        "error": f"配置文件 {config_name} 不存在"
														
 
															+                    })
														
 
															+
														
 
															+            return {
														
 
															+                "success": True,
														
 
															+                "results": results,
														
 
															+                "total_configs": len(target_configs),
														
 
															+                "successful_calculations": len([r for r in results if "result" in r])
														
 
															+            }
														
 
															+
														
 
															+        except Exception as e:
														
 
															+            print(f"指标计算失败: {e}")
														
 
															+            return {
														
 
															+                "success": False,
														
 
															+                "message": f"指标计算过程中发生错误: {str(e)}",
														
 
															+                "results": []
														
 
															+            }
														
 
															+
														
 
															+    async def _call_metric_api(self, config: Dict[str, Any], intent_result: Dict[str, Any], config_name: str) -> Dict[str, Any]:
														
 
															+        """
														
 
															+        调用具体的指标计算API
														
 
															+
														
 
															+        Args:
														
 
															+            config: 配置文件
														
 
															+            intent_result: 意图识别结果
														
 
															+
														
 
															+        Returns:
														
 
															+            API调用结果
														
 
															+        """
														
 
															+        try:
														
 
															+            # 记录API调用开始
														
 
															+            start_time = datetime.now()
														
 
															+
														
 
															+            # 使用真实API服务的配置
														
 
															+            method = "POST"
														
 
															+            url = "http://10.192.72.11:6300/api/data_analyst/full"  # 真实API服务地址
														
 
															+            headers = {
														
 
															+                "Accept": "*/*",
														
 
															+                "Accept-Encoding": "gzip, deflate, br",
														
 
															+                "Connection": "keep-alive",
														
 
															+                "Content-Type": "application/json",
														
 
															+                "User-Agent": "PostmanRuntime-ApipostRuntime/1.1.0"
														
 
															+            }
														
 
															+            timeout = 600  # 10分钟超时，给慢API更多时间
														
 
															+
														
 
															+            # 添加重试机制，最多重试3次
														
 
															+            max_retries = 3
														
 
															+            retry_delay = 5  # 每次重试间隔5秒
														
 
															+
														
 
															+            for attempt in range(max_retries):
														
 
															+                try:
														
 
															+                    print(f"🔄 API调用尝试 {attempt + 1}/{max_retries} (配置: {config_name})")
														
 
															+
														
 
															+                    # 准备请求数据
														
 
															+                    request_data = self._prepare_request_data(config, intent_result, config_name)
														
 
															+
														
 
															+                    # 根据HTTP方法调用API
														
 
															+                    if method.upper() == "GET":
														
 
															+                        params = request_data.get("params", {})
														
 
															+                        response = requests.get(url, headers=headers, params=params, timeout=timeout)
														
 
															+                    elif method.upper() == "POST":
														
 
															+                        json_data = request_data.get("json", {})
														
 
															+                        response = requests.post(url, headers=headers, json=json_data, timeout=timeout)
														
 
															+                    else:
														
 
															+                        return {
														
 
															+                            "success": False,
														
 
															+                            "message": f"不支持的HTTP方法: {method}"
														
 
															+                        }
														
 
															+
														
 
															+                    # 处理响应
														
 
															+                    if response.status_code == 200:
														
 
															+                        try:
														
 
															+                            response_data = response.json()
														
 
															+
														
 
															+                            # 检查API响应结构并提取结果
														
 
															+                            extracted_result = None
														
 
															+                            if isinstance(response_data, dict):
														
 
															+                                # 检查是否有code字段和data.result结构
														
 
															+                                if response_data.get("code") == 0 and "data" in response_data:
														
 
															+                                    data = response_data["data"]
														
 
															+                                    if "result" in data:
														
 
															+                                        # 从result字段中提取JSON
														
 
															+                                        extracted_result = self._extract_json_from_result(data["result"])
														
 
															+
														
 
															+                            # 记录API调用结果
														
 
															+                            end_time = datetime.now()
														
 
															+                            call_id = f"api_{config_name}_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+                            api_call_info = {
														
 
															+                                "call_id": call_id,
														
 
															+                                "timestamp": end_time.isoformat(),
														
 
															+                                "agent": "MetricCalculationAgent",
														
 
															+                                "api_endpoint": url,
														
 
															+                                "config_name": config_name,
														
 
															+                                "request": {
														
 
															+                                    "method": method,
														
 
															+                                    "url": url,
														
 
															+                                    "headers": headers,
														
 
															+                                    "json_data": json_data if method.upper() == "POST" else None,
														
 
															+                                    "params": params if method.upper() == "GET" else None,
														
 
															+                                    "start_time": start_time.isoformat()
														
 
															+                                },
														
 
															+                                "response": {
														
 
															+                                    "status_code": response.status_code,
														
 
															+                                    "data": response_data,
														
 
															+                                    "extracted_result": extracted_result,
														
 
															+                                    "end_time": end_time.isoformat(),
														
 
															+                                    "duration": (end_time - start_time).total_seconds()
														
 
															+                                },
														
 
															+                                "success": True
														
 
															+                            }
														
 
															+                            self.api_calls.append(api_call_info)
														
 
															+
														
 
															+                            # 保存API结果到文件
														
 
															+                            api_results_dir = "api_results"
														
 
															+                            os.makedirs(api_results_dir, exist_ok=True)
														
 
															+                            filename = f"{call_id}.json"
														
 
															+                            filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+                            try:
														
 
															+                                with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                                    json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+                                print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+                            except Exception as e:
														
 
															+                                print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+                            return {
														
 
															+                                "success": True,
														
 
															+                                "data": response_data,
														
 
															+                                "extracted_result": extracted_result,
														
 
															+                                "status_code": response.status_code
														
 
															+                            }
														
 
															+                        except json.JSONDecodeError:
														
 
															+                            # 记录API调用结果（JSON解析失败）
														
 
															+                            end_time = datetime.now()
														
 
															+                            call_id = f"api_{config_name}_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+                            api_call_info = {
														
 
															+                                "call_id": call_id,
														
 
															+                                "timestamp": end_time.isoformat(),
														
 
															+                                "agent": "MetricCalculationAgent",
														
 
															+                                "api_endpoint": url,
														
 
															+                                "config_name": config_name,
														
 
															+                                "request": {
														
 
															+                                    "method": method,
														
 
															+                                    "url": url,
														
 
															+                                    "headers": headers,
														
 
															+                                    "json_data": json_data if method.upper() == "POST" else None,
														
 
															+                                    "params": params if method.upper() == "GET" else None,
														
 
															+                                    "start_time": start_time.isoformat()
														
 
															+                                },
														
 
															+                                "response": {
														
 
															+                                    "status_code": response.status_code,
														
 
															+                                    "data": response.text,
														
 
															+                                    "error": "JSON解析失败",
														
 
															+                                    "end_time": end_time.isoformat(),
														
 
															+                                    "duration": (end_time - start_time).total_seconds()
														
 
															+                                },
														
 
															+                                "success": False
														
 
															+                            }
														
 
															+                            self.api_calls.append(api_call_info)
														
 
															+
														
 
															+                            # 保存API结果到文件
														
 
															+                            api_results_dir = "api_results"
														
 
															+                            os.makedirs(api_results_dir, exist_ok=True)
														
 
															+                            filename = f"{call_id}.json"
														
 
															+                            filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+                            try:
														
 
															+                                with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                                    json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+                                print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+                            except Exception as e:
														
 
															+                                print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+                            return {
														
 
															+                                "success": True,
														
 
															+                                "data": response.text,
														
 
															+                                "extracted_result": None,
														
 
															+                                "status_code": response.status_code
														
 
															+                            }
														
 
															+                    else:
														
 
															+                        # 记录API调用结果（HTTP错误）
														
 
															+                        end_time = datetime.now()
														
 
															+                        call_id = f"api_{config_name}_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+                        api_call_info = {
														
 
															+                            "call_id": call_id,
														
 
															+                            "timestamp": end_time.isoformat(),
														
 
															+                            "agent": "MetricCalculationAgent",
														
 
															+                            "api_endpoint": url,
														
 
															+                            "config_name": config_name,
														
 
															+                            "request": {
														
 
															+                                "method": method,
														
 
															+                                "url": url,
														
 
															+                                "headers": headers,
														
 
															+                                "json_data": json_data if method.upper() == "POST" else None,
														
 
															+                                "params": params if method.upper() == "GET" else None,
														
 
															+                                "start_time": start_time.isoformat()
														
 
															+                            },
														
 
															+                            "response": {
														
 
															+                                "status_code": response.status_code,
														
 
															+                                "error": response.text,
														
 
															+                                "end_time": end_time.isoformat(),
														
 
															+                                "duration": (end_time - start_time).total_seconds()
														
 
															+                            },
														
 
															+                            "success": False
														
 
															+                        }
														
 
															+                        self.api_calls.append(api_call_info)
														
 
															+
														
 
															+                        # 保存API结果到文件
														
 
															+                        api_results_dir = "api_results"
														
 
															+                        os.makedirs(api_results_dir, exist_ok=True)
														
 
															+                        filename = f"{call_id}.json"
														
 
															+                        filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+                        try:
														
 
															+                            with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                                json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+                            print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+                        except Exception as e:
														
 
															+                            print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+                        return {
														
 
															+                            "success": False,
														
 
															+                            "message": f"API调用失败，状态码: {response.status_code}",
														
 
															+                            "response": response.text
														
 
															+                        }
														
 
															+
														
 
															+                    # 如果执行到这里，说明本次尝试成功，跳出重试循环
														
 
															+                    break
														
 
															+
														
 
															+                except requests.exceptions.Timeout:
														
 
															+                    # 记录API调用结果（超时）
														
 
															+                    end_time = datetime.now()
														
 
															+                    call_id = f"api_{config_name}_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+                    api_call_info = {
														
 
															+                        "call_id": call_id,
														
 
															+                        "timestamp": end_time.isoformat(),
														
 
															+                        "agent": "MetricCalculationAgent",
														
 
															+                        "api_endpoint": url,
														
 
															+                        "config_name": config_name,
														
 
															+                        "request": {
														
 
															+                            "method": method,
														
 
															+                            "url": url,
														
 
															+                            "headers": headers,
														
 
															+                            "json_data": json_data if method.upper() == "POST" else None,
														
 
															+                            "params": params if method.upper() == "GET" else None,
														
 
															+                            "start_time": start_time.isoformat()
														
 
															+                        },
														
 
															+                        "response": {
														
 
															+                            "error": "API调用超时",
														
 
															+                            "end_time": end_time.isoformat(),
														
 
															+                            "duration": (end_time - start_time).total_seconds()
														
 
															+                        },
														
 
															+                        "success": False
														
 
															+                    }
														
 
															+                    self.api_calls.append(api_call_info)
														
 
															+
														
 
															+                    # 保存API结果到文件
														
 
															+                    api_results_dir = "api_results"
														
 
															+                    os.makedirs(api_results_dir, exist_ok=True)
														
 
															+                    filename = f"{call_id}.json"
														
 
															+                    filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+                    try:
														
 
															+                        with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                            json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+                        print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+                    except Exception as e:
														
 
															+                        print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+                    # 如果不是最后一次尝试，等待后重试
														
 
															+                    if attempt < max_retries - 1:
														
 
															+                        print(f"⏳ API调用超时，{retry_delay}秒后重试...")
														
 
															+                        import time
														
 
															+                        time.sleep(retry_delay)
														
 
															+                        continue
														
 
															+                    else:
														
 
															+                        return {
														
 
															+                            "success": False,
														
 
															+                            "message": "API调用超时"
														
 
															+                        }
														
 
															+                except requests.exceptions.RequestException as e:
														
 
															+                    # 记录API调用结果（请求异常）
														
 
															+                    end_time = datetime.now()
														
 
															+                    call_id = f"api_{config_name}_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+                    api_call_info = {
														
 
															+                        "call_id": call_id,
														
 
															+                        "timestamp": end_time.isoformat(),
														
 
															+                        "agent": "MetricCalculationAgent",
														
 
															+                        "api_endpoint": url,
														
 
															+                        "config_name": config_name,
														
 
															+                        "request": {
														
 
															+                            "method": method,
														
 
															+                            "url": url,
														
 
															+                            "headers": headers,
														
 
															+                            "json_data": json_data if method.upper() == "POST" else None,
														
 
															+                            "params": params if method.upper() == "GET" else None,
														
 
															+                            "start_time": start_time.isoformat()
														
 
															+                        },
														
 
															+                        "response": {
														
 
															+                            "error": str(e),
														
 
															+                            "end_time": end_time.isoformat(),
														
 
															+                            "duration": (end_time - start_time).total_seconds()
														
 
															+                        },
														
 
															+                        "success": False
														
 
															+                    }
														
 
															+                    self.api_calls.append(api_call_info)
														
 
															+
														
 
															+                    # 保存API结果到文件
														
 
															+                    api_results_dir = "api_results"
														
 
															+                    os.makedirs(api_results_dir, exist_ok=True)
														
 
															+                    filename = f"{call_id}.json"
														
 
															+                    filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+                    try:
														
 
															+                        with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                            json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+                        print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+                    except Exception as e:
														
 
															+                        print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+                    # 如果不是最后一次尝试，等待后重试
														
 
															+                    if attempt < max_retries - 1:
														
 
															+                        print(f"❌ API调用异常: {str(e)}，{retry_delay}秒后重试...")
														
 
															+                        import time
														
 
															+                        time.sleep(retry_delay)
														
 
															+                        continue
														
 
															+                    else:
														
 
															+                        return {
														
 
															+                            "success": False,
														
 
															+                            "message": f"API调用异常: {str(e)}"
														
 
															+                        }
														
 
															+                except Exception as e:
														
 
															+                    # 记录API调用结果（其他异常）
														
 
															+                    end_time = datetime.now()
														
 
															+                    call_id = f"api_{config_name}_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+                    api_call_info = {
														
 
															+                        "call_id": call_id,
														
 
															+                        "timestamp": end_time.isoformat(),
														
 
															+                        "agent": "MetricCalculationAgent",
														
 
															+                        "api_endpoint": url,
														
 
															+                        "config_name": config_name,
														
 
															+                        "request": {
														
 
															+                            "method": method,
														
 
															+                            "url": url,
														
 
															+                            "headers": headers,
														
 
															+                            "json_data": json_data if method.upper() == "POST" else None,
														
 
															+                            "params": params if method.upper() == "GET" else None,
														
 
															+                            "start_time": start_time.isoformat()
														
 
															+                        },
														
 
															+                        "response": {
														
 
															+                            "error": str(e),
														
 
															+                            "end_time": end_time.isoformat(),
														
 
															+                            "duration": (end_time - start_time).total_seconds()
														
 
															+                        },
														
 
															+                        "success": False
														
 
															+                    }
														
 
															+                    self.api_calls.append(api_call_info)
														
 
															+
														
 
															+                    # 保存API结果到文件
														
 
															+                    api_results_dir = "api_results"
														
 
															+                    os.makedirs(api_results_dir, exist_ok=True)
														
 
															+                    filename = f"{call_id}.json"
														
 
															+                    filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+                    try:
														
 
															+                        with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                            json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+                        print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+                    except Exception as e:
														
 
															+                        print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+                    # 如果不是最后一次尝试，等待后重试
														
 
															+                    if attempt < max_retries - 1:
														
 
															+                        print(f"❌ 其他异常: {str(e)}，{retry_delay}秒后重试...")
														
 
															+                        import time
														
 
															+                        time.sleep(retry_delay)
														
 
															+                        continue
														
 
															+                    else:
														
 
															+                        return {
														
 
															+                            "success": False,
														
 
															+                            "message": f"API调用异常: {str(e)}"
														
 
															+                        }
														
 
															+        except Exception as e:
														
 
															+            # 处理所有未捕获的异常
														
 
															+            print(f"❌ API调用过程中发生未预期的错误: {str(e)}")
														
 
															+            return {
														
 
															+                "success": False,
														
 
															+                "message": f"API调用过程中发生未预期的错误: {str(e)}"
														
 
															+            }
														
 
															+
														
 
															+    def _prepare_request_data(self, config: Dict[str, Any], intent_result: Dict[str, Any], config_name: str) -> Dict[str, Any]:
														
 
															+        """
														
 
															+        准备API请求数据
														
 
															+
														
 
															+        Args:
														
 
															+            config: 配置文件
														
 
															+            intent_result: 意图识别结果
														
 
															+            config_name: 配置文件名
														
 
															+
														
 
															+        Returns:
														
 
															+            请求数据
														
 
															+        """
														
 
															+        # 从配置文件中获取question和prompt
														
 
															+        question = config.get("question", "")
														
 
															+        prompt = config.get("prompt", "")
														
 
															+
														
 
															+        # 选择对应的数据文件
														
 
															+        data_file_path = self._select_data_file(config_name)
														
 
															+        table_data = []
														
 
															+
														
 
															+        if data_file_path:
														
 
															+            table_data = self._load_table_data(data_file_path)
														
 
															+        else:
														
 
															+            print(f"警告：找不到配置文件 {config_name} 对应的数据文件")
														
 
															+
														
 
															+        # 构造documents数组
														
 
															+        documents = []
														
 
															+        if table_data:
														
 
															+            # 使用数据文件名作为标题
														
 
															+            title = f"数据表-{config_name}"
														
 
															+            if data_file_path:
														
 
															+                title = os.path.basename(data_file_path).replace('.json', '')
														
 
															+
														
 
															+            documents.append({
														
 
															+                "id": 1,
														
 
															+                "title": title,
														
 
															+                "text": "",
														
 
															+                "table": table_data
														
 
															+            })
														
 
															+
														
 
															+        # 构造API请求体
														
 
															+        request_data = {
														
 
															+            "disable_planning": False,
														
 
															+            "question": question,
														
 
															+            "prompt": prompt,
														
 
															+            "documents": documents
														
 
															+        }
														
 
															+
														
 
															+        return {"json": request_data}
														
 
															+
														
 
															+    def _extract_json_from_result(self, result_text: str) -> Dict[str, Any]:
														
 
															+        """
														
 
															+        从API结果文本中提取JSON内容
														
 
															+
														
 
															+        Args:
														
 
															+            result_text: API返回的result字段内容
														
 
															+
														
 
															+        Returns:
														
 
															+            提取的JSON对象
														
 
															+        """
														
 
															+        import re
														
 
															+        import json
														
 
															+
														
 
															+        try:
														
 
															+            # 查找```json和```之间的内容
														
 
															+            json_match = re.search(r'```json\s*(.*?)\s*```', result_text, re.DOTALL)
														
 
															+            if json_match:
														
 
															+                json_str = json_match.group(1).strip()
														
 
															+                return json.loads(json_str)
														
 
															+
														
 
															+            # 如果没有```json标记，查找大括号包围的内容
														
 
															+            brace_match = re.search(r'\{.*\}', result_text, re.DOTALL)
														
 
															+            if brace_match:
														
 
															+                json_str = brace_match.group(0).strip()
														
 
															+                return json.loads(json_str)
														
 
															+
														
 
															+            # 如果都找不到，尝试直接解析整个文本
														
 
															+            return json.loads(result_text.strip())
														
 
															+
														
 
															+        except json.JSONDecodeError as e:
														
 
															+            print(f"JSON解析失败: {e}")
														
 
															+            return {"error": f"无法解析JSON结果: {str(e)}", "raw_result": result_text}
														
 
															+
														
 
															+    def get_available_configs(self) -> List[str]:
														
 
															+        """获取所有可用的配置文件名"""
														
 
															+        return list(self.configs.keys())
														
 
															+
														
 
															+    def get_config_details(self, config_name: str) -> Optional[Dict]:
														
 
															+        """获取指定配置文件的详细信息"""
														
 
															+        return self.configs.get(config_name)
														
--- a/llmops/agents/outline_agent.py
+++ b/llmops/agents/outline_agent.py
@@ -1,94 +1,375 @@
 
															+"""
														
 
															+报告大纲生成Agent (Report Outline Generation Agent)
														
 
															+===============================================
														
 
															+
														
 
															+此Agent负责根据用户需求和数据样本，生成专业的报告大纲结构。
														
 
															+
														
 
															+核心功能：
														
 
															+1. 分析用户需求：理解报告目标和关键指标
														
 
															+2. 数据结构分析：识别可用字段和数据特征
														
 
															+3. 大纲生成：创建结构化的报告章节和指标需求
														
 
															+4. 智能推断：自动推断所需字段和计算逻辑
														
 
															+
														
 
															+工作流程：
														
 
															+1. 接收用户查询和数据样本
														
 
															+2. 分析数据结构和可用字段
														
 
															+3. 生成报告标题和章节结构
														
 
															+4. 定义全局指标需求
														
 
															+5. 返回结构化的大纲对象
														
 
															+
														
 
															+技术实现：
														
 
															+- 使用LangChain和结构化输出
														
 
															+- 支持异步处理
														
 
															+- 自动字段推断和补全
														
 
															+- 错误处理和默认值提供
														
 
															+
														
 
															+作者: Big Agent Team
														
 
															+版本: 1.0.0
														
 
															+创建时间: 2024-12-20
														
 
															+"""
														
 
															+
														
 
															 from typing import List, Dict, Any
														
 
															 from langchain_openai import ChatOpenAI
														
 
															 from langchain_core.prompts import ChatPromptTemplate
														
 
															-import json  # 确保导入json
														
 
															+import json
														
 
															+import os
														
 
															 import uuid
														
 
															+import requests
														
 
															+from datetime import datetime
														
 
															+
														
 
															+from pydantic import BaseModel, Field
														
 
															+
														
 
															+
														
 
															+# 数据模型定义（与现有项目兼容）
														
 
															+class MetricRequirement(BaseModel):
														
 
															+    """指标需求定义"""
														
 
															+    metric_id: str = Field(description="指标唯一标识，如 'total_income_jan'")
														
 
															+    metric_name: str = Field(description="指标中文名称")
														
 
															+    calculation_logic: str = Field(description="计算逻辑描述")
														
 
															+    required_fields: List[str] = Field(description="所需字段")
														
 
															+    dependencies: List[str] = Field(default_factory=list, description="依赖的其他指标ID")
														
 
															+
														
 
															+
														
 
															+class ReportSection(BaseModel):
														
 
															+    """报告大纲章节"""
														
 
															+    section_id: str = Field(description="章节ID")
														
 
															+    title: str = Field(description="章节标题")
														
 
															+    description: str = Field(description="章节内容要求")
														
 
															+    metrics_needed: List[str] = Field(description="所需指标ID列表")
														
 
															-from llmops.agents.state import AgentState, ReportOutline, ReportSection, MetricRequirement, convert_numpy_types
														
 
															-from llmops.agents.datadev.llm import get_llm
														
 
															+class ReportOutline(BaseModel):
														
 
															+    """完整报告大纲"""
														
 
															+    report_title: str = Field(description="报告标题")
														
 
															+    sections: List[ReportSection] = Field(description="章节列表")
														
 
															+    global_metrics: List[MetricRequirement] = Field(description="全局指标列表")
														
 
															-class OutlineGenerator:
														
 
															+
														
 
															+class OutlineGeneratorAgent:
														
 
															     """大纲生成智能体：将报告需求转化为结构化大纲"""
														
 
															-    def __init__(self, llm):
														
 
															-        self.llm = llm.with_structured_output(ReportOutline)
														
 
															+    def __init__(self, api_key: str, base_url: str = "https://api.deepseek.com"):
														
 
															+        """
														
 
															+        初始化大纲生成Agent
														
 
															+
														
 
															+        Args:
														
 
															+            api_key: DeepSeek API密钥
														
 
															+            base_url: DeepSeek API基础URL
														
 
															+        """
														
 
															+        self.llm = ChatOpenAI(
														
 
															+            model="deepseek-chat",
														
 
															+            api_key=api_key,
														
 
															+            base_url=base_url,
														
 
															+            temperature=0.1
														
 
															+        )
														
 
															-    def create_prompt(self, question: str, sample_data: List[Dict]) -> str:
														
 
															+        # 初始化API调用跟踪
														
 
															+        self.api_calls = []
														
 
															+
														
 
															+        # 获取可用的知识元数据
														
 
															+        self.available_knowledge = self._load_available_knowledge()
														
 
															+
														
 
															+
														
 
															+
														
 
															+    def _convert_new_format_to_outline(self, new_format_data: Dict[str, Any]) -> Dict[str, Any]:
														
 
															+        """将新的JSON格式转换为原来的ReportOutline格式"""
														
 
															+
														
 
															+        # 转换sections
														
 
															+        sections = []
														
 
															+        for section_data in new_format_data.get("sections", []):
														
 
															+            # 从metrics中提取指标名称
														
 
															+            metrics_needed = []
														
 
															+            for metric_type in ["calculation_metrics", "statistical_metrics", "analysis_metrics"]:
														
 
															+                for metric in section_data.get("metrics", {}).get(metric_type, []):
														
 
															+                    # 这里可以根据metric_name映射到实际的metric_id
														
 
															+                    # 暂时使用metric_name作为metric_id
														
 
															+                    metrics_needed.append(metric.get("metric_name", ""))
														
 
															+
														
 
															+            section = {
														
 
															+                "section_id": section_data.get("section_id", ""),
														
 
															+                "title": section_data.get("section_title", ""),
														
 
															+                "description": section_data.get("section_description", ""),
														
 
															+                "metrics_needed": metrics_needed
														
 
															+            }
														
 
															+            sections.append(section)
														
 
															+
														
 
															+        # 生成global_metrics：使用知识ID进行匹配，并强制添加更多农业相关指标
														
 
															+        global_metrics = []
														
 
															+        used_knowledge_ids = set()
														
 
															+
														
 
															+        # 首先处理LLM生成的指标
														
 
															+        for section in sections:
														
 
															+            for metric_name in section["metrics_needed"]:
														
 
															+                # 查找对应的指标描述（从原始数据中获取）
														
 
															+                metric_description = ""
														
 
															+                for section_data in new_format_data.get("sections", []):
														
 
															+                    for metric_type in ["calculation_metrics", "statistical_metrics", "analysis_metrics"]:
														
 
															+                        for metric in section_data.get("metrics", {}).get(metric_type, []):
														
 
															+                            if metric.get("metric_name") == metric_name:
														
 
															+                                metric_description = metric.get("metric_description", "")
														
 
															+                                break
														
 
															+                        if metric_description:
														
 
															+                            break
														
 
															+                    if metric_description:
														
 
															+                        break
														
 
															+
														
 
															+                # 使用知识ID匹配算法找到最佳匹配
														
 
															+                knowledge_id = self._match_metric_to_knowledge(metric_name, metric_description)
														
 
															+
														
 
															+                # 如果找到匹配的知识ID，使用它作为metric_id
														
 
															+                if knowledge_id and knowledge_id not in used_knowledge_ids:
														
 
															+                    global_metrics.append({
														
 
															+                        "metric_id": knowledge_id,  # 使用知识ID作为metric_id
														
 
															+                        "metric_name": metric_name,
														
 
															+                        "calculation_logic": f"使用规则引擎计算{metric_name}: {metric_description}",
														
 
															+                        "required_fields": ["transactions"],  # 规则引擎使用transactions数据
														
 
															+                        "dependencies": []
														
 
															+                    })
														
 
															+                    used_knowledge_ids.add(knowledge_id)
														
 
															+                else:
														
 
															+                    # 如果没有找到匹配的知识ID，生成一个基本的MetricRequirement作为备选
														
 
															+                    if not any(m.get("metric_id") == metric_name for m in global_metrics):
														
 
															+                        print(f"⚠️ 指标 '{metric_name}' 未找到匹配的知识ID，使用默认配置")
														
 
															+                        global_metrics.append({
														
 
															+                            "metric_id": metric_name,
														
 
															+                            "metric_name": metric_name,
														
 
															+                            "calculation_logic": f"计算{metric_name}: {metric_description}",
														
 
															+                            "required_fields": ["txAmount", "txDirection"],
														
 
															+                            "dependencies": []
														
 
															+                        })
														
 
															+
														
 
															+        # 注意：现在依赖LLM根据提示词生成包含所有必需指标的大纲，不再在代码中强制添加
														
 
															+
														
 
															+        # 如果LLM没有提供任何指标，则自动补充基础指标
														
 
															+        if not global_metrics:
														
 
															+            print("⚠️ LLM未提供指标，使用默认基础指标")
														
 
															+            available_metrics = self._load_available_metrics()
														
 
															+
														
 
															+            # 选择前5个基础指标
														
 
															+            base_metrics = [m for m in available_metrics if m.get('type') == '基础统计指标'][:5]
														
 
															+
														
 
															+            for metric in base_metrics:
														
 
															+                metric_name = metric['name']
														
 
															+                knowledge_id = f"metric-{metric_name}"
														
 
															+                if sections:  # 确保有章节
														
 
															+                    sections[0]["metrics_needed"].append(knowledge_id)  # 添加到第一个章节
														
 
															+                global_metrics.append({
														
 
															+                    "metric_id": knowledge_id,
														
 
															+                    "metric_name": metric_name,
														
 
															+                    "calculation_logic": f"使用规则引擎计算{metric_name}: {metric.get('description', '')}",
														
 
															+                    "required_fields": ["transactions"],
														
 
															+                    "dependencies": []
														
 
															+                })
														
 
															+
														
 
															+        print(f"📊 最终生成 {len(global_metrics)} 个指标")
														
 
															+
														
 
															+        return {
														
 
															+            "report_title": new_format_data.get("chapter_title", "流水分析报告"),
														
 
															+            "sections": sections,
														
 
															+            "global_metrics": global_metrics
														
 
															+        }
														
 
															+
														
 
															+    def create_prompt(self) -> str:
														
 
															         """创建大纲生成提示"""
														
 
															-        available_fields = list(sample_data[0].keys()) if sample_data else []
														
 
															-        sample_str = json.dumps(sample_data[:2], ensure_ascii=False, indent=2)
														
 
															-
														
 
															-        # 关键修复：提供详细的字段说明和示例
														
 
															-        return f"""你是银行流水报告大纲专家。根据用户需求和样本数据，生成专业、可执行的报告大纲。
														
 
															-
														
 
															-需求分析：
														
 
															-{question}
														
 
															-
														
 
															-可用字段：
														
 
															-{', '.join(available_fields)}
														
 
															-
														
 
															-样本数据：
														
 
															-{sample_str}
														
 
															-
														
 
															-输出要求（必须生成有效的JSON）：
														
 
															-1. report_title: 报告标题（字符串）
														
 
															-2. sections: 章节列表，每个章节必须包含：
														
 
															-   - section_id: 章节唯一ID（如"sec_1", "sec_2"）
														
 
															-   - title: 章节标题
														
 
															-   - description: 章节描述
														
 
															-   - metrics_needed: 所需指标ID列表（字符串数组，可为空）
														
 
															-3. global_metrics: 全局指标列表，每个指标必须包含：
														
 
															-   - metric_id: 指标唯一ID（如"total_income", "avg_balance"）
														
 
															-   - metric_name: 指标名称
														
 
															-   - calculation_logic: 计算逻辑描述
														
 
															-   - required_fields: 所需字段列表
														
 
															-   - dependencies: 依赖的其他指标ID（可为空）
														
 
															-
														
 
															-重要提示：
														
 
															-- 必须生成section_id，格式为"sec_1", "sec_2"等
														
 
															-- 必须生成metric_id，格式为字母+下划线+描述
														
 
															-- metrics_needed必须是字符串数组
														
 
															-- 确保所有字段都存在，不能缺失
														
 
															-
														
 
															-输出示例：
														
 
															+        # 从API动态获取可用的指标列表
														
 
															+        available_metrics = self._load_available_metrics()
														
 
															+
														
 
															+        # 构建指标列表文本
														
 
															+        metrics_list_text = "指标名称\t指标类型\t指标描述\n"
														
 
															+        for metric in available_metrics:
														
 
															+            metrics_list_text += f"{metric['name']}\t{metric.get('type', '计算型指标')}\t{metric.get('description', '')}\n"
														
 
															+
														
 
															+        # 构建基础提示词
														
 
															+        base_prompt = f"""[角色定义]
														
 
															+你的角色是: 流水分析报告的大纲生成模块。
														
 
															+你的目标是:
														
 
															+基于输入的流水分析业务背景信息,
														
 
															+生成一份可交付、结构清晰、可被程序解析的流水分析报告大纲,
														
 
															+并以结构化 JSON 的形式，明确每个章节及其下属分析主题所需的分析指标与分析项要求,
														
 
															+以指导后续分析能力的调用。
														
 
															+
														
 
															+[职责边界]
														
 
															+你只能完成以下事项:
														
 
															+1.确定流水分析报告应包含的章节结构
														
 
															+2.明确每个章节下需要覆盖的分析主题
														
 
															+3.为每个分析主题列出所需的计算指标、统计指标或分析指标
														
 
															+
														
 
															+你不得做以下任何事情:
														
 
															+1.不得计算任何指标
														
 
															+2.不得对流水数据进行分析
														
 
															+3.不得判断交易是否异常或存在风险
														
 
															+4.不得生成任何分析结论、判断性描述或报告正文
														
 
															+5.不得决定分析执行顺序或分析方法
														
 
															+
														
 
															+你输出的内容仅是"分析需求清单"，而不是"分析结果"。
														
 
															+
														
 
															+[可用指标总览]
														
 
															+系统当前支持 {len(available_metrics)} 个指标。
														
 
															+
														
 
															+[重要要求]
														
 
															+请根据用户需求和可用指标列表，从上述指标中选择最相关的指标。优先选择基础统计指标和时间分析指标，确保报告的完整性和实用性。
														
 
															+
														
 
															+[强制要求]
														
 
															+生成大纲时，请：
														
 
															+1. 从可用指标中选择合适的指标组合
														
 
															+2. 确保选择的指标能够满足用户分析需求
														
 
															+3. 在metrics_needed数组中列出选定的指标名称
														
 
															+4. 在global_metrics数组中包含对应指标的详细定义
														
 
															+
														
 
															+[可选择的指标列表]
														
 
															+{metrics_list_text}
														
 
															+
														
 
															+[重要兼容性要求]
														
 
															+虽然你必须使用上述JSON结构输出，但为了确保与现有系统的兼容性，请在输出中额外包含以下字段：
														
 
															+- 在根级别添加 "report_title": "流水分析报告"
														
 
															+- 在根级别添加 "global_metrics": [] (空数组或根据实际需求填充指标定义)
														
 
															+- 确保输出能被现有系统正确解析和使用
														
 
															+
														
 
															+[输出格式要求]
														
 
															+你必须且只能以 JSON 字符串 形式输出分析大纲，不得输出任何解释性自然语言。
														
 
															+JSON 必须严格遵循以下结构约定:
														
 
															 {{
														
 
															-  "report_title": "2024年第三季度分析报告",
														
 
															+  "chapter_id": "string",
														
 
															+  "chapter_title": "string",
														
 
															+  "chapter_type": "string",
														
 
															   "sections": [
														
 
															     {{
														
 
															-      "section_id": "sec_1",
														
 
															-      "title": "收入概览",
														
 
															-      "description": "分析收入总额",
														
 
															-      "metrics_needed": ["total_income", "avg_income"]
														
 
															+      "section_id": "string",
														
 
															+      "section_title": "string",
														
 
															+      "section_description": "string",
														
 
															+      "metrics_needed": ["string"]
														
 
															     }}
														
 
															   ],
														
 
															-  "global_metrics": [
														
 
															-    {{
														
 
															-      "metric_id": "total_income",
														
 
															-      "metric_name": "总收入",
														
 
															-      "calculation_logic": "sum of all income transactions",
														
 
															-      "required_fields": ["txAmount", "txDirection"],
														
 
															-      "dependencies": []
														
 
															-    }}
														
 
															-  ]
														
 
															+  "global_metrics": []
														
 
															 }}"""
														
 
															-    async def generate(self, state: AgentState) -> ReportOutline:
														
 
															+        return base_prompt
														
 
															+
														
 
															+        print(f"📊 最终生成 {len(global_metrics)} 个指标")
														
 
															+
														
 
															+        return {
														
 
															+            "report_title": new_format_data.get("chapter_title", "流水分析报告"),
														
 
															+            "sections": sections,
														
 
															+            "global_metrics": global_metrics
														
 
															+        }
														
 
															+
														
 
															+
														
 
															+    async def generate_outline(self, question: str, industry: str, sample_data: List[Dict[str, Any]]) -> ReportOutline:
														
 
															         """异步生成大纲（修复版：自动补全缺失字段）"""
														
 
															-        prompt = self.create_prompt(
														
 
															-            question=state["question"],
														
 
															-            sample_data=state["data_set"][:2]
														
 
															-        )
														
 
															+        prompt = self.create_prompt()
														
 
															+
														
 
															+        # 在prompt末尾添加业务背景信息
														
 
															+        full_prompt = f"""{prompt}
														
 
															+
														
 
															+【业务背景信息】
														
 
															+行业：{industry}
														
 
															+产品类型：经营贷
														
 
															+客群类型：小微企业"""
														
 
															         messages = [
														
 
															             ("system", "你是一名专业的报告大纲生成专家，必须输出完整、有效的JSON格式，包含所有必需字段。"),
														
 
															-            ("user", prompt)
														
 
															+            ("user", full_prompt)
														
 
															         ]
														
 
															-        outline = await self.llm.ainvoke(messages)
														
 
															-
														
 
															-        # 关键修复：后处理，补全缺失的section_id和metric_id
														
 
															+        # 记录大模型输入
														
 
															+        print("========================================")
														
 
															+        print("[AGENT] OutlineGeneratorAgent (大纲生成Agent)")
														
 
															+        print(f"[KNOWLEDGE_BASE] 已加载 {len(self.available_knowledge)} 个知识元数据")
														
 
															+        if self.available_knowledge:
														
 
															+            sample_knowledge = self.available_knowledge[:3]  # 显示前3个作为示例
														
 
															+            print(f"[KNOWLEDGE_SAMPLE] 示例知识: {[k.get('id', '') for k in sample_knowledge]}")
														
 
															+        print("[MODEL_INPUT] OutlineGeneratorAgent:")
														
 
															+        print(f"[CONTEXT] 基于用户需求和数据样本生成报告大纲")
														
 
															+        print(f"Question: {question}")
														
 
															+        print(f"Sample data count: {len(sample_data)}")
														
 
															+        print("========================================")
														
 
															+
														
 
															+        # 执行API调用
														
 
															+        start_time = datetime.now()
														
 
															+        response = await self.llm.ainvoke(messages)
														
 
															+        end_time = datetime.now()
														
 
															+
														
 
															+        # 解析JSON响应
														
 
															+        try:
														
 
															+            # 从响应中提取JSON内容
														
 
															+            content = response.content if hasattr(response, 'content') else str(response)
														
 
															+            # 尝试找到JSON部分
														
 
															+            json_start = content.find('{')
														
 
															+            json_end = content.rfind('}') + 1
														
 
															+            if json_start >= 0 and json_end > json_start:
														
 
															+                json_str = content[json_start:json_end]
														
 
															+                outline_data = json.loads(json_str)
														
 
															+
														
 
															+                # 转换新的JSON格式为原来的ReportOutline格式
														
 
															+                converted_data = self._convert_new_format_to_outline(outline_data)
														
 
															+                outline = ReportOutline(**converted_data)
														
 
															+            else:
														
 
															+                raise ValueError("No JSON found in response")
														
 
															+        except Exception as e:
														
 
															+            print(f"解析大纲响应失败: {e}，使用默认大纲")
														
 
															+            # 不在这里创建大纲，在函数末尾统一处理
														
 
															+
														
 
															+        # 记录API调用结果
														
 
															+        call_id = f"api_mll_大纲生成_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+        api_call_info = {
														
 
															+            "call_id": call_id,
														
 
															+            "timestamp": end_time.isoformat(),
														
 
															+            "agent": "OutlineGeneratorAgent",
														
 
															+            "model": "deepseek-chat",
														
 
															+            "request": {
														
 
															+                "question": question,
														
 
															+                "sample_data_count": len(sample_data),
														
 
															+                "prompt": prompt,
														
 
															+                "start_time": start_time.isoformat()
														
 
															+            },
														
 
															+            "response": {
														
 
															+                "content": content,
														
 
															+                "end_time": end_time.isoformat(),
														
 
															+                "duration": (end_time - start_time).total_seconds()
														
 
															+            },
														
 
															+            "success": True
														
 
															+        }
														
 
															+        self.api_calls.append(api_call_info)
														
 
															+
														
 
															+        # 保存API结果到文件
														
 
															+        api_results_dir = "api_results"
														
 
															+        os.makedirs(api_results_dir, exist_ok=True)
														
 
															+        filename = f"{call_id}.json"
														
 
															+        filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+        try:
														
 
															+            with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+            print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+        except Exception as e:
														
 
															+            print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+        # 记录大模型输出
														
 
															+        print(f"[MODEL_OUTPUT] OutlineGeneratorAgent: {json.dumps(outline.dict() if hasattr(outline, 'dict') else outline, ensure_ascii=False)}")
														
 
															+        print("========================================")
														
 
															+
														
 
															+        # 后处理，补全缺失的section_id和metric_id
														
 
															         outline = self._post_process_outline(outline)
														
 
															         return outline
														
@@ -143,92 +424,304 @@ class OutlineGenerator:
 
															         return list(set(fields))
														
 
															+    def _load_available_knowledge(self) -> List[Dict[str, Any]]:
														
 
															+        """
														
 
															+        从规则引擎获取可用的知识元数据
														
 
															-async def outline_node(state: AgentState) -> AgentState:
														
 
															-    """大纲生成节点：设置成功标志，防止重复生成"""
														
 
															-
														
 
															-    llm = get_llm()
														
 
															-    generator = OutlineGenerator(llm)
														
 
															-
														
 
															-    try:
														
 
															-        # 异步生成大纲
														
 
															-        outline = await generator.generate(state)
														
 
															-
														
 
															-        # 更新状态
														
 
															-        new_state = state.copy()
														
 
															-        new_state["outline_draft"] = outline
														
 
															-        new_state["outline_version"] += 1
														
 
															-
														
 
															-        # 防护：设置成功标志
														
 
															-        new_state["outline_ready"] = True  # 明确标志：大纲已就绪
														
 
															-
														
 
															-        new_state["metrics_requirements"] = outline.global_metrics
														
 
															-        new_state["metrics_pending"] = outline.global_metrics.copy()  # 待计算指标
														
 
															-        new_state["messages"].append(
														
 
															-            ("ai", f"✅ 大纲生成完成 v{new_state['outline_version']}：{outline.report_title}")
														
 
															-        )
														
 
															-
														
 
															-        print(f"\n📝 大纲已生成：{outline.report_title}")
														
 
															-        print(f"   章节数：{len(outline.sections)}")
														
 
															-        print(f"   指标数：{len(outline.global_metrics)}")
														
 
															-
														
 
															-        # 新增：详细打印大纲内容
														
 
															-        print("\n" + "=" * 70)
														
 
															-        print("📋 详细大纲内容")
														
 
															-        print("=" * 70)
														
 
															-        print(json.dumps(outline.dict(), ensure_ascii=False, indent=2))
														
 
															-        print("=" * 70)
														
 
															-
														
 
															-        # 关键修复：返回前清理状态
														
 
															-        return convert_numpy_types(new_state)
														
 
															-
														
 
															-    except Exception as e:
														
 
															-        print(f"⚠️ 大纲生成出错: {e}，使用默认结构")
														
 
															-
														
 
															-        # 创建默认大纲
														
 
															-        default_outline = ReportOutline(
														
 
															-            report_title="默认交易分析报告",
														
 
															-            sections=[
														
 
															-                ReportSection(
														
 
															-                    section_id="sec_1",
														
 
															-                    title="交易概览",
														
 
															-                    description="基础交易情况分析",
														
 
															-                    metrics_needed=["total_transactions", "total_income", "total_expense"]
														
 
															-                )
														
 
															-            ],
														
 
															-            global_metrics=[
														
 
															-                MetricRequirement(
														
 
															-                    metric_id="total_transactions",
														
 
															-                    metric_name="总交易笔数",
														
 
															-                    calculation_logic="count all transactions",
														
 
															-                    required_fields=["txId"],
														
 
															-                    dependencies=[]
														
 
															-                ),
														
 
															-                MetricRequirement(
														
 
															-                    metric_id="total_income",
														
 
															-                    metric_name="总收入",
														
 
															-                    calculation_logic="sum of income transactions",
														
 
															-                    required_fields=["txAmount", "txDirection"],
														
 
															-                    dependencies=[]
														
 
															-                )
														
 
															-            ]
														
 
															-        )
														
 
															+        Returns:
														
 
															+            知识元数据列表，包含id和description
														
 
															+        """
														
 
															+        try:
														
 
															+            url = "http://localhost:8081/api/rules/getKnowledgeMeta"
														
 
															+            headers = {
														
 
															+                "Accept": "*/*",
														
 
															+                "Accept-Encoding": "gzip, deflate, br",
														
 
															+                "Connection": "keep-alive",
														
 
															+                "Content-Type": "application/json",
														
 
															+                "User-Agent": "PostmanRuntime-ApipostRuntime/1.1.0"
														
 
															+            }
														
 
															+
														
 
															+            response = requests.post(url, headers=headers, json={}, timeout=30)
														
 
															+
														
 
															+            if response.status_code == 200:
														
 
															+                knowledge_meta = response.json()
														
 
															+                if isinstance(knowledge_meta, list):
														
 
															+                    print(f"✅ 成功获取 {len(knowledge_meta)} 个知识元数据")
														
 
															+                    return knowledge_meta
														
 
															+                else:
														
 
															+                    print(f"⚠️ 知识元数据格式异常: {knowledge_meta}")
														
 
															+                    return []
														
 
															+            else:
														
 
															+                print(f"❌ 获取知识元数据失败，状态码: {response.status_code}")
														
 
															+                print(f"响应内容: {response.text}")
														
 
															+                return []
														
 
															+
														
 
															+        except Exception as e:
														
 
															+            print(f"❌ 获取知识元数据时发生错误: {str(e)}")
														
 
															+            return []
														
 
															+
														
 
															+    def _load_available_metrics(self) -> List[Dict[str, str]]:
														
 
															+        """
														
 
															+        从知识库中提取可用的指标列表
														
 
															-        new_state = state.copy()
														
 
															-        new_state["outline_draft"] = default_outline
														
 
															-        new_state["outline_version"] += 1
														
 
															-        new_state["outline_ready"] = True  # 即使默认也标记为就绪
														
 
															-        new_state["metrics_requirements"] = default_outline.global_metrics
														
 
															-        new_state["messages"].append(
														
 
															-            ("ai", f"⚠️ 使用默认大纲 v{new_state['outline_version']}")
														
 
															-        )
														
 
															+        Returns:
														
 
															+            指标列表，包含name和description字段
														
 
															+        """
														
 
															+        knowledge_list = self._load_available_knowledge()
														
 
															+
														
 
															+        metrics = []
														
 
															+        for knowledge in knowledge_list:
														
 
															+            knowledge_id = knowledge.get("id", "")
														
 
															+            description = knowledge.get("description", "")
														
 
															+
														
 
															+            # 从知识ID中提取指标名称
														
 
															+            if knowledge_id.startswith("metric-"):
														
 
															+                metric_name = knowledge_id.replace("metric-", "")
														
 
															+
														
 
															+                # 从描述中提取更简洁的指标描述
														
 
															+                short_description = self._extract_metric_description(description)
														
 
															+
														
 
															+                metrics.append({
														
 
															+                    "name": metric_name,
														
 
															+                    "description": short_description,
														
 
															+                    "type": self._classify_metric_type(metric_name, description)
														
 
															+                })
														
 
															+
														
 
															+        print(f"✅ 从知识库中提取了 {len(metrics)} 个可用指标")
														
 
															+        return metrics
														
 
															+
														
 
															+    def _extract_metric_description(self, full_description: str) -> str:
														
 
															+        """从完整描述中提取简洁的指标描述"""
														
 
															+        # 移除"因子概述："等前缀
														
 
															+        description = full_description.replace("因子概述：", "").strip()
														
 
															+
														
 
															+        # 如果描述太长，取前50个字符
														
 
															+        if len(description) > 50:
														
 
															+            description = description[:50] + "..."
														
 
															+
														
 
															+        return description
														
 
															+
														
 
															+    def _classify_metric_type(self, metric_name: str, description: str) -> str:
														
 
															+        """根据指标名称和描述分类指标类型"""
														
 
															+        if any(keyword in metric_name for keyword in ["收入", "支出", "金额", "交易笔数"]):
														
 
															+            return "基础统计指标"
														
 
															+        elif any(keyword in metric_name for keyword in ["时间范围", "时间跨度"]):
														
 
															+            return "时间分析指标"
														
 
															+        elif any(keyword in metric_name for keyword in ["比例", "占比", "构成"]):
														
 
															+            return "结构分析指标"
														
 
															+        elif any(keyword in metric_name for keyword in ["排名", "TOP", "前三"]):
														
 
															+            return "专项分析指标"
														
 
															+        elif any(keyword in metric_name for keyword in ["账户", "数量"]):
														
 
															+            return "账户分析指标"
														
 
															+        else:
														
 
															+            return "其他指标"
														
 
															+
														
 
															+    def _match_metric_to_knowledge(self, metric_name: str, metric_description: str) -> str:
														
 
															+        """
														
 
															+        根据指标名称和描述匹配最合适的知识ID
														
 
															-        # 新增：详细打印默认大纲内容
														
 
															-        print("\n" + "=" * 70)
														
 
															-        print("📋 默认大纲内容")
														
 
															-        print("=" * 70)
														
 
															-        print(json.dumps(default_outline.dict(), ensure_ascii=False, indent=2))
														
 
															-        print("=" * 70)
														
 
															+        Args:
														
 
															+            metric_name: 指标名称
														
 
															+            metric_description: 指标描述
														
 
															-        # 关键修复：返回前清理状态
														
 
															-        return convert_numpy_types(new_state)
														
 
															+        Returns:
														
 
															+            匹配的知识ID，如果没有找到则返回空字符串
														
 
															+        """
														
 
															+        if not self.available_knowledge:
														
 
															+            return ""
														
 
															+
														
 
															+        # 精确匹配：直接用指标名称匹配知识ID
														
 
															+        for knowledge in self.available_knowledge:
														
 
															+            knowledge_id = knowledge.get("id", "")
														
 
															+            # 去掉前缀匹配，如 "metric-分析账户数量" 匹配 "分析账户数量"
														
 
															+            if knowledge_id.startswith("metric-") and knowledge_id.replace("metric-", "") == metric_name:
														
 
															+                print(f"🔗 精确匹配指标 '{metric_name}' -> 知识ID: {knowledge_id}")
														
 
															+                return knowledge_id
														
 
															+
														
 
															+        # 扩展匹配：匹配更多的农业相关指标
														
 
															+        if "农业" in metric_name:
														
 
															+            if "总经营收入" in metric_name:
														
 
															+                # 匹配农业总经营收入
														
 
															+                for knowledge in self.available_knowledge:
														
 
															+                    if knowledge.get("id") == "metric-农业总经营收入":
														
 
															+                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业总经营收入")
														
 
															+                        return "metric-农业总经营收入"
														
 
															+            if "总经营支出" in metric_name:
														
 
															+                # 匹配农业总经营支出
														
 
															+                for knowledge in self.available_knowledge:
														
 
															+                    if knowledge.get("id") == "metric-农业总经营支出":
														
 
															+                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业总经营支出")
														
 
															+                        return "metric-农业总经营支出"
														
 
															+            if "交易对手收入排名TOP3" in metric_name or "收入排名" in metric_name:
														
 
															+                # 匹配农业交易对手收入TOP3
														
 
															+                for knowledge in self.available_knowledge:
														
 
															+                    if knowledge.get("id") == "metric-农业交易对手经营收入top3":
														
 
															+                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业交易对手经营收入top3")
														
 
															+                        return "metric-农业交易对手经营收入top3"
														
 
															+            if "交易对手支出排名TOP3" in metric_name or "支出排名" in metric_name:
														
 
															+                # 匹配农业交易对手支出TOP3
														
 
															+                for knowledge in self.available_knowledge:
														
 
															+                    if knowledge.get("id") == "metric-农业交易对手经营支出top3":
														
 
															+                        print(f"🔗 扩展匹配指标 '{metric_name}' -> 知识ID: metric-农业交易对手经营支出top3")
														
 
															+                        return "metric-农业交易对手经营支出top3"
														
 
															+
														
 
															+        # 如果精确匹配失败，使用关键词匹配
														
 
															+        keywords = [metric_name]
														
 
															+        if metric_description:
														
 
															+            # 从描述中提取关键信息
														
 
															+            desc_lower = metric_description.lower()
														
 
															+            if "收入" in metric_name or "收入" in desc_lower:
														
 
															+                keywords.extend(["收入", "总收入", "经营收入"])
														
 
															+            if "支出" in metric_name or "支出" in desc_lower:
														
 
															+                keywords.extend(["支出", "总支出", "经营支出"])
														
 
															+            if "排名" in metric_name or "top" in desc_lower:
														
 
															+                keywords.append("排名")
														
 
															+            if "比例" in metric_name or "占比" in desc_lower:
														
 
															+                keywords.append("比例")
														
 
															+            if "时间范围" in metric_name:
														
 
															+                keywords.append("时间范围")
														
 
															+            if "账户" in metric_name:
														
 
															+                keywords.append("账户")
														
 
															+
														
 
															+        best_match = None
														
 
															+        best_score = 0
														
 
															+
														
 
															+        for knowledge in self.available_knowledge:
														
 
															+            knowledge_id = knowledge.get("id", "")
														
 
															+            knowledge_desc = knowledge.get("description", "").lower()
														
 
															+
														
 
															+            # 计算匹配分数
														
 
															+            score = 0
														
 
															+            for keyword in keywords:
														
 
															+                if keyword.lower() in knowledge_desc:
														
 
															+                    score += 1
														
 
															+
														
 
															+            # 行业匹配加分
														
 
															+            if "黑色金属" in knowledge_desc and "黑色金属" in metric_name:
														
 
															+                score += 2
														
 
															+            if "农业" in knowledge_desc and "农业" in metric_name:
														
 
															+                score += 2
														
 
															+
														
 
															+            # 直接名称匹配加分
														
 
															+            if metric_name.lower() in knowledge_desc:
														
 
															+                score += 3
														
 
															+
														
 
															+            if score > best_score:
														
 
															+                best_score = score
														
 
															+                best_match = knowledge_id
														
 
															+
														
 
															+        if best_match and best_score > 0:
														
 
															+            print(f"🔗 关键词匹配指标 '{metric_name}' -> 知识ID: {best_match} (匹配分数: {best_score})")
														
 
															+            return best_match
														
 
															+
														
 
															+        print(f"❌ 指标 '{metric_name}' 未找到匹配的知识ID")
														
 
															+        return ""
														
 
															+
														
 
															+
														
 
															+async def generate_report_outline(question: str, industry: str, sample_data: List[Dict[str, Any]], api_key: str, max_retries: int = 3, retry_delay: float = 2.0) -> ReportOutline:
														
 
															+    """
														
 
															+    生成报告大纲的主函数，支持重试机制
														
 
															+
														
 
															+    Args:
														
 
															+        question: 用户查询问题
														
 
															+        industry: 行业
														
 
															+        sample_data: 数据样本
														
 
															+        api_key: API密钥
														
 
															+        max_retries: 最大重试次数，默认3次
														
 
															+        retry_delay: 重试间隔时间（秒），默认2秒
														
 
															+
														
 
															+    Returns:
														
 
															+        生成的报告大纲
														
 
															+    """
														
 
															+    import asyncio
														
 
															+    import time
														
 
															+
														
 
															+    agent = OutlineGeneratorAgent(api_key)
														
 
															+
														
 
															+    print(f"📝 开始生成报告大纲（最多重试 {max_retries} 次）...")
														
 
															+
														
 
															+    for attempt in range(max_retries):
														
 
															+        try:
														
 
															+            print(f"   尝试 {attempt + 1}/{max_retries}...")
														
 
															+            start_time = time.time()
														
 
															+
														
 
															+            outline = await agent.generate_outline(question, industry, sample_data)
														
 
															+
														
 
															+            elapsed_time = time.time() - start_time
														
 
															+            print(".2f")
														
 
															+            print("\n📝 大纲生成成功：")
														
 
															+            print(f"   标题：{outline.report_title}")
														
 
															+            print(f"   章节数：{len(outline.sections)}")
														
 
															+            print(f"   指标数：{len(outline.global_metrics)}")
														
 
															+
														
 
															+            return outline
														
 
															+
														
 
															+        except Exception as e:
														
 
															+            elapsed_time = time.time() - start_time if 'start_time' in locals() else 0
														
 
															+            print(".2f")
														
 
															+            print(f"   错误详情: {str(e)}")
														
 
															+
														
 
															+            # 如果不是最后一次尝试，等待后重试
														
 
															+            if attempt < max_retries - 1:
														
 
															+                print(f"   ⏳ {retry_delay} 秒后进行第 {attempt + 2} 次重试...")
														
 
															+                await asyncio.sleep(retry_delay)
														
 
															+                # 增加重试间隔，避免频繁调用
														
 
															+                retry_delay = min(retry_delay * 1.5, 10.0)  # 最多等待10秒
														
 
															+            else:
														
 
															+                print(f"   ❌ 已达到最大重试次数 ({max_retries})，使用默认结构")
														
 
															+
														
 
															+    # 所有重试都失败后，使用默认结构
														
 
															+    print("⚠️ 所有重试均失败，使用默认大纲结构")
														
 
															+
														
 
															+    # 获取实际可用的指标来构建默认大纲
														
 
															+    available_metrics = self._load_available_metrics()
														
 
															+
														
 
															+    # 选择一些基础指标作为默认值
														
 
															+    default_metric_ids = []
														
 
															+    default_global_metrics = []
														
 
															+
														
 
															+    # 优先选择基础统计指标
														
 
															+    base_metrics = [m for m in available_metrics if m.get('type') == '基础统计指标']
														
 
															+    if base_metrics:
														
 
															+        # 选择前3个基础指标
														
 
															+        for metric in base_metrics[:3]:
														
 
															+            metric_name = metric['name']
														
 
															+            knowledge_id = f"metric-{metric_name}"
														
 
															+            default_metric_ids.append(knowledge_id)
														
 
															+            default_global_metrics.append(MetricRequirement(
														
 
															+                metric_id=knowledge_id,
														
 
															+                metric_name=metric_name,
														
 
															+                calculation_logic=f"使用规则引擎计算{metric_name}: {metric.get('description', '')}",
														
 
															+                required_fields=["transactions"],
														
 
															+                dependencies=[]
														
 
															+            ))
														
 
															+
														
 
															+    # 如果基础指标不够，补充其他类型的指标
														
 
															+    if len(default_metric_ids) < 3:
														
 
															+        other_metrics = [m for m in available_metrics if m.get('type') != '基础统计指标']
														
 
															+        for metric in other_metrics[:3-len(default_metric_ids)]:
														
 
															+            metric_name = metric['name']
														
 
															+            knowledge_id = f"metric-{metric_name}"
														
 
															+            default_metric_ids.append(knowledge_id)
														
 
															+            default_global_metrics.append(MetricRequirement(
														
 
															+                metric_id=knowledge_id,
														
 
															+                metric_name=metric_name,
														
 
															+                calculation_logic=f"使用规则引擎计算{metric_name}: {metric.get('description', '')}",
														
 
															+                required_fields=["transactions"],
														
 
															+                dependencies=[]
														
 
															+            ))
														
 
															+
														
 
															+    # 创建使用实际指标的默认大纲
														
 
															+    default_outline = ReportOutline(
														
 
															+        report_title="默认交易分析报告",
														
 
															+        sections=[
														
 
															+            ReportSection(
														
 
															+                section_id="sec_1",
														
 
															+                title="交易概览",
														
 
															+                description="基础交易情况分析",
														
 
															+                metrics_needed=default_metric_ids
														
 
															+            )
														
 
															+        ],
														
 
															+        global_metrics=default_global_metrics
														
 
															+    )
														
 
															+    return default_outline
														
--- a/llmops/agents/planning_agent.py
+++ b/llmops/agents/planning_agent.py
@@ -1,17 +1,46 @@
 
															+"""
														
 
															+规划Agent (Planning Agent)
														
 
															+=========================
														
 
															+
														
 
															+此Agent负责分析当前状态并做出智能决策，决定下一步行动。
														
 
															+
														
 
															+核心功能：
														
 
															+1. 状态评估：分析大纲、指标计算进度和完整性
														
 
															+2. 决策制定：决定生成大纲、计算指标、完成报告或澄清需求
														
 
															+3. 优先级排序：确定最关键的任务和指标
														
 
															+4. 流程控制：管理整个报告生成工作流的执行顺序
														
 
															+
														
 
															+决策逻辑：
														
 
															+- 大纲为空 → 生成大纲
														
 
															+- 指标覆盖率 < 80% → 计算指标
														
 
															+- 指标覆盖率 ≥ 80% → 生成报告
														
 
															+- 需求模糊 → 澄清需求
														
 
															+
														
 
															+技术实现：
														
 
															+- 使用LangChain和结构化输出
														
 
															+- 支持异步处理
														
 
															+- 智能状态评估
														
 
															+- 灵活的决策机制
														
 
															+
														
 
															+作者: Big Agent Team
														
 
															+版本: 1.0.0
														
 
															+创建时间: 2024-12-20
														
 
															+"""
														
 
															+
														
 
															 from typing import List, Dict, Optional, Any, Union
														
 
															 from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
														
 
															 from pydantic import BaseModel, Field
														
 
															 from langchain_openai import ChatOpenAI
														
 
															 import json
														
 
															-
														
 
															-from llmops.agents.state import AgentState, MetricRequirement, convert_numpy_types
														
 
															-from llmops.agents.datadev.llm import get_llm
														
 
															+import os
														
 
															+from datetime import datetime
														
 
															+# 数据模型定义
														
 
															 class ActionItem(BaseModel):
														
 
															     """动作项定义"""
														
 
															     action: str = Field(description="动作名称")
														
 
															-    parameters: Optional[Dict[str, Any]] = Field(default_factory=dict)
														
 
															+    parameters: Optional[Dict[str, Any]] = Field(default_factory=dict, description="动作参数")
														
 
															 class ClarificationRequest(BaseModel):
														
@@ -20,27 +49,30 @@ class ClarificationRequest(BaseModel):
 
															     missing_fields: List[str] = Field(default_factory=list, description="缺少的字段或信息")
														
 
															-class PlanningOutput(BaseModel):
														
 
															-    """规划决策输出 - 支持灵活格式"""
														
 
															+class PlanningDecision(BaseModel):
														
 
															+    """规划决策输出"""
														
 
															     decision: str = Field(
														
 
															-        description="决策类型: generate_outline, compute_metrics, finalize, clarify"
														
 
															+        description="决策类型: generate_outline, compute_metrics, finalize_report, clarify_requirements"
														
 
															     )
														
 
															     reasoning: str = Field(description="详细推理过程")
														
 
															     next_actions: List[Union[str, ActionItem]] = Field(
														
 
															         default_factory=list,
														
 
															         description="下一步动作列表"
														
 
															     )
														
 
															-    # 关键修复：明确传递待计算指标ID列表
														
 
															     metrics_to_compute: List[str] = Field(
														
 
															         default_factory=list,
														
 
															         description="待计算指标ID列表（如 ['total_income', 'avg_balance']）"
														
 
															     )
														
 
															+    priority_metrics: List[str] = Field(
														
 
															+        default_factory=list,
														
 
															+        description="优先级高的指标ID"
														
 
															+    )
														
 
															     additional_requirements: Optional[
														
 
															         Union[Dict[str, Any], List[Any], ClarificationRequest]
														
 
															     ] = Field(default=None, description="额外需求或澄清信息")
														
 
															-def normalize_additional_requirements(req: Any) -> Optional[Dict[str, Any]]:
														
 
															+def normalize_requirements(req: Any) -> Optional[Dict[str, Any]]:
														
 
															     """
														
 
															     规范化 additional_requirements
														
 
															     将列表转换为字典格式
														
@@ -61,160 +93,363 @@ def normalize_additional_requirements(req: Any) -> Optional[Dict[str, Any]]:
 
															     return {"raw": str(req)}
														
 
															-def create_planning_agent(llm, state: AgentState):
														
 
															-    """创建规划智能体（修复版：移除JSON示例，避免变量冲突）"""
														
 
															-    prompt = ChatPromptTemplate.from_messages([
														
 
															-        ("system", """你是报告规划总控智能体，核心职责是精准分析当前状态并决定下一步行动。
														
 
															+class PlanningAgent:
														
 
															+    """规划智能体：负责状态分析和决策制定"""
														
 
															+
														
 
															+    def __init__(self, api_key: str, base_url: str = "https://api.deepseek.com"):
														
 
															+        """
														
 
															+        初始化规划Agent
														
 
															+
														
 
															+        Args:
														
 
															+            api_key: DeepSeek API密钥
														
 
															+            base_url: DeepSeek API基础URL
														
 
															+        """
														
 
															+        self.llm = ChatOpenAI(
														
 
															+            model="deepseek-chat",
														
 
															+            api_key=api_key,
														
 
															+            base_url=base_url,
														
 
															+            temperature=0.1
														
 
															+        )
														
 
															+
														
 
															+        # 初始化API调用跟踪
														
 
															+        self.api_calls = []
														
 
															+
														
 
															+    def create_planning_prompt(self) -> ChatPromptTemplate:
														
 
															+        """创建规划提示模板"""
														
 
															+        return ChatPromptTemplate.from_messages([
														
 
															+            ("system", """你是报告规划总控智能体，核心职责是精准分析当前状态并决定下一步行动。
														
 
															 ### 决策选项（四选一）
														
 
															 1. generate_outline：大纲未生成或大纲无效
														
 
															 2. compute_metrics：大纲已生成但指标未完成（覆盖率<80%）
														
 
															-3. finalize：指标覆盖率≥80%，信息充足
														
 
															-4. clarify：用户需求模糊，缺少关键信息
														
 
															+3. finalize_report：指标覆盖率≥80%，信息充足
														
 
															+4. clarify_requirements：用户需求模糊，缺少关键信息
														
 
															 ### 决策规则（按顺序检查）
														
 
															 1. 检查 outline_draft 是否为空 → 空则选择 generate_outline
														
 
															 2. 检查 metrics_requirements 是否为空 → 空则选择 generate_outline
														
 
															-3. 计算指标覆盖率 = 已计算指标 / 总需求指标
														
 
															-   - 覆盖率 < 0.8 → 选择 compute_metrics
														
 
															-   - 覆盖率 ≥ 0.8 → 选择 finalize
														
 
															-4. 如果无法理解需求 → 选择 clarify
														
 
															+3. 检查是否有待计算指标 → 有则选择 compute_metrics
														
 
															+4. 所有指标都已计算完成 → 选择 finalize_report
														
 
															+5. 如果无法理解需求 → 选择 clarify_requirements
														
 
															 ### 重要原则
														
 
															 - 大纲草稿已存在时，不要重复生成大纲
														
 
															-- 决策为 compute_metrics 时，必须提供具体的指标ID列表
														
 
															+- 决策为 compute_metrics 时，必须从状态信息中的"有效待计算指标ID列表"中选择
														
 
															 - 确保 metrics_to_compute 是字符串数组格式
														
 
															+- 确保指标ID与大纲中的global_metrics.metric_id完全一致
														
 
															+- 从状态信息中的"有效待计算指标ID列表"中提取metric_id作为metrics_to_compute的值
														
 
															+- 计算失败的指标可以重试最多3次
														
 
															+- 绝对不要自己生成新的指标ID，必须严格使用状态信息中提供的已有指标ID
														
 
															+- 如果状态信息中没有可用的指标ID，不要生成compute_metrics决策
														
 
															 ### 输出字段说明
														
 
															 - decision: 决策字符串
														
 
															 - reasoning: 决策原因说明
														
 
															 - next_actions: 动作列表（可选）
														
 
															-- metrics_to_compute: 待计算指标ID列表（决策为compute_metrics时必须提供）
														
 
															+- metrics_to_compute: 待计算指标ID列表，必须从状态信息中的可用指标ID中选择（决策为compute_metrics时必须提供）
														
 
															+- priority_metrics: 优先级指标列表（前2-3个最重要的指标）
														
 
															 - additional_requirements: 额外需求（可选）
														
 
															 必须输出有效的JSON格式！"""),
														
 
															-    MessagesPlaceholder("messages"),
														
 
															+            MessagesPlaceholder("messages"),
														
 
															+
														
 
															+            ("user", "报告需求：{question}\n\n请输出决策结果。")
														
 
															+        ])
														
 
															+
														
 
															+    async def make_decision(self, question: str, industry: str, current_state: Dict[str, Any]) -> PlanningDecision:
														
 
															+        """
														
 
															+        根据当前状态做出规划决策
														
 
															+
														
 
															+        Args:
														
 
															+            question: 用户查询
														
 
															+            industry: 行业
														
 
															+            current_state: 当前状态信息
														
 
															+
														
 
															+        Returns:
														
 
															+            规划决策结果
														
 
															+        """
														
 
															+        planner = self.create_planning_prompt() | self.llm
														
 
															+
														
 
															+        # 构建状态评估上下文
														
 
															+        status_info = self._build_status_context(current_state)
														
 
															+
														
 
															+        # 记录大模型输入
														
 
															+        print("========================================")
														
 
															+        print("[AGENT] PlanningAgent (规划Agent)")
														
 
															+        print("[MODEL_INPUT] PlanningAgent:")
														
 
															+        print(f"[CONTEXT] 基于当前状态做出规划决策")
														
 
															+        print(f"Question: {question}")
														
 
															+        print(f"Status info: {status_info}")
														
 
															+        print("========================================")
														
 
															+
														
 
															+        # 执行规划
														
 
															+        start_time = datetime.now()
														
 
															+        response = await planner.ainvoke({
														
 
															+            "question": question,
														
 
															+            "industry": industry,
														
 
															+            "messages": [("system", status_info)]
														
 
															+        })
														
 
															+        end_time = datetime.now()
														
 
															+
														
 
															+        # 解析JSON响应
														
 
															+        try:
														
 
															+            # 从响应中提取JSON内容
														
 
															+            content = response.content if hasattr(response, 'content') else str(response)
														
 
															+            # 尝试找到JSON部分
														
 
															+            json_start = content.find('{')
														
 
															+            json_end = content.rfind('}') + 1
														
 
															+            if json_start >= 0 and json_end > json_start:
														
 
															+                json_str = content[json_start:json_end]
														
 
															+                decision_data = json.loads(json_str)
														
 
															+
														
 
															+                # 预处理 additional_requirements 字段
														
 
															+                if "additional_requirements" in decision_data:
														
 
															+                    req = decision_data["additional_requirements"]
														
 
															+                    if isinstance(req, str):
														
 
															+                        # 如果是字符串，尝试将其转换为合适的格式
														
 
															+                        if req.strip():
														
 
															+                            # 将字符串包装为字典格式
														
 
															+                            decision_data["additional_requirements"] = {"raw_content": req}
														
 
															+                        else:
														
 
															+                            # 空字符串设为 None
														
 
															+                            decision_data["additional_requirements"] = None
														
 
															+                    elif isinstance(req, list):
														
 
															+                        # 如果是列表，转换为字典格式
														
 
															+                        decision_data["additional_requirements"] = {
														
 
															+                            "questions": [str(item) for item in req],
														
 
															+                            "missing_fields": []
														
 
															+                        }
														
 
															+                    # 如果已经是 dict 或其他允许的类型，保持不变
														
 
															+
														
 
															+                decision = PlanningDecision(**decision_data)
														
 
															+
														
 
															+                # 验证决策的合理性
														
 
															+                if decision.decision == "compute_metrics":
														
 
															+                    if not decision.metrics_to_compute:
														
 
															+                        raise ValueError("AI决策缺少具体的指标ID")
														
 
															+                    # 如果AI生成的指标ID明显是错误的（比如metric_001），使用默认逻辑
														
 
															+                    if any(mid.startswith("metric_") and mid.replace("metric_", "").isdigit()
														
 
															+                          for mid in decision.metrics_to_compute):
														
 
															+                        raise ValueError("AI生成的指标ID格式不正确")
														
 
															+
														
 
															+            else:
														
 
															+                raise ValueError("No JSON found in response")
														
 
															+        except Exception as e:
														
 
															+            print(f"解析规划决策响应失败: {e}，使用默认决策")
														
 
															+            # 返回默认决策
														
 
															+            decision = self._get_default_decision(current_state)
														
 
															+
														
 
															+        # 记录API调用结果
														
 
															+        content = response.content if hasattr(response, 'content') else str(response)
														
 
															+        call_id = f"api_mll_规划决策_{'{:.2f}'.format((end_time - start_time).total_seconds())}"
														
 
															+        api_call_info = {
														
 
															+            "call_id": call_id,
														
 
															+            "timestamp": end_time.isoformat(),
														
 
															+            "agent": "PlanningAgent",
														
 
															+            "model": "deepseek-chat",
														
 
															+            "request": {
														
 
															+                "question": question,
														
 
															+                "status_info": status_info,
														
 
															+                "start_time": start_time.isoformat()
														
 
															+            },
														
 
															+            "response": {
														
 
															+                "content": content,
														
 
															+                "decision": decision.dict() if hasattr(decision, 'dict') else decision,
														
 
															+                "end_time": end_time.isoformat(),
														
 
															+                "duration": (end_time - start_time).total_seconds()
														
 
															+            },
														
 
															+            "success": True
														
 
															+        }
														
 
															+        self.api_calls.append(api_call_info)
														
 
															+
														
 
															+        # 保存API结果到文件
														
 
															+        api_results_dir = "api_results"
														
 
															+        os.makedirs(api_results_dir, exist_ok=True)
														
 
															+        filename = f"{call_id}.json"
														
 
															+        filepath = os.path.join(api_results_dir, filename)
														
 
															+
														
 
															+        try:
														
 
															+            with open(filepath, 'w', encoding='utf-8') as f:
														
 
															+                json.dump(api_call_info, f, ensure_ascii=False, indent=2)
														
 
															+            print(f"[API_RESULT] 保存API结果文件: {filepath}")
														
 
															+        except Exception as e:
														
 
															+            print(f"[ERROR] 保存API结果文件失败: {filepath}, 错误: {str(e)}")
														
 
															+
														
 
															+        # 记录大模型输出
														
 
															+        print(f"[MODEL_OUTPUT] PlanningAgent: {json.dumps(decision.dict() if hasattr(decision, 'dict') else decision, ensure_ascii=False)}")
														
 
															+        print("========================================")
														
 
															+
														
 
															+        return decision
														
 
															+
														
 
															+    def _build_status_context(self, state: Dict[str, Any]) -> str:
														
 
															+        """构建状态评估上下文"""
														
 
															+        required_count = len(state.get("metrics_requirements", []))
														
 
															+        computed_count = len(state.get("computed_metrics", {}))
														
 
															+        coverage = computed_count / required_count if required_count > 0 else 0
														
 
															+
														
 
															+        # 计算失败统计
														
 
															+        failed_attempts = state.get("failed_metric_attempts", {})
														
 
															+        pending_ids = state.get("pending_metric_ids", [])
														
 
															+
														
 
															+        # 过滤掉失败次数过多的指标
														
 
															+        max_retry = 3
														
 
															+        filtered_pending_ids = [
														
 
															+            mid for mid in pending_ids
														
 
															+            if failed_attempts.get(mid, 0) < max_retry
														
 
															+        ]
														
 
															+
														
 
															+        # 获取可用的指标ID
														
 
															+        available_metric_ids = []
														
 
															+        if state.get('outline_draft') and state.get('outline_draft').get('global_metrics'):
														
 
															+            available_metric_ids = [m.get('metric_id', '') for m in state['outline_draft']['global_metrics']]
														
 
															+            available_metric_ids = [mid for mid in available_metric_ids if mid]  # 过滤空值
														
 
															+
														
 
															+        return f"""当前状态评估：
														
 
															+- 规划步骤: {state.get('planning_step', 0)}
														
 
															+- 大纲版本: {state.get('outline_version', 0)}
														
 
															+- 大纲草稿存在: {state.get('outline_draft') is not None}
														
 
															+- 指标需求总数: {required_count}
														
 
															+- 已计算指标数: {computed_count}
														
 
															+- 指标覆盖率: {coverage:.2%}
														
 
															+- 待计算指标数: {len(pending_ids)}
														
 
															+- 有效待计算指标ID列表: {filtered_pending_ids}
														
 
															+- 可用指标ID列表: {available_metric_ids}
														
 
															+- 失败尝试记录: {failed_attempts}
														
 
															+"""
														
 
															-    ("user", "报告需求：{question}\n\n请输出决策结果。")
														
 
															-    ])
														
 
															-    return prompt | llm.with_structured_output(PlanningOutput)
														
 
															+def analyze_current_state(state: Dict[str, Any]) -> Dict[str, Any]:
														
 
															+    """
														
 
															+    分析当前状态，返回关键信息
														
 
															+    Args:
														
 
															+        state: 当前状态
														
 
															-async def planning_node(state: AgentState) -> AgentState:
														
 
															-    """规划节点：正确识别待计算指标并传递"""
														
 
															-    llm = get_llm()
														
 
															-    planner = create_planning_agent(llm, state)
														
 
															+    Returns:
														
 
															+        状态分析结果
														
 
															+    """
														
 
															+    required_metrics = state.get("metrics_requirements", [])
														
 
															+    computed_metrics = state.get("computed_metrics", {})
														
 
															-    # 构建完整的状态评估上下文
														
 
															-    required_count = len(state["metrics_requirements"])
														
 
															-    computed_count = len(state["computed_metrics"])
														
 
															+    # 计算覆盖率
														
 
															+    required_count = len(required_metrics)
														
 
															+    computed_count = len(computed_metrics)
														
 
															     coverage = computed_count / required_count if required_count > 0 else 0
														
 
															-    # 新增：跟踪失败次数，避免无限循环
														
 
															-    failed_attempts = state.get("failed_metric_attempts", {})
														
 
															-    pending_ids = state.get("pending_metric_ids", [])
														
 
															+    # 找出未计算的指标
														
 
															+    computed_ids = set(computed_metrics.keys())
														
 
															+    pending_metrics = [
														
 
															+        m for m in required_metrics
														
 
															+        if m.metric_id not in computed_ids
														
 
															+    ]
														
 
															-    # 过滤掉失败次数过多的指标
														
 
															+    # 检查失败次数
														
 
															+    failed_attempts = state.get("failed_metric_attempts", {})
														
 
															     max_retry = 3
														
 
															-    filtered_pending_ids = [
														
 
															-        mid for mid in pending_ids
														
 
															-        if failed_attempts.get(mid, 0) < max_retry
														
 
															+    valid_pending_metrics = [
														
 
															+        m for m in pending_metrics
														
 
															+        if failed_attempts.get(m.metric_id, 0) < max_retry
														
 
															     ]
														
 
															-    status_snapshot = f"""当前状态评估：
														
 
															-- 规划步骤: {state['planning_step']}
														
 
															-- 大纲版本: {state['outline_version']}
														
 
															-- 大纲草稿存在: {state['outline_draft'] is not None}
														
 
															-- 指标需求总数: {required_count}
														
 
															-- 已计算指标数: {computed_count}
														
 
															-- 指标覆盖率: {coverage:.2%}
														
 
															-- 待计算指标数: {len(pending_ids)}
														
 
															-- 有效待计算指标数: {len(filtered_pending_ids)}
														
 
															-- 失败尝试记录: {failed_attempts}
														
 
															+    return {
														
 
															+        "has_outline": state.get("outline_draft") is not None,
														
 
															+        "required_count": required_count,
														
 
															+        "computed_count": computed_count,
														
 
															+        "coverage": coverage,
														
 
															+        "pending_metrics": pending_metrics,
														
 
															+        "valid_pending_metrics": valid_pending_metrics,
														
 
															+        "pending_ids": [m.metric_id for m in pending_metrics],
														
 
															+        "valid_pending_ids": [m.metric_id for m in valid_pending_metrics],
														
 
															+        "planning_step": state.get("planning_step", 0),
														
 
															+        "outline_version": state.get("outline_version", 0)
														
 
															+    }
														
 
															+
														
 
															+
														
 
															+async def plan_next_action(question: str, industry: str, current_state: Dict[str, Any], api_key: str) -> PlanningDecision:
														
 
															+    """
														
 
															+    规划下一步行动的主函数
														
 
															-建议下一步: {"计算指标" if coverage < 0.8 else "生成报告"}"""
														
 
															+    Args:
														
 
															+        question: 用户查询
														
 
															+        current_state: 当前状态
														
 
															+        api_key: API密钥
														
 
															-    # 执行规划
														
 
															-    result = await planner.ainvoke({
														
 
															-        "question": state["question"],
														
 
															-        "messages": [("system", status_snapshot)]
														
 
															-    })
														
 
															+    Returns:
														
 
															+        规划决策结果
														
 
															+    """
														
 
															+    agent = PlanningAgent(api_key)
														
 
															-    # 规范化结果
														
 
															-    normalized_req = normalize_additional_requirements(result.additional_requirements)
														
 
															+    try:
														
 
															+        decision = await agent.make_decision(question, industry, current_state)
														
 
															-    # 找出所有未计算的指标
														
 
															-    computed_ids = set(state["computed_metrics"].keys())
														
 
															-    required_metrics = state["metrics_requirements"]
														
 
															+        print(f"\n🧠 规划决策：{decision.decision}")
														
 
															+        print(f"   推理：{decision.reasoning[:100]}...")
														
 
															-    pending_metrics = [
														
 
															-        m for m in required_metrics
														
 
															-        if m.metric_id not in computed_ids
														
 
															-    ]
														
 
															+        if decision.metrics_to_compute:
														
 
															+            print(f"   待计算指标：{decision.metrics_to_compute}")
														
 
															-    # 关键：使用 LLM 返回的指标ID，如果没有则使用全部待计算指标
														
 
															-    if result.metrics_to_compute:
														
 
															-        pending_ids = result.metrics_to_compute
														
 
															-        valid_ids = [m.metric_id for m in pending_metrics]
														
 
															-        pending_metrics = [m for m in pending_metrics if m.metric_id in pending_ids and m.metric_id in valid_ids]
														
 
															+        return decision
														
 
															-    # 更新状态
														
 
															-    new_state = state.copy()
														
 
															-    new_state["plan_history"].append(
														
 
															-        f"Step {new_state['planning_step']}: {result.decision}"
														
 
															-    )
														
 
															-    new_state["planning_step"] += 1
														
 
															-    new_state["additional_requirements"] = normalized_req
														
 
															-
														
 
															-    # 关键：保存待计算指标ID列表
														
 
															-    if pending_metrics:
														
 
															-        pending_ids = [m.metric_id for m in pending_metrics]
														
 
															-        new_state["pending_metric_ids"] = pending_ids
														
 
															-        new_state["metrics_to_compute"] = pending_metrics  # 保存完整对象
														
 
															-
														
 
															-    # 设置路由标志
														
 
															-    if result.decision == "generate_outline":
														
 
															-        new_state["messages"].append(
														
 
															-            ("ai", f"📋 规划决策：生成大纲 (v{new_state['outline_version'] + 1})")
														
 
															-        )
														
 
															-        new_state["next_route"] = "outline_generator"
														
 
															-    elif result.decision == "compute_metrics":
														
 
															-        # 修复：确保显示正确的数量
														
 
															-        if not pending_metrics:
														
 
															-            # 如果没有待计算指标但有需求，则计算所有未完成的
														
 
															-            computed_ids = set(state["computed_metrics"].keys())
														
 
															-            pending_metrics = [m for m in required_metrics if m.metric_id not in computed_ids]
														
 
															-
														
 
															-        # 新增：如果有效待计算指标为空但还有指标未计算，说明都失败了太多次
														
 
															-        if not filtered_pending_ids and pending_ids:
														
 
															-            new_state["messages"].append(
														
 
															-                ("ai", f"⚠️ 剩余 {len(pending_ids)} 个指标已多次计算失败，将跳过这些指标直接生成报告")
														
 
															-            )
														
 
															-            new_state["next_route"] = "report_compiler"
														
 
															-            # 关键修复：返回前清理状态
														
 
															-            return convert_numpy_types(new_state)
														
 
															+    except Exception as e:
														
 
															+        print(f"⚠️ 规划决策出错: {e}，使用默认决策")
														
 
															-        new_state["messages"].append(
														
 
															-            ("ai", f"🧮 规划决策：计算 {len(pending_metrics)} 个指标 ({[m.metric_id for m in pending_metrics]})")
														
 
															-        )
														
 
															-        new_state["next_route"] = "metrics_calculator"
														
 
															-    elif result.decision == "finalize":
														
 
															-        new_state["is_complete"] = True
														
 
															-        new_state["messages"].append(
														
 
															-            ("ai", f"✅ 规划决策：信息充足，生成最终报告（覆盖率 {coverage:.2%}）")
														
 
															-        )
														
 
															-        new_state["next_route"] = "report_compiler"
														
 
															-    elif result.decision == "clarify":
														
 
															-        questions = []
														
 
															-        if normalized_req and "questions" in normalized_req:
														
 
															-            questions = normalized_req["questions"]
														
 
															-
														
 
															-        new_state["messages"].append(
														
 
															-            ("ai", f"❓ 需要澄清：{'；'.join(questions) if questions else '请提供更详细的需求'}")
														
 
															+        # 直接返回最基本的默认决策，避免复杂的默认决策逻辑
														
 
															+        return PlanningDecision(
														
 
															+            decision="finalize_report",
														
 
															+            reasoning="规划决策失败，使用默认的报告生成决策",
														
 
															+            next_actions=["生成最终报告"],
														
 
															+            metrics_to_compute=[],
														
 
															+            priority_metrics=[]
														
 
															         )
														
 
															-        new_state["next_route"] = "clarify_node"
														
 
															-    # 关键修复：返回前清理状态
														
 
															-    return convert_numpy_types(new_state)
														
 
															+    def _get_default_decision(self, current_state: Dict[str, Any]) -> PlanningDecision:
														
 
															+        """
														
 
															+        基于状态分析的默认决策逻辑
														
 
															+
														
 
															+        Args:
														
 
															+            current_state: 当前状态信息
														
 
															+
														
 
															+        Returns:
														
 
															+            默认规划决策
														
 
															+        """
														
 
															+        state_analysis = analyze_current_state(current_state)
														
 
															+
														
 
															+        if not state_analysis["has_outline"]:
														
 
															+            default_decision = PlanningDecision(
														
 
															+                decision="generate_outline",
														
 
															+                reasoning="大纲不存在，需要先生成大纲",
														
 
															+                next_actions=["生成报告大纲"],
														
 
															+                metrics_to_compute=[],
														
 
															+                priority_metrics=[]
														
 
															+            )
														
 
															+        elif state_analysis["coverage"] < 0.8 and state_analysis["valid_pending_metrics"]:
														
 
															+            # 计算指标 - 使用实际的指标ID
														
 
															+            metrics_to_compute = state_analysis["valid_pending_ids"][:5]  # 最多计算5个
														
 
															+            default_decision = PlanningDecision(
														
 
															+                decision="compute_metrics",
														
 
															+                reasoning=f"指标覆盖率{state_analysis['coverage']:.1%}，需要计算更多指标",
														
 
															+                next_actions=[f"计算指标: {', '.join(metrics_to_compute)}"],
														
 
															+                metrics_to_compute=metrics_to_compute,
														
 
															+                priority_metrics=metrics_to_compute[:2]  # 前2个为优先级
														
 
															+            )
														
 
															+        elif state_analysis["valid_pending_ids"]:
														
 
															+            # 还有指标但都失败了，生成报告
														
 
															+            default_decision = PlanningDecision(
														
 
															+                decision="finalize_report",
														
 
															+                reasoning="部分指标计算失败，但已有足够信息生成报告",
														
 
															+                next_actions=["生成最终报告"],
														
 
															+                metrics_to_compute=[],
														
 
															+                priority_metrics=[]
														
 
															+            )
														
 
															+        else:
														
 
															+            # 信息充足，生成报告
														
 
															+            default_decision = PlanningDecision(
														
 
															+                decision="finalize_report",
														
 
															+                reasoning="所有必要指标已计算完成",
														
 
															+                next_actions=["生成最终报告"],
														
 
															+                metrics_to_compute=[],
														
 
															+                priority_metrics=[]
														
 
															+            )
														
 
															+
														
 
															+        return default_decision
														
--- a/llmops/config.py
+++ b/llmops/config.py
@@ -0,0 +1,88 @@
 
															+"""
														
 
															+Big Agent 配置文件
														
 
															+================
														
 
															+
														
 
															+此配置文件包含了Big Agent系统的所有核心配置信息，包括：
														
 
															+- API密钥配置（DeepSeek等）
														
 
															+- 工作流参数设置
														
 
															+- 路径配置
														
 
															+- 环境变量加载
														
 
															+
														
 
															+主要功能：
														
 
															+1. 从环境变量或.env文件加载API密钥
														
 
															+2. 定义系统工作流的基本参数
														
 
															+3. 配置项目文件路径
														
 
															+4. 验证配置完整性
														
 
															+
														
 
															+作者: Big Agent Team
														
 
															+版本: 1.0.0
														
 
															+更新时间: 2024-12-18
														
 
															+"""
														
 
															+
														
 
															+import os
														
 
															+from dotenv import load_dotenv
														
 
															+
														
 
															+# ============================================================================
														
 
															+# 环境变量加载
														
 
															+# ============================================================================
														
 
															+# 从.env文件加载环境变量，确保敏感信息不被硬编码到源码中
														
 
															+load_dotenv()
														
 
															+
														
 
															+# ============================================================================
														
 
															+# DeepSeek API 配置
														
 
															+# ============================================================================
														
 
															+# API密钥配置 - 优先从环境变量读取，支持通过.env文件配置
														
 
															+DEEPSEEK_API_KEY = os.getenv("DEEPSEEK_API_KEY")
														
 
															+
														
 
															+# API基础URL配置 - 默认使用DeepSeek官方API地址
														
 
															+DEEPSEEK_BASE_URL = os.getenv("DEEPSEEK_BASE_URL", "https://api.deepseek.com")
														
 
															+
														
 
															+# ============================================================================
														
 
															+# 项目路径配置
														
 
															+# ============================================================================
														
 
															+# 定义项目中各个功能模块的数据存储路径
														
 
															+PATHS = {
														
 
															+    "json_configs": "json_files",      # JSON配置文件目录 - 存储指标计算配置
														
 
															+    "knowledge_base": "knowledge_base", # 知识库目录 - 存储生成的知识文档
														
 
															+    "logs": "logs",                   # 日志目录 - 存储系统运行日志
														
 
															+    "api_results": "api_results"      # API结果目录 - 存储所有API调用结果
														
 
															+}
														
 
															+
														
 
															+# ============================================================================
														
 
															+# 目录初始化
														
 
															+# ============================================================================
														
 
															+# 确保所有必要的目录都存在，避免文件操作时的路径错误
														
 
															+for path in PATHS.values():
														
 
															+    os.makedirs(path, exist_ok=True)
														
 
															+
														
 
															+# ============================================================================
														
 
															+# 配置验证函数
														
 
															+# ============================================================================
														
 
															+def validate_config():
														
 
															+    """
														
 
															+    验证系统配置是否正确
														
 
															+
														
 
															+    此函数检查所有必要的配置项是否已正确设置，包括：
														
 
															+    - API密钥是否存在
														
 
															+    - API URL格式是否正确
														
 
															+
														
 
															+    Returns:
														
 
															+        list: 配置错误列表，如果为空则表示配置正确
														
 
															+    """
														
 
															+    errors = []
														
 
															+
														
 
															+    # 检查API密钥
														
 
															+    if not DEEPSEEK_API_KEY:
														
 
															+        errors.append("DEEPSEEK_API_KEY环境变量未设置")
														
 
															+
														
 
															+    # 检查API URL格式
														
 
															+    if not DEEPSEEK_BASE_URL.startswith("https://"):
														
 
															+        errors.append("DEEPSEEK_BASE_URL必须是HTTPS URL")
														
 
															+
														
 
															+    return errors
														
 
															+
														
 
															+# ============================================================================
														
 
															+# 配置状态标识
														
 
															+# ============================================================================
														
 
															+# 全局配置状态标识，True表示配置正确，False表示存在配置问题
														
 
															+CONFIG_VALID = len(validate_config()) == 0
														
--- a/llmops/workflow_state.py
+++ b/llmops/workflow_state.py
@@ -0,0 +1,328 @@
 
															+"""
														
 
															+整合的工作流状态定义
														
 
															+===================
														
 
															+
														
 
															+此文件定义了整合了多个Agent的工作流状态，兼容现有的Big Agent状态管理和新增的报告生成Agent状态。
														
 
															+
														
 
															+状态层次：
														
 
															+1. 输入层：用户查询和数据
														
 
															+2. 意图层：意图识别结果
														
 
															+3. 规划层：规划决策和大纲生成
														
 
															+4. 计算层：指标计算结果
														
 
															+5. 结果层：最终报告生成
														
 
															+6. 对话层：消息历史和错误处理
														
 
															+
														
 
															+兼容性：
														
 
															+- 兼容现有的Big Agent WorkflowState
														
 
															+- 整合来自other_agents的AgentState
														
 
															+- 支持扩展新的Agent状态需求
														
 
															+
														
 
															+作者: Big Agent Team
														
 
															+版本: 1.0.0
														
 
															+创建时间: 2024-12-20
														
 
															+"""
														
 
															+
														
 
															+from typing import TypedDict, List, Dict, Any, Optional
														
 
															+from datetime import datetime
														
 
															+from langchain_core.messages import BaseMessage
														
 
															+from pydantic import BaseModel, Field
														
 
															+
														
 
															+
														
 
															+# ============= 数据模型 =============
														
 
															+
														
 
															+class MetricRequirement(BaseModel):
														
 
															+    """指标需求定义"""
														
 
															+    metric_id: str = Field(description="指标唯一标识，如 'total_income_jan'")
														
 
															+    metric_name: str = Field(description="指标中文名称")
														
 
															+    calculation_logic: str = Field(description="计算逻辑描述")
														
 
															+    required_fields: List[str] = Field(description="所需字段")
														
 
															+    dependencies: List[str] = Field(default_factory=list, description="依赖的其他指标ID")
														
 
															+
														
 
															+
														
 
															+class ReportSection(BaseModel):
														
 
															+    """报告大纲章节"""
														
 
															+    section_id: str = Field(description="章节ID")
														
 
															+    title: str = Field(description="章节标题")
														
 
															+    description: str = Field(description="章节内容要求")
														
 
															+    metrics_needed: List[str] = Field(description="所需指标ID列表")
														
 
															+
														
 
															+
														
 
															+class ReportOutline(BaseModel):
														
 
															+    """完整报告大纲"""
														
 
															+    report_title: str = Field(description="报告标题")
														
 
															+    sections: List[ReportSection] = Field(description="章节列表")
														
 
															+    global_metrics: List[MetricRequirement] = Field(description="全局指标列表")
														
 
															+
														
 
															+
														
 
															+# ============= 序列化工具函数 =============
														
 
															+
														
 
															+def convert_numpy_types(obj: Any) -> Any:
														
 
															+    """
														
 
															+    递归转换所有numpy类型为Python原生类型
														
 
															+    确保所有数据可序列化
														
 
															+    """
														
 
															+    if isinstance(obj, dict):
														
 
															+        return {str(k): convert_numpy_types(v) for k, v in obj.items()}
														
 
															+    elif isinstance(obj, list):
														
 
															+        return [convert_numpy_types(item) for item in obj]
														
 
															+    elif isinstance(obj, tuple):
														
 
															+        return tuple(convert_numpy_types(item) for item in obj)
														
 
															+    elif isinstance(obj, set):
														
 
															+        return {convert_numpy_types(item) for item in obj}
														
 
															+    elif hasattr(obj, 'item') and hasattr(obj, 'dtype'):  # numpy scalar
														
 
															+        return convert_numpy_types(obj.item())
														
 
															+    else:
														
 
															+        return obj
														
 
															+
														
 
															+
														
 
															+# ============= 整合的工作流状态定义 =============
														
 
															+
														
 
															+class IntegratedWorkflowState(TypedDict):
														
 
															+    """整合的工作流状态定义 - 兼容多个Agent系统"""
														
 
															+
														
 
															+    # === 基础输入层 (兼容Big Agent) ===
														
 
															+    user_input: str
														
 
															+    question: str  # 别名，兼容报告生成Agent
														
 
															+
														
 
															+    industry: str  # 行业
														
 
															+
														
 
															+    # === 数据层 ===
														
 
															+    data_set: List[Dict[str, Any]]  # 报告生成Agent的数据格式
														
 
															+    transactions_df: Optional[Any]  # 可选的数据框格式
														
 
															+
														
 
															+    # === 意图识别层 (Big Agent原有) ===
														
 
															+    intent_result: Optional[Dict[str, Any]]
														
 
															+
														
 
															+    # === 规划和大纲层 (新增) ===
														
 
															+    planning_step: int
														
 
															+    plan_history: List[str]
														
 
															+    outline_draft: Optional[ReportOutline]
														
 
															+    outline_version: int
														
 
															+    outline_ready: bool
														
 
															+
														
 
															+    # === 指标计算层 ===
														
 
															+    metrics_requirements: List[MetricRequirement]  # 报告生成Agent格式
														
 
															+    computed_metrics: Dict[str, Any]  # 计算结果
														
 
															+    metrics_cache: Dict[str, Any]  # 缓存
														
 
															+    pending_metric_ids: List[str]  # 待计算指标ID
														
 
															+    failed_metric_attempts: Dict[str, int]  # 失败统计
														
 
															+    calculation_results: Optional[Dict[str, Any]]  # Big Agent格式的计算结果
														
 
															+
														
 
															+    # === 结果层 ===
														
 
															+    report_draft: Dict[str, Any]  # 报告草稿
														
 
															+    knowledge_result: Optional[Dict[str, Any]]  # Big Agent知识沉淀结果
														
 
															+    is_complete: bool
														
 
															+    completeness_score: float
														
 
															+    answer: Optional[str]  # 最终答案
														
 
															+
														
 
															+    # === 对话和消息层 ===
														
 
															+    messages: List[Dict[str, Any]]  # Big Agent消息格式
														
 
															+    current_node: str
														
 
															+    session_id: str
														
 
															+    next_route: str
														
 
															+
														
 
															+    # === 错误处理层 ===
														
 
															+    errors: List[str]
														
 
															+    last_decision: str
														
 
															+
														
 
															+    # === 时间跟踪层 ===
														
 
															+    start_time: str
														
 
															+    end_time: Optional[str]
														
 
															+    api_result: Dict[str, Any]  # 存储所有API调用结果
														
 
															+
														
 
															+
														
 
															+# ============= 状态创建和初始化函数 =============
														
 
															+
														
 
															+def create_initial_integrated_state(question: str, industry: str, data: List[Dict[str, Any]], session_id: str = None) -> IntegratedWorkflowState:
														
 
															+    """
														
 
															+    创建初始的整合状态
														
 
															+
														
 
															+    Args:
														
 
															+        question: 用户查询
														
 
															+        data: 数据集
														
 
															+        session_id: 会话ID
														
 
															+
														
 
															+    Returns:
														
 
															+        初始化后的状态
														
 
															+    """
														
 
															+    current_time = datetime.now().isoformat()
														
 
															+    session = session_id or f"session_{int(datetime.now().timestamp())}"
														
 
															+
														
 
															+    return {
														
 
															+        # 基础输入
														
 
															+        "user_input": question,
														
 
															+        "question": question,
														
 
															+        "industry": industry,
														
 
															+
														
 
															+        # 数据层
														
 
															+        "data_set": convert_numpy_types(data),
														
 
															+        "transactions_df": None,
														
 
															+
														
 
															+        # 意图识别层
														
 
															+        "intent_result": None,
														
 
															+
														
 
															+        # 规划和大纲层
														
 
															+        "planning_step": 0,
														
 
															+        "plan_history": [],
														
 
															+        "outline_draft": None,
														
 
															+        "outline_version": 0,
														
 
															+        "outline_ready": False,
														
 
															+
														
 
															+        # 指标计算层
														
 
															+        "metrics_requirements": [],
														
 
															+        "computed_metrics": {},
														
 
															+        "metrics_cache": {},
														
 
															+        "pending_metric_ids": [],
														
 
															+        "failed_metric_attempts": {},
														
 
															+        "calculation_results": None,
														
 
															+
														
 
															+        # 结果层
														
 
															+        "report_draft": {},
														
 
															+        "knowledge_result": None,
														
 
															+        "is_complete": False,
														
 
															+        "completeness_score": 0.0,
														
 
															+        "answer": None,
														
 
															+
														
 
															+        # 对话和消息层
														
 
															+        "messages": [{
														
 
															+            "role": "user",
														
 
															+            "content": question,
														
 
															+            "timestamp": current_time
														
 
															+        }],
														
 
															+        "current_node": "start",
														
 
															+        "session_id": session,
														
 
															+        "next_route": "planning_node",
														
 
															+
														
 
															+        # 错误处理层
														
 
															+        "errors": [],
														
 
															+        "last_decision": "init",
														
 
															+
														
 
															+        # 时间跟踪层
														
 
															+        "start_time": current_time,
														
 
															+        "end_time": None,
														
 
															+        "api_result": {},  # 存储所有API调用结果
														
 
															+
														
 
															+        # 计算模式配置层
														
 
															+        "use_rules_engine_only": False,
														
 
															+        "use_traditional_engine_only": False
														
 
															+    }
														
 
															+
														
 
															+
														
 
															+def is_state_ready_for_calculation(state: IntegratedWorkflowState) -> bool:
														
 
															+    """
														
 
															+    检查状态是否准备好进行指标计算
														
 
															+
														
 
															+    Args:
														
 
															+        state: 当前状态
														
 
															+
														
 
															+    Returns:
														
 
															+        是否准备好
														
 
															+    """
														
 
															+    return (
														
 
															+        state.get("outline_draft") is not None and
														
 
															+        len(state.get("metrics_requirements", [])) > 0 and
														
 
															+        len(state.get("pending_metric_ids", [])) > 0
														
 
															+    )
														
 
															+
														
 
															+
														
 
															+def get_calculation_progress(state: IntegratedWorkflowState) -> Dict[str, Any]:
														
 
															+    """
														
 
															+    获取指标计算进度信息
														
 
															+
														
 
															+    Args:
														
 
															+        state: 当前状态
														
 
															+
														
 
															+    Returns:
														
 
															+        进度信息
														
 
															+    """
														
 
															+    required = len(state.get("metrics_requirements", []))
														
 
															+    computed = len(state.get("computed_metrics", {}))
														
 
															+    pending = len(state.get("pending_metric_ids", []))
														
 
															+
														
 
															+    return {
														
 
															+        "required_count": required,
														
 
															+        "computed_count": computed,
														
 
															+        "pending_count": pending,
														
 
															+        "coverage_rate": computed / required if required > 0 else 0,
														
 
															+        "is_complete": computed >= required * 0.8  # 80%覆盖率视为完成
														
 
															+    }
														
 
															+
														
 
															+
														
 
															+def update_state_with_outline_generation(state: IntegratedWorkflowState, outline: ReportOutline) -> IntegratedWorkflowState:
														
 
															+    """
														
 
															+    使用大纲生成结果更新状态
														
 
															+
														
 
															+    Args:
														
 
															+        state: 当前状态
														
 
															+        outline: 生成的大纲
														
 
															+
														
 
															+    Returns:
														
 
															+        更新后的状态
														
 
															+    """
														
 
															+    new_state = state.copy()
														
 
															+    new_state["outline_draft"] = outline
														
 
															+    new_state["outline_version"] += 1
														
 
															+    new_state["outline_ready"] = True
														
 
															+    new_state["metrics_requirements"] = outline.global_metrics
														
 
															+    new_state["pending_metric_ids"] = [m.metric_id for m in outline.global_metrics]
														
 
															+
														
 
															+    # 添加消息
														
 
															+    new_state["messages"].append({
														
 
															+        "role": "assistant",
														
 
															+        "content": f"✅ 大纲生成完成 v{new_state['outline_version']}：{outline.report_title}",
														
 
															+        "timestamp": datetime.now().isoformat()
														
 
															+    })
														
 
															+
														
 
															+    return new_state
														
 
															+
														
 
															+
														
 
															+def update_state_with_planning_decision(state: IntegratedWorkflowState, decision: Dict[str, Any]) -> IntegratedWorkflowState:
														
 
															+    """
														
 
															+    使用规划决策结果更新状态
														
 
															+
														
 
															+    Args:
														
 
															+        state: 当前状态
														
 
															+        decision: 规划决策
														
 
															+
														
 
															+    Returns:
														
 
															+        更新后的状态
														
 
															+    """
														
 
															+    new_state = state.copy()
														
 
															+    new_state["planning_step"] += 1
														
 
															+    new_state["last_decision"] = decision.get("decision", "unknown")
														
 
															+    new_state["next_route"] = decision.get("next_route", "planning_node")
														
 
															+
														
 
															+    # 如果有待计算指标，更新待计算列表
														
 
															+    if decision.get("metrics_to_compute"):
														
 
															+        new_state["pending_metric_ids"] = decision["metrics_to_compute"]
														
 
															+
														
 
															+    # 添加规划历史
														
 
															+    new_state["plan_history"].append(
														
 
															+        f"Step {new_state['planning_step']}: {decision.get('decision', 'unknown')}"
														
 
															+    )
														
 
															+
														
 
															+    return new_state
														
 
															+
														
 
															+
														
 
															+def finalize_state_with_report(state: IntegratedWorkflowState, final_report: Dict[str, Any]) -> IntegratedWorkflowState:
														
 
															+    """
														
 
															+    使用最终报告完成状态
														
 
															+
														
 
															+    Args:
														
 
															+        state: 当前状态
														
 
															+        final_report: 最终报告
														
 
															+
														
 
															+    Returns:
														
 
															+        完成的状态
														
 
															+    """
														
 
															+    new_state = state.copy()
														
 
															+    new_state["report_draft"] = final_report
														
 
															+    new_state["is_complete"] = True
														
 
															+    new_state["answer"] = final_report
														
 
															+    new_state["end_time"] = datetime.now().isoformat()
														
 
															+
														
 
															+    # 计算完整性分数
														
 
															+    progress = get_calculation_progress(new_state)
														
 
															+    new_state["completeness_score"] = progress["coverage_rate"]
														
 
															+
														
 
															+    return new_state
Autor	SHA1 Mensagem	Data
JiaQiang	740c3f723d Merge remote-tracking branch 'origin/master'	há 1 semana atrás
JiaQiang	3974dfd443 配置类	há 1 semana atrás
JiaQiang	3f83f56356 deepseek api_key环境设置	há 1 semana atrás
JiaQiang	b58d5ebd8f 图状态	há 1 semana atrás
JiaQiang	b3b426aa3e 指标计算智能体	há 1 semana atrás
JiaQiang	d4b9658338 指标计算智能体	há 1 semana atrás
JiaQiang	996fbc71d6 大纲生成智能体	há 1 semana atrás
JiaQiang	bb2a88db45 规划智能体	há 1 semana atrás
	`@@ -0,0 +1 @@`
			`+DEEPSEEK_API_KEY=sk-438668d443224063adbb1d295fe44a9f`