  1. """
  2. 完整的智能体工作流 (Complete Agent Flow)
  3. =====================================
  4. 此工作流整合了规划、大纲生成和指标计算四个核心智能体,实现完整的报告生成流程。
  5. 包含的智能体:
  6. 1. PlanningAgent (规划智能体) - 分析状态并做出决策
  7. 2. OutlineAgent (大纲生成智能体) - 生成报告结构和指标需求
  8. 3. MetricCalculationAgent (指标计算智能体) - 执行标准指标计算
  9. 4. RulesEngineMetricCalculationAgent (规则引擎指标计算智能体) - 执行规则引擎指标计算
  10. 工作流程:
  11. 1. 规划节点 → 分析当前状态,决定下一步行动
  12. 2. 大纲生成节点 → 生成报告大纲和指标需求
  13. 3. 指标判断节点 → 根据大纲确定需要计算的指标
  14. 4. 指标计算节点 → 执行具体的指标计算任务
  15. 技术特点:
  16. - 基于LangGraph的状态机工作流
  17. - 支持条件路由和状态管理
  18. - 完善的错误处理机制
  19. - 详细的执行日志记录
  20. 作者: Big Agent Team
  21. 版本: 1.0.0
  22. 创建时间: 2024-12-20
  23. """
  24. import asyncio
  25. from typing import Dict, Any, List
  26. from datetime import datetime
  27. from langgraph.graph import StateGraph, END
  28. from llmops.workflow_state import (
  29. IntegratedWorkflowState,
  30. create_initial_integrated_state,
  31. get_calculation_progress,
  32. update_state_with_outline_generation,
  33. update_state_with_planning_decision,
  34. update_state_with_data_classified,
  35. convert_numpy_types,
  36. update_state_with_data_standardize,
  37. update_state_with_report,
  38. update_state_with_anomaly_recognition
  39. )
  40. from llmops.agents.outline_agent import generate_report_outline
  41. from llmops.agents.planning_agent import plan_next_action
  42. from llmops.agents.rules_engine_metric_calculation_agent import RulesEngineMetricCalculationAgent
  43. from llmops.agents.anomaly_recognizer_agent import AnomalyRecognitionAgent
  44. from llmops.agents.data_manager import DataManager
  45. import os
  46. from llmops.agents.data_classify_agent import data_classify
  47. from llmops.config import multimodal_api_url, LLM_API_KEY, LLM_BASE_URL, LLM_MODEL_NAME
  48. from llmops.agents.data_stardard import data_standardize
  49. from llmops.agents.report_agent import generate_report_section_content
  50. class CompleteAgentFlow:
  51. """完整的智能体工作流"""
  52. def __init__(self, api_key: str, base_url: str = "https://api.deepseek.com", model_name: str = "deepseek-chat"):
  53. """
  54. 初始化完整的工作流
  55. Args:
  56. api_key: DeepSeek API密钥
  57. base_url: DeepSeek API基础URL
  58. model_name: 模型名称
  59. """
  60. self.api_key = api_key
  61. self.base_url = base_url
  62. self.model_name = model_name
  63. # 初始规则引擎智能体
  64. self.rules_engine_agent = RulesEngineMetricCalculationAgent(api_key, base_url)
  65. # 异常识别智能体
  66. self.anomaly_recognizer = None
  67. # 创建工作流图
  68. self.workflow = self._create_workflow()
  69. def _create_workflow(self) -> StateGraph:
  70. """创建LangGraph工作流"""
  71. workflow = StateGraph(IntegratedWorkflowState)
  72. # 添加节点
  73. workflow.add_node("planning_node", self._planning_node)
  74. workflow.add_node("outline_generator", self._outline_generator_node)
  75. workflow.add_node("metric_calculator", self._metric_calculator_node)
  76. workflow.add_node("data_classify", self._data_classify_node)
  77. workflow.add_node("data_standardize", self._data_standardize_node)
  78. workflow.add_node("anomaly_recognition", self._anomaly_recognition_node)
  79. workflow.add_node("report_generator", self._report_generator_node)
  80. # 设置入口点
  81. workflow.set_entry_point("planning_node")
  82. # 添加条件边 - 基于规划决策路由
  83. workflow.add_conditional_edges(
  84. "planning_node",
  85. self._route_from_planning,
  86. {
  87. "outline_generator": "outline_generator",
  88. "metric_calculator": "metric_calculator",
  89. "data_classify": "data_classify",
  90. "data_standardize": "data_standardize",
  91. "anomaly_recognition": "anomaly_recognition",
  92. "report_generator": "report_generator",
  93. END: END
  94. }
  95. )
  96. # 从各个节点返回规划节点重新决策
  97. workflow.add_edge("data_standardize", "planning_node")
  98. workflow.add_edge("data_classify", "planning_node")
  99. workflow.add_edge("outline_generator", "planning_node")
  100. workflow.add_edge("metric_calculator", "planning_node")
  101. workflow.add_edge("anomaly_recognition", "planning_node")
  102. workflow.add_edge("report_generator", END)
  103. return workflow
  104. def _route_from_planning(self, state: IntegratedWorkflowState) -> str:
  105. """
  106. 从规划节点路由到下一个节点
  107. Args:
  108. state: 当前状态
  109. Returns:
  110. 目标节点名称
  111. """
  112. print(f"\n🔍 [路由决策] 步骤={state['planning_step']}, "
  113. f"数据集分类打标数量={len(state.get('data_set_classified', []))}",
  114. f"大纲={state.get('outline_draft') is not None}, "
  115. f"指标需求={len(state.get('metrics_requirements', []))}")
  116. # 防止无限循环
  117. if state['planning_step'] > 30:
  118. print("⚠️ 规划步骤超过30次,强制结束流程")
  119. return END
  120. # 数据标准化状态 0 → 数据标准化
  121. if state.get("is_standardized", 0) == 0:
  122. print("→ 路由到 data_standardize(数据标准化)")
  123. return "data_standardize"
  124. # 数据分类打标数量为0 → 分类打标
  125. if len(state.get("data_set_classified", [])) == 0:
  126. print("→ 路由到 data_classify(分类打标)")
  127. return "data_classify"
  128. # 异常识别未完成且有标准化数据 → 异常识别
  129. if not state.get("anomaly_recognition_completed", False) and state.get("standardized_file_path"):
  130. print("→ 路由到 anomaly_recognition(异常识别)")
  131. return "anomaly_recognition"
  132. # 如果大纲为空 → 生成大纲
  133. if not state.get("outline_draft"):
  134. print("→ 路由到 outline_generator(生成大纲)")
  135. return "outline_generator"
  136. # 如果指标需求为空但大纲已生成 → 评估指标需求
  137. if not state.get("metrics_requirements") and state.get("outline_draft"):
  138. print("→ 路由到 metric_evaluator(评估指标需求)")
  139. return "metric_evaluator"
  140. # 计算覆盖率
  141. progress = get_calculation_progress(state)
  142. coverage = progress["coverage_rate"]
  143. print(f" 指标覆盖率 = {coverage:.2%}")
  144. # 如果有待计算指标且覆盖率 < 100% → 计算指标
  145. if state.get("pending_metric_ids") and coverage < 1.0:
  146. print(f"→ 路由到 metric_calculator(计算指标,覆盖率={coverage:.2%})")
  147. return "metric_calculator"
  148. # 检查是否应该结束流程
  149. pending_ids = state.get("pending_metric_ids", [])
  150. failed_attempts = state.get("failed_metric_attempts", {})
  151. max_retries = 3
  152. # 计算还有哪些指标可以重试(未达到最大重试次数)
  153. retryable_metrics = [
  154. mid for mid in pending_ids
  155. if failed_attempts.get(mid, 0) < max_retries
  156. ]
  157. # 如果覆盖率 >= 80%,或者没有可重试的指标 → 生成报告
  158. if coverage >= 0.8 or not retryable_metrics:
  159. reason = "覆盖率达到80%" if coverage >= 0.8 else "没有可重试指标"
  160. print(f"→ 指标计算完成,进入生成报告(覆盖率={coverage:.2%},原因:{reason})")
  161. return "report_generator"
  162. # 默认返回规划节点
  163. return "planning_node"
  164. async def _planning_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  165. """规划节点:分析状态并做出决策"""
  166. try:
  167. print("🧠 正在执行规划分析...")
  168. # 使用规划智能体做出决策
  169. decision = await plan_next_action(
  170. question=state["question"],
  171. industry=state["industry"],
  172. current_state=state,
  173. api_key=self.api_key,
  174. base_url=self.base_url,
  175. model_name=self.model_name
  176. )
  177. # 更新状态
  178. new_state = update_state_with_planning_decision(state, {
  179. "decision": decision.decision,
  180. "next_route": self._decision_to_route(decision.decision),
  181. "metrics_to_compute": decision.metrics_to_compute
  182. })
  183. # 添加决策消息
  184. decision_msg = self._format_decision_message(decision)
  185. new_state["messages"].append({
  186. "role": "assistant",
  187. "content": decision_msg,
  188. "timestamp": datetime.now().isoformat()
  189. })
  190. print(f"✅ 规划决策完成:{decision.decision}")
  191. return convert_numpy_types(new_state)
  192. except Exception as e:
  193. print(f"❌ 规划节点执行失败: {e}")
  194. new_state = state.copy()
  195. new_state["errors"].append(f"规划节点错误: {str(e)}")
  196. return convert_numpy_types(new_state)
  197. async def _outline_generator_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  198. """大纲生成节点"""
  199. try:
  200. print("📝 正在生成报告大纲...")
  201. # 生成大纲(支持重试机制)
  202. outline = await generate_report_outline(
  203. question=state["question"],
  204. industry=state["industry"],
  205. sample_data=state["data_set"][:3], # 使用前3个样本
  206. api_key=self.api_key,
  207. base_url=self.base_url,
  208. model_name=self.model_name,
  209. max_retries=3, # 最多重试5次
  210. retry_delay=3.0 # 每次重试间隔3秒
  211. )
  212. # 更新状态
  213. new_state = update_state_with_outline_generation(state, outline)
  214. print(f"✅ 大纲生成完成:{outline.report_title}")
  215. print(f" 包含 {len(outline.sections)} 个章节,{len(outline.global_metrics)} 个指标需求")
  216. # 分析并打印AI的指标选择推理过程
  217. self._print_ai_selection_analysis(outline)
  218. return convert_numpy_types(new_state)
  219. except Exception as e:
  220. print(f"❌ 大纲生成失败: {e}")
  221. new_state = state.copy()
  222. new_state["errors"].append(f"大纲生成错误: {str(e)}")
  223. return convert_numpy_types(new_state)
  224. async def _data_classify_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  225. """数据分类打标节点"""
  226. try:
  227. standardized_file_path = state["standardized_file_path"]
  228. file_name = os.path.basename(standardized_file_path)
  229. # 读取标准化后的数据文件
  230. data_set = DataManager.load_data_from_csv_file(standardized_file_path)
  231. # 加载测试数据集并展示两条样例
  232. print(f"📊 读取标准化数据文件: {file_name}, 加载 {len(data_set)} 条记录")
  233. print(f"测试数据样例: {data_set[0:1]}")
  234. print("📝 正在对数据进行分类打标...")
  235. # 对数据进行分类打标
  236. data_set_classified = await data_classify(
  237. industry=state["industry"],
  238. data_set=data_set,
  239. file_name=state["file_name"]
  240. )
  241. # 更新状态
  242. new_state = update_state_with_data_classified(state, data_set_classified)
  243. print(f"✅ 数据分类打标完成,打标记录数: {len(data_set_classified)}")
  244. return convert_numpy_types(new_state)
  245. except Exception as e:
  246. print(f"❌ 数据分类打标失败: {e}")
  247. new_state = state.copy()
  248. new_state["errors"].append(f"数据分类打标错误: {str(e)}")
  249. return convert_numpy_types(new_state)
  250. async def _data_standardize_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  251. """数据标准化节点"""
  252. try:
  253. print("📝 正在对数据进行标准化处理...")
  254. # 数据标准化处理
  255. result = await data_standardize(
  256. api_key=self.api_key,
  257. base_url=self.base_url,
  258. model_name=self.model_name,
  259. multimodal_api_url=multimodal_api_url,
  260. input_file_path=state["original_file_path"]
  261. )
  262. is_succ = 0
  263. standardized_file_path = None
  264. if result["status"] == "success": # 数据标准化成功
  265. is_succ = 1
  266. standardized_file_path = result["file_path"]
  267. # 更新状态
  268. new_state = update_state_with_data_standardize(state, is_succ, standardized_file_path)
  269. print(f"✅ 数据标准化完成,处理状态: {is_succ},标准化文件路径:{standardized_file_path}")
  270. return convert_numpy_types(new_state)
  271. except Exception as e:
  272. print(f"❌ 数据标准化失败: {e}")
  273. new_state = state.copy()
  274. new_state["errors"].append(f"数据标准化错误: {str(e)}")
  275. return convert_numpy_types(new_state)
  276. async def _report_generator_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  277. """报告完成节点:生成最终报告"""
  278. try:
  279. print("📋 正在生成最终报告...")
  280. # 获取大纲和计算结果
  281. outline = state.get("outline_draft")
  282. computed_metrics = state.get("computed_metrics", {})
  283. anomaly_summary = state.get("anomaly_summary", {})
  284. print(f"已经完成的计算指标:{computed_metrics}")
  285. print(f"异常识别结果:{anomaly_summary.get('total_anomalies', 0)}条异常")
  286. if not outline:
  287. raise ValueError("没有可用的报告大纲")
  288. # 生成最终报告
  289. final_report = {
  290. "title": outline.report_title,
  291. "generated_at": datetime.now().isoformat(),
  292. "summary": {
  293. "total_sections": len(outline.sections),
  294. "total_metrics_required": len(outline.global_metrics),
  295. "total_metrics_computed": len(computed_metrics),
  296. "planning_steps": state.get("planning_step", 0),
  297. "completion_rate": len(computed_metrics) / len(
  298. outline.global_metrics) if outline.global_metrics else 0
  299. },
  300. "sections": [],
  301. # "metrics_detail": {},
  302. "anomaly_analysis": anomaly_summary
  303. }
  304. chapter_num = 0
  305. total_sections = len(outline.sections)
  306. # 构建章节内容
  307. for section in outline.sections:
  308. section_content = {
  309. "section_id": section.section_id,
  310. "title": section.title,
  311. "description": section.description,
  312. "metrics": {}
  313. }
  314. # 添加该章节的指标数据
  315. for metric_id in section.metrics_needed:
  316. if metric_id in computed_metrics:
  317. section_content["metrics"][metric_id] = computed_metrics[metric_id]
  318. else:
  319. if not metric_id.startswith("metric-"):
  320. # 指标缺少metric前缀,进行补充
  321. section_content["metrics"][metric_id] = computed_metrics["metric-"+metric_id]
  322. else:
  323. section_content["metrics"][metric_id] = "数据缺失"
  324. chapter_num += 1
  325. # 生成章节内容
  326. chapter_content = await generate_report_section_content(api_key=self.api_key, base_url=self.base_url, model_name=self.model_name, section=section_content, chapter_num=chapter_num, total_sections=total_sections)
  327. print(f"生成章节内容:{chapter_content}")
  328. section_content["content"] = chapter_content
  329. final_report["sections"].append(section_content)
  330. # 添加详细的指标信息
  331. # for metric_req in outline.global_metrics:
  332. # metric_id = metric_req.metric_id
  333. # final_report["metrics_detail"][metric_id] = {
  334. # "name": metric_req.metric_name,
  335. # "logic": metric_req.calculation_logic,
  336. # "required_fields": metric_req.required_fields,
  337. # "computed": metric_id in computed_metrics,
  338. # "value": computed_metrics.get(metric_id, {}).get("value", "N/A")
  339. # }
  340. # 添加异常识别章节(如果存在异常)
  341. if anomaly_summary.get('total_anomalies', 0) > 0:
  342. anomaly_section = {
  343. "section_id": "anomaly_analysis",
  344. "title": "交易异常识别分析",
  345. "description": "基于交易流水数据识别的异常交易情况分析",
  346. "content": self._generate_anomaly_analysis_content(anomaly_summary),
  347. "metrics": {}
  348. }
  349. final_report["sections"].append(anomaly_section)
  350. # 更新状态
  351. new_state = update_state_with_report(state, final_report)
  352. # 添加完成消息
  353. new_state["messages"].append({
  354. "role": "assistant",
  355. "content": f"🎉 完整报告生成流程完成:{outline.report_title}",
  356. "timestamp": datetime.now().isoformat()
  357. })
  358. print(f"✅ 最终报告生成完成:{outline.report_title}")
  359. print(f" 章节数:{len(final_report['sections'])}")
  360. print(f" 计算指标:{len(computed_metrics)}/{len(outline.global_metrics)}")
  361. print(f" 识别异常:{anomaly_summary.get('total_anomalies', 0)}条")
  362. print(".2%")
  363. return convert_numpy_types(new_state)
  364. except Exception as e:
  365. print(f"❌ 报告完成失败: {e}")
  366. new_state = state.copy()
  367. new_state["errors"].append(f"报告完成错误: {str(e)}")
  368. return convert_numpy_types(new_state)
  369. def _generate_anomaly_analysis_content(self, anomaly_summary: Dict[str, Any]) -> str:
  370. """生成异常分析章节内容"""
  371. total_anomalies = anomaly_summary.get('total_anomalies', 0)
  372. anomaly_ratio = anomaly_summary.get('anomaly_ratio', '0%')
  373. content = f"""
  374. ## 交易异常识别分析
  375. ### 异常识别概况
  376. 本次分析共识别出 **{total_anomalies}** 条异常交易记录,异常识别率为 **{anomaly_ratio}**。
  377. ### 异常类型分布
  378. """
  379. # 添加异常类型分布
  380. anomaly_distribution = anomaly_summary.get('anomaly_distribution', {})
  381. if anomaly_distribution:
  382. content += "\n| 异常类型 | 数量 | 占比 |\n|----------|------|------|\n"
  383. for anomaly_type, count in anomaly_distribution.items():
  384. percentage = (count / total_anomalies * 100) if total_anomalies > 0 else 0
  385. content += f"| {anomaly_type} | {count} | {percentage:.1f}% |\n"
  386. # 添加严重程度分布
  387. severity_distribution = anomaly_summary.get('severity_distribution', {})
  388. if severity_distribution:
  389. content += "\n### 严重程度分布\n"
  390. for severity, count in severity_distribution.items():
  391. percentage = (count / total_anomalies * 100) if total_anomalies > 0 else 0
  392. content += f"- **{severity.upper()}** 级别:{count} 条 ({percentage:.1f}%)\n"
  393. content += """
  394. ### 分析建议
  395. 1. 建议对高风险异常进行重点核查
  396. 2. 结合业务背景判断异常交易的真实性
  397. 3. 建立异常交易监控机制
  398. """
  399. return content
  400. def _print_ai_selection_analysis(self, outline):
  401. """打印AI指标选择的推理过程分析 - 完全通用版本"""
  402. print()
  403. print('╔══════════════════════════════════════════════════════════════════════════════╗')
  404. print('║ 🤖 AI指标选择分析 ║')
  405. print('╚══════════════════════════════════════════════════════════════════════════════╝')
  406. print()
  407. # 计算总指标数 - outline可能是字典格式,需要适配
  408. if hasattr(outline, 'sections'):
  409. # Pydantic模型格式
  410. total_metrics = sum(len(section.metrics_needed) for section in outline.sections)
  411. sections = outline.sections
  412. else:
  413. # 字典格式
  414. total_metrics = sum(len(section.get('metrics_needed', [])) for section in outline.get('sections', []))
  415. sections = outline.get('sections', [])
  416. # 获取可用指标总数(这里可以从状态或其他地方动态获取)
  417. available_count = 26 # 这个可以从API调用中动态获取
  418. print('📊 选择统计:')
  419. print(' ┌─────────────────────────────────────────────────────────────────────┐')
  420. print(' │ 系统可用指标: {}个 │ AI本次选择: {}个 │ 选择率: {:.1f}% │'.format(
  421. available_count, total_metrics, total_metrics/available_count*100 if available_count > 0 else 0))
  422. print(' └─────────────────────────────────────────────────────────────────────┘')
  423. print()
  424. print('📋 AI决策过程:')
  425. print(' 大模型已根据用户需求从{}个可用指标中选择了{}个最相关的指标。'.format(available_count, total_metrics))
  426. print(' 选择过程完全由大模型基于语义理解和业务逻辑进行,不涉及任何硬编码规则。')
  427. print()
  428. print('🔍 选择结果:')
  429. print(' • 总章节数: {}个'.format(len(sections)))
  430. print(' • 平均每章节指标数: {:.1f}个'.format(total_metrics/len(sections) if sections else 0))
  431. print(' • 选择策略: 基于用户需求的相关性分析')
  432. print()
  433. print('🎯 AI Agent核心能力:')
  434. print(' • 语义理解: 理解用户查询的业务意图和分析需求')
  435. print(' • 智能筛选: 从海量指标中挑选最相关的组合')
  436. print(' • 逻辑推理: 为每个分析维度提供充分的选择依据')
  437. print(' • 动态适配: 根据不同场景自动调整选择策略')
  438. print()
  439. print('💡 关键洞察:')
  440. print(' AI Agent通过大模型的推理能力,实现了超越传统规则引擎的智能化指标选择,')
  441. print(' 能够根据具体业务场景动态调整分析框架,确保分析的针对性和有效性。')
  442. print()
  443. async def _metric_calculator_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  444. """指标计算节点"""
  445. try:
  446. # 检查计算模式
  447. use_rules_engine_only = state.get("use_rules_engine_only", False)
  448. use_traditional_engine_only = state.get("use_traditional_engine_only", False)
  449. if use_rules_engine_only:
  450. print("🧮 正在执行规则引擎指标计算(专用模式)...")
  451. elif use_traditional_engine_only:
  452. print("🧮 正在执行传统引擎指标计算(专用模式)...")
  453. else:
  454. print("🧮 正在执行指标计算...")
  455. new_state = state.copy()
  456. # 使用规划决策指定的指标批次,如果没有指定则使用所有待计算指标
  457. current_batch = state.get("current_batch_metrics", [])
  458. if current_batch:
  459. pending_ids = current_batch
  460. print(f"🧮 本次计算批次包含 {len(pending_ids)} 个指标")
  461. else:
  462. pending_ids = state.get("pending_metric_ids", [])
  463. print(f"🧮 计算所有待计算指标,共 {len(pending_ids)} 个")
  464. if not pending_ids:
  465. print("⚠️ 没有待计算的指标")
  466. return convert_numpy_types(new_state)
  467. # 获取指标需求信息
  468. metrics_requirements = state.get("metrics_requirements", [])
  469. if not metrics_requirements:
  470. print("⚠️ 没有指标需求信息")
  471. return convert_numpy_types(new_state)
  472. # 计算成功和失败的指标
  473. successful_calculations = 0
  474. failed_calculations = 0
  475. # 遍历待计算的指标(创建副本避免修改时遍历的问题)
  476. for metric_id in pending_ids.copy():
  477. try:
  478. # 找到对应的指标需求
  479. metric_req = next((m for m in metrics_requirements if m.metric_id == metric_id), None)
  480. if not metric_req:
  481. # 修复:找不到指标需求时,创建临时的指标需求结构,避免跳过指标
  482. print(f"⚠️ 指标 {metric_id} 找不到需求信息,创建临时配置继续计算")
  483. metric_req = type('MetricRequirement', (), {
  484. 'metric_id': metric_id,
  485. 'metric_name': metric_id.replace('metric-', '') if metric_id.startswith('metric-') else metric_id,
  486. 'calculation_logic': f'计算 {metric_id}',
  487. 'required_fields': ['transactions'],
  488. 'dependencies': []
  489. })()
  490. print(f"🧮 计算指标: {metric_id} - {metric_req.metric_name}")
  491. # 根据模式决定使用哪种计算方式
  492. if use_rules_engine_only:
  493. # 只使用规则引擎计算
  494. use_rules_engine = True
  495. print(f" 使用规则引擎模式")
  496. elif use_traditional_engine_only:
  497. # 只使用传统引擎计算
  498. use_rules_engine = False
  499. print(f" 使用传统引擎模式")
  500. else:
  501. # 自动选择计算方式:优先使用规则引擎,只在规则引擎不可用时使用传统计算
  502. use_rules_engine = True # 默认使用规则引擎计算所有指标
  503. if use_rules_engine:
  504. # 使用规则引擎计算
  505. # 现在metric_id已经是知识ID,直接使用它作为配置名
  506. config_name = metric_id # metric_id 已经是知识ID,如 "metric-分析账户数量"
  507. intent_result = {
  508. "target_configs": [config_name],
  509. "intent_category": "指标计算"
  510. }
  511. print(f" 使用知识ID: {config_name}")
  512. # 将打好标的数据集传入指标计算函数中
  513. data_set_classified = state.get("data_set_classified", [])
  514. results = await self.rules_engine_agent.calculate_metrics(intent_result, data_set_classified)
  515. else:
  516. # 使用传统指标计算(模拟)
  517. # 这里简化处理,实际应该根据配置文件调用相应的API
  518. results = {
  519. "success": True,
  520. "results": [{
  521. "config_name": metric_req.metric_id,
  522. "result": {
  523. "success": True,
  524. "data": f"传统引擎计算结果:{metric_req.metric_name}",
  525. "value": 100.0 # 模拟数值
  526. }
  527. }]
  528. }
  529. # 处理计算结果
  530. calculation_success = False
  531. for result in results.get("results", []):
  532. if result.get("result", {}).get("success"):
  533. # 计算成功
  534. new_state["computed_metrics"][metric_id] = result["result"]
  535. successful_calculations += 1
  536. calculation_success = True
  537. print(f"✅ 指标 {metric_id} 计算成功")
  538. break # 找到一个成功的就算成功
  539. else:
  540. # 计算失败
  541. failed_calculations += 1
  542. print(f"❌ 指标 {metric_id} 计算失败")
  543. # 初始化失败尝试记录
  544. if "failed_metric_attempts" not in new_state:
  545. new_state["failed_metric_attempts"] = {}
  546. # 根据计算结果处理指标
  547. if calculation_success:
  548. # 计算成功:从待计算列表中移除
  549. if metric_id in new_state["pending_metric_ids"]:
  550. new_state["pending_metric_ids"].remove(metric_id)
  551. # 重置失败计数
  552. new_state["failed_metric_attempts"].pop(metric_id, None)
  553. else:
  554. # 计算失败:记录失败次数,不从待计算列表移除
  555. new_state["failed_metric_attempts"][metric_id] = new_state["failed_metric_attempts"].get(metric_id, 0) + 1
  556. max_retries = 3
  557. if new_state["failed_metric_attempts"][metric_id] >= max_retries:
  558. print(f"⚠️ 指标 {metric_id} 已达到最大重试次数 ({max_retries}),从待计算列表中移除")
  559. if metric_id in new_state["pending_metric_ids"]:
  560. new_state["pending_metric_ids"].remove(metric_id)
  561. except Exception as e:
  562. print(f"❌ 计算指标 {metric_id} 时发生异常: {e}")
  563. failed_calculations += 1
  564. # 初始化失败尝试记录
  565. if "failed_metric_attempts" not in new_state:
  566. new_state["failed_metric_attempts"] = {}
  567. # 记录失败次数
  568. new_state["failed_metric_attempts"][metric_id] = new_state["failed_metric_attempts"].get(metric_id, 0) + 1
  569. max_retries = 3
  570. if new_state["failed_metric_attempts"][metric_id] >= max_retries:
  571. print(f"⚠️ 指标 {metric_id} 异常已达到最大重试次数 ({max_retries}),从待计算列表中移除")
  572. if metric_id in new_state["pending_metric_ids"]:
  573. new_state["pending_metric_ids"].remove(metric_id)
  574. # 更新计算结果统计
  575. new_state["calculation_results"] = {
  576. "total_configs": len(pending_ids),
  577. "successful_calculations": successful_calculations,
  578. "failed_calculations": failed_calculations
  579. }
  580. # 添加消息
  581. if use_rules_engine_only:
  582. message_content = f"🧮 规则引擎指标计算完成:{successful_calculations} 成功,{failed_calculations} 失败"
  583. elif use_traditional_engine_only:
  584. message_content = f"🧮 传统引擎指标计算完成:{successful_calculations} 成功,{failed_calculations} 失败"
  585. else:
  586. message_content = f"🧮 指标计算完成:{successful_calculations} 成功,{failed_calculations} 失败"
  587. new_state["messages"].append({
  588. "role": "assistant",
  589. "content": message_content,
  590. "timestamp": datetime.now().isoformat()
  591. })
  592. if use_rules_engine_only:
  593. print(f"✅ 规则引擎指标计算完成:{successful_calculations} 成功,{failed_calculations} 失败")
  594. elif use_traditional_engine_only:
  595. print(f"✅ 传统引擎指标计算完成:{successful_calculations} 成功,{failed_calculations} 失败")
  596. else:
  597. print(f"✅ 指标计算完成:{successful_calculations} 成功,{failed_calculations} 失败")
  598. return convert_numpy_types(new_state)
  599. except Exception as e:
  600. print(f"❌ 指标计算节点失败: {e}")
  601. new_state = state.copy()
  602. new_state["errors"].append(f"指标计算错误: {str(e)}")
  603. return convert_numpy_types(new_state)
  604. async def _anomaly_recognition_node(self, state: IntegratedWorkflowState) -> IntegratedWorkflowState:
  605. """异常识别节点"""
  606. try:
  607. print("🔍 正在执行异常识别...")
  608. # 检查是否已初始化异常识别智能体
  609. if self.anomaly_recognizer is None:
  610. print("🤖 初始化异常识别智能体...")
  611. from llmops.agents.anomaly_recognizer_agent import AnomalyRecognitionAgent
  612. from llmops.config import anomaly_recognizer_config
  613. self.anomaly_recognizer = AnomalyRecognitionAgent(
  614. csv_path=state["standardized_file_path"],
  615. api_key=self.api_key,
  616. base_url=self.base_url,
  617. model_name=self.model_name,
  618. config=anomaly_recognizer_config
  619. )
  620. # 加载交易数据
  621. print("📥 加载交易数据...")
  622. transaction_data = self.anomaly_recognizer.load_transaction_data()
  623. # 执行异常识别
  624. print("🔍 执行异常识别分析...")
  625. recognition_results = self.anomaly_recognizer.execute_full_recognition()
  626. # 生成异常报告
  627. print("📊 生成异常识别报告...")
  628. output_dir = "outputs/anomaly_reports"
  629. report_path = self.anomaly_recognizer.generate_recognition_report(output_dir)
  630. # 使用 update_state_with_anomaly_recognition 函数更新状态
  631. new_state = update_state_with_anomaly_recognition(
  632. state,
  633. recognition_results,
  634. report_path
  635. )
  636. print(f"✅ 异常识别完成:发现 {recognition_results.get('summary', {}).get('total_identified_anomalies', 0)} 条异常")
  637. return convert_numpy_types(new_state)
  638. except Exception as e:
  639. print(f"❌ 异常识别失败: {e}")
  640. import traceback
  641. traceback.print_exc()
  642. # 即使失败也标记为完成,避免阻塞流程
  643. new_state = state.copy()
  644. new_state["anomaly_recognition_completed"] = True # 标记为完成,避免卡住
  645. new_state["errors"].append(f"异常识别错误: {str(e)}")
  646. # 使用默认的异常摘要
  647. new_state["anomaly_summary"] = {
  648. "total_anomalies": 0,
  649. "anomaly_ratio": "0%",
  650. "severity_distribution": {},
  651. "anomaly_distribution": {}
  652. }
  653. # 添加消息
  654. new_state["messages"].append({
  655. "role": "assistant",
  656. "content": f"⚠️ 异常识别失败,跳过异常分析: {str(e)}",
  657. "timestamp": datetime.now().isoformat()
  658. })
  659. return convert_numpy_types(new_state)
  660. def _decision_to_route(self, decision: str) -> str:
  661. """将规划决策转换为路由"""
  662. decision_routes = {
  663. "data_classify": "data_classify",
  664. "generate_outline": "outline_generator",
  665. "compute_metrics": "metric_calculator",
  666. "finalize_report": END # 直接结束流程
  667. }
  668. return decision_routes.get(decision, "planning_node")
  669. def _format_decision_message(self, decision: Any) -> str:
  670. """格式化决策消息"""
  671. try:
  672. decision_type = getattr(decision, 'decision', 'unknown')
  673. reasoning = getattr(decision, 'reasoning', '')
  674. if decision_type == "compute_metrics" and hasattr(decision, 'metrics_to_compute'):
  675. metrics = decision.metrics_to_compute
  676. return f"🧮 规划决策:计算 {len(metrics)} 个指标"
  677. elif decision_type == "finalize_report":
  678. return f"✅ 规划决策:生成最终报告"
  679. elif decision_type == "generate_outline":
  680. return f"📋 规划决策:生成大纲"
  681. else:
  682. return f"🤔 规划决策:{decision_type}"
  683. except:
  684. return "🤔 规划决策已完成"
  685. async def run_workflow(self, question: str, industry: str, original_file_path: str, session_id: str = None, use_rules_engine_only: bool = False, use_traditional_engine_only: bool = False) -> Dict[str, Any]:
  686. """
  687. 运行完整的工作流
  688. Args:
  689. question: 用户查询
  690. industry: 行业
  691. original_file_path: 原始文件路径
  692. session_id: 会话ID
  693. use_rules_engine_only: 是否只使用规则引擎指标计算
  694. use_traditional_engine_only: 是否只使用传统引擎指标计算
  695. Returns:
  696. 工作流结果
  697. """
  698. try:
  699. print("🚀 启动完整智能体工作流...")
  700. print(f"问题:{question}")
  701. print(f"行业:{industry}")
  702. print(f"数据文件:{original_file_path}")
  703. if use_rules_engine_only:
  704. print("计算模式:只使用规则引擎")
  705. elif use_traditional_engine_only:
  706. print("计算模式:只使用传统引擎")
  707. else:
  708. print("计算模式:标准模式")
  709. # 创建初始状态
  710. initial_state = create_initial_integrated_state(question, industry, original_file_path, session_id)
  711. # 设置计算模式标记
  712. if use_rules_engine_only:
  713. initial_state["use_rules_engine_only"] = True
  714. initial_state["use_traditional_engine_only"] = False
  715. elif use_traditional_engine_only:
  716. initial_state["use_rules_engine_only"] = False
  717. initial_state["use_traditional_engine_only"] = True
  718. else:
  719. initial_state["use_rules_engine_only"] = False
  720. initial_state["use_traditional_engine_only"] = False
  721. # 编译工作流
  722. app = self.workflow.compile()
  723. # 执行工作流
  724. result = await app.ainvoke(initial_state)
  725. print("✅ 工作流执行完成")
  726. return {
  727. "success": True,
  728. "result": result,
  729. "answer": result.get("answer"),
  730. "report": result.get("report_draft"),
  731. "session_id": result.get("session_id"),
  732. "execution_summary": {
  733. "planning_steps": result.get("planning_step", 0),
  734. "outline_generated": result.get("outline_draft") is not None,
  735. "metrics_computed": len(result.get("computed_metrics", {})),
  736. "completion_rate": result.get("completeness_score", 0)
  737. }
  738. }
  739. except Exception as e:
  740. print(f"❌ 工作流执行失败: {e}")
  741. return {
  742. "success": False,
  743. "error": str(e),
  744. "result": None
  745. }
  746. # 便捷函数
  747. async def run_complete_agent_flow(question: str, industry: str, data: List[Dict[str, Any]], file_name: str, api_key: str, session_id: str = None, use_rules_engine_only: bool = False, use_traditional_engine_only: bool = False) -> Dict[str, Any]:
  748. """
  749. 运行完整智能体工作流的便捷函数
  750. Args:
  751. question: 用户查询
  752. data: 数据集
  753. file_name: 数据文件名称
  754. api_key: API密钥
  755. session_id: 会话ID
  756. use_rules_engine_only: 是否只使用规则引擎指标计算
  757. use_traditional_engine_only: 是否只使用传统引擎指标计算
  758. Returns:
  759. 工作流结果
  760. """
  761. workflow = CompleteAgentFlow(api_key)
  762. return await workflow.run_workflow(question, industry, data, file_name, session_id, use_rules_engine_only, use_traditional_engine_only)
  763. # 便捷函数
  764. async def run_flow(question: str, industry: str, original_file_path: str, api_key: str, base_url: str, model_name: str, session_id: str = None, use_rules_engine_only: bool = False, use_traditional_engine_only: bool = False) -> Dict[str, Any]:
  765. """
  766. 运行完整智能体工作流的便捷函数
  767. Args:
  768. question: 用户查询
  769. data: 数据集
  770. original_file_path: 原始文件路径(pdf/img/csv)
  771. api_key: API密钥
  772. base_url: LLM base url
  773. model_name: LLM model name
  774. session_id: 会话ID
  775. use_rules_engine_only: 是否只使用规则引擎指标计算
  776. use_traditional_engine_only: 是否只使用传统引擎指标计算
  777. Returns:
  778. 工作流结果
  779. """
  780. workflow = CompleteAgentFlow(api_key, base_url, model_name)
  781. return await workflow.run_workflow(question, industry, original_file_path, session_id, use_rules_engine_only, use_traditional_engine_only)
  782. # 主函数用于测试
  783. async def main():
  784. """主函数:执行系统测试"""
  785. import os
  786. os.environ["LANGCHAIN_TRACING_V2"] = "false"
  787. os.environ["LANGCHAIN_API_KEY"] = ""
  788. # 禁用 LangGraph 的追踪
  789. os.environ["LANGSMITH_TRACING"] = "false"
  790. print("🚀 执行CompleteAgentFlow系统测试")
  791. print("=" * 50)
  792. # 行业
  793. industry = "农业"
  794. # 测试文件(pdf/img/csv)
  795. file_name = "11111.png"
  796. curr_dir = os.path.dirname(os.path.abspath(__file__))
  797. file_path = os.path.join(curr_dir, "..", "data_files", file_name)
  798. print(f"使用LLM:{LLM_MODEL_NAME}")
  799. # 执行测试
  800. result = await run_flow(
  801. question="请生成一份详细的农业经营贷流水分析报告,需要包含:1.总收入和总支出统计 2.收入笔数和支出笔数 3.各类型收入支出占比分析 4.交易对手收入支出TOP3排名 5.按月份的收入支出趋势分析 6.账户数量和交易时间范围统计 7.资金流入流出月度统计等全面指标",
  802. industry = industry,
  803. original_file_path=file_path,
  804. api_key=LLM_API_KEY,
  805. base_url=LLM_BASE_URL,
  806. model_name=LLM_MODEL_NAME,
  807. session_id="direct-test"
  808. )
  809. print(f"📋 结果: {'✅ 成功' if result.get('success') else '❌ 失败'}")
  810. print(f"{result}")
  811. if result.get('success'):
  812. summary = result.get('execution_summary', {})
  813. print(f" 规划步骤: {summary.get('planning_steps', 0)}")
  814. print(f" 指标计算: {summary.get('metrics_computed', 0)}")
  815. print("🎉 测试成功!")
  816. return result
  817. if __name__ == "__main__":
  818. import asyncio
  819. asyncio.run(main())