Repository: foreveryh/mentis Branch: main Commit: 7859b536b98b Files: 240 Total size: 1.4 MB Directory structure: gitextract_zde6lsy3/ ├── .gitignore ├── README.md ├── __init__.py ├── api/ │ ├── __init__.py │ ├── agent/ │ │ ├── __init__.py │ │ └── loader.py │ ├── server.py │ └── utils.py ├── core/ │ ├── __init__.py │ ├── a2a/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── agent_task_manager.py │ │ ├── client/ │ │ │ ├── __init__.py │ │ │ ├── card_resolver.py │ │ │ └── client.py │ │ ├── config.json │ │ ├── server/ │ │ │ ├── __init__.py │ │ │ ├── server.py │ │ │ ├── task_manager.py │ │ │ └── utils.py │ │ ├── types.py │ │ └── utils/ │ │ ├── __init__.py │ │ ├── in_memory_cache.py │ │ └── push_notification_auth.py │ ├── agents/ │ │ ├── __init__.py │ │ ├── base/ │ │ │ ├── base_agent.py │ │ │ ├── create_react_agent_wrapper.py │ │ │ └── react_agent.py │ │ ├── react_based_supervisor/ │ │ │ ├── __init__.py │ │ │ ├── agent_name.py │ │ │ ├── handoff.py │ │ │ ├── planning_handler.py │ │ │ ├── simple_planning_tool.py │ │ │ ├── state_schema.py │ │ │ └── supervisor.py │ │ ├── react_supervisor_agent.py │ │ ├── sb_supervisor_agent.py │ │ ├── state_based_supervisor/ │ │ │ ├── __init__.py │ │ │ ├── agent_name.py │ │ │ ├── evaluate_result_node.py │ │ │ ├── handoff.py │ │ │ ├── planner_node.py │ │ │ ├── planning_handler.py │ │ │ ├── prompt.py │ │ │ ├── state_schema.py │ │ │ ├── supervisor_graph.py │ │ │ └── supervisor_node.py │ │ └── sub_agents/ │ │ ├── __init__.py │ │ ├── coder_agent.py │ │ ├── data_analyst_agent.py │ │ ├── designer_agent.py │ │ ├── reporter_agent.py │ │ └── research_agent.py │ ├── llm/ │ │ ├── llm_manager.py │ │ └── model_config.py │ ├── mcp/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── client.py │ │ ├── config_loader.py │ │ ├── mcp_server_config.json │ │ ├── run_server.py │ │ ├── server.py │ │ └── test/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── minimal_fastmcp_test.py │ │ └── test_minimal_client.py │ ├── tools/ │ │ ├── __init__.py │ │ ├── e2b_tool.py │ │ ├── firecrawl_tool.py │ │ ├── registry.py │ │ └── replicate_flux_tool.py │ └── utils/ │ ├── agent_utils.py │ └── timezone.py ├── examples/ │ ├── 01_supervisor_test.py │ ├── 02_supervisor_agent_test.py │ ├── 03_tavily_tools_test.py │ ├── 04_react_agent_test.py │ ├── 05_react_agent_user_input.py │ ├── 06_web_extraction_tools_test.py │ ├── 07_web_extraction_with_filesystem.py │ ├── 08_react_agent_tool_registry_test.py │ ├── 09_e2b_code_interpreter_test.py │ ├── 10_financial_data_analysis.py │ ├── 11_e2b_sandbox_test.py │ ├── 12_planning_supervisor_test.py │ ├── 13_multi_agent_roles_test.py │ ├── 14_mcp_client_fetch_test.py │ ├── 15_mcp_agent_test.py │ ├── 16_google_a2a/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── agent_task_manager_test.py │ │ ├── client_example.py │ │ ├── currency_agent_test.py │ │ ├── currency_agent_test_README.md │ │ └── langgraph_integration.py │ ├── TODO_computer_tool_demo.py │ ├── __init__.py │ ├── state_based_supervisor_examples/ │ │ ├── 01_simple.py │ │ ├── 02_tavily.py │ │ └── 03_multi_agents.py │ └── web_agents/ │ ├── README.md │ ├── README_SPEC.md │ ├── __init__.py │ ├── research_assistant/ │ │ ├── README.md │ │ ├── __init__.py │ │ └── graph.py │ └── weather_agent/ │ ├── README.md │ └── __init__.py ├── instructions/ │ ├── 00.Langgraph 和 React Agent.md │ ├── 01.supervisor_pattern.md │ ├── 02.supervisor_pattern_agent.md │ ├── 03.tavily_search_integration.md │ ├── 04.react_agent.md │ ├── 05.react_agent_user_input.md │ ├── 06.web_extraction_tools.md │ ├── 07.web_extraction_with_filesystem.md │ ├── 
08.react_agent_tool_registry.md │ └── 09.e2b_sandbox_integration.md ├── log_analyzer.py ├── pyproject.toml ├── requirements.txt ├── setup.py ├── super_agents/ │ ├── __init__.py │ ├── browser_use/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── agent/ │ │ │ ├── __init__.py │ │ │ ├── graph.py │ │ │ ├── nodes.py │ │ │ ├── prompts.py │ │ │ ├── schemas.py │ │ │ ├── state.py │ │ │ └── tools.py │ │ ├── agent.py │ │ ├── browser/ │ │ │ ├── browser.py │ │ │ ├── detector.py │ │ │ ├── findVisibleInteractiveElements.js │ │ │ ├── models.py │ │ │ └── utils.py │ │ ├── llm.py │ │ └── main.py │ ├── customized_deep_research/ │ │ ├── PRD_README.md │ │ ├── README.md │ │ ├── __init__.py │ │ ├── main.py │ │ └── reason_graph/ │ │ ├── __init__.py │ │ ├── graph.py │ │ ├── nodes.py │ │ ├── prompt.py │ │ ├── schemas.py │ │ ├── state.py │ │ └── tools.py │ └── deep_research/ │ ├── README.md │ ├── __init__.py │ ├── a2a_adapter/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── client_example.py │ │ ├── deep_research_task_manager.py │ │ ├── dr_terminal_output.md │ │ ├── run_server.py │ │ └── setup.py │ ├── main.py │ ├── output/ │ │ ├── research_report_analyze_smartvalue_co_ltds_9417t_core_business_key_productsservices_eg_government_cloud_solutions_mo_20250418_125137.md │ │ ├── research_report_id_like_a_thorough_analysis_of_li_auto_stock_including_summary_company_overview_key_metrics_performa_20250327_121800.md │ │ └── research_report_id_like_a_thorough_analysis_of_xpev_stock_including_summary_company_overview_key_metrics_performance_20250327_105350.md │ ├── reason_graph/ │ │ ├── __init__.py │ │ ├── graph.py │ │ ├── nodes.py │ │ ├── prompt.py │ │ ├── schemas.py │ │ ├── state.py │ │ └── tools.py │ └── tests/ │ ├── __init__.py │ └── test_graph.py ├── web/ │ ├── .gitignore │ ├── README.md │ ├── app/ │ │ ├── api/ │ │ │ └── agent/ │ │ │ └── route.ts │ │ ├── chat/ │ │ │ ├── [id]/ │ │ │ │ ├── agent-types.ts │ │ │ │ ├── components/ │ │ │ │ │ ├── chatbot-node.tsx │ │ │ │ │ ├── checkpoint-card.tsx │ │ │ │ │ ├── node-card.tsx │ │ │ │ │ ├── reminder.tsx │ │ │ │ │ ├── research/ │ │ │ │ │ │ ├── report-preview.tsx │ │ │ │ │ │ ├── research-node.tsx │ │ │ │ │ │ ├── research-status.tsx │ │ │ │ │ │ └── search-results.tsx │ │ │ │ │ └── weather/ │ │ │ │ │ ├── cloudy.tsx │ │ │ │ │ ├── rainy.tsx │ │ │ │ │ ├── snowy.tsx │ │ │ │ │ ├── sunny.tsx │ │ │ │ │ └── weather-node.tsx │ │ │ │ └── page.tsx │ │ │ └── page.tsx │ │ ├── deep-research/ │ │ │ ├── [id]/ │ │ │ │ └── page.tsx │ │ │ └── page.tsx │ │ ├── globals.css │ │ ├── layout.tsx │ │ └── page.tsx │ ├── components/ │ │ ├── app-sidebar.tsx │ │ ├── theme-provider.tsx │ │ ├── theme-switcher.tsx │ │ └── ui/ │ │ ├── badge.tsx │ │ ├── button.tsx │ │ ├── card.tsx │ │ ├── checkbox.tsx │ │ ├── dialog.tsx │ │ ├── input.tsx │ │ ├── popover.tsx │ │ ├── progress.tsx │ │ ├── separator.tsx │ │ ├── sheet.tsx │ │ ├── sidebar.tsx │ │ ├── skeleton.tsx │ │ ├── textarea.tsx │ │ └── tooltip.tsx │ ├── components.json │ ├── eslint.config.mjs │ ├── hooks/ │ │ ├── use-mobile.tsx │ │ └── useLangGraphAgent/ │ │ ├── actions.ts │ │ ├── api.ts │ │ ├── ascii-tree.ts │ │ ├── types.ts │ │ └── useLangGraphAgent.tsx │ ├── next.config.ts │ ├── package.json │ ├── postcss.config.mjs │ ├── stores/ │ │ └── chat-store.tsx │ ├── tailwind.config.ts │ └── tsconfig.json └── web_for_a2a/ ├── .gitignore ├── Instruction.md ├── README.md ├── app/ │ ├── api/ │ │ └── a2a/ │ │ └── route.ts │ ├── deepresearch/ │ │ └── page.tsx │ ├── globals.css │ ├── layout.tsx │ └── page.tsx ├── package.json ├── postcss.config.js ├── tailwind.config.js └── tsconfig.json 
================================================ FILE CONTENTS ================================================ ================================================ FILE: .gitignore ================================================ # Python __pycache__/ *.py[cod] *$py.class *.so .Python build/ develop-eggs/ dist/ downloads/ eggs/ .eggs/ lib/ lib64/ parts/ sdist/ var/ wheels/ *.egg-info/ .installed.cfg *.egg # Virtual Environment venv/ env/ ENV/ # IDE .idea/ .vscode/ *.swp *.swo # OS specific .DS_Store Thumbs.db # LangSmith .langchain.db .langsmith/ # Logs *.log # Env .env # output examples/logs/ examples/output/ examples/output/sandbox_test ================================================ FILE: README.md ================================================ # Mentis - Agent Development Kit [![Python Version](https://img.shields.io/badge/python-3.11+-blue.svg)](https://www.python.org/downloads/) [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT) ## Overview Mentis is an extensible multi-agent ADK (Agent Development Kit) built on LangGraph. At its core is a **state-driven, planning Supervisor Agent** that understands complex user requests, produces an execution plan, and intelligently coordinates a set of Specialist Agents with different skills to complete the task together. The framework aims to automate complex tasks: through collaboration between agents it provides more powerful and flexible problem solving than any single agent. ## Core Features * **Multi-agent architecture**: a central Supervisor coordinates several specialist sub-agents (Research, Coder, Reporter, Designer, Data Analyst). * **State-based planning**: a dedicated `Planner` node produces the initial plan, the `Supervisor` focuses on execution and dispatch based on the plan state, and an `Evaluator` node assesses sub-agent results and updates the state. Plan state is persisted through LangGraph (a Checkpointer must be configured). * **Modular agent design**: built on `BaseAgent` and `ReactAgent`, making it easy to add or modify sub-agents with different capabilities. * **Tool registration and management**: `core/tools/registry.py` provides centralized registration, categorization, and dynamic loading of tools. * **Configurable LLMs**: `LLMManager` (or environment variables) lets you configure and switch between LLM providers (OpenAI, DeepSeek, XAI Grok via a compatible endpoint) and models. * **Persistence support**: LangGraph's Checkpointer mechanism enables persistence of conversation state and plans. * **Clear execution flow**: Planner -> Supervisor -> (Handoff -> Agent -> Evaluator -> Supervisor loop) -> final output/Reporter. * **A2A protocol support**: implements Google's Agent-to-Agent (A2A) protocol, so Mentis agents can interoperate with other A2A-capable systems. ## Architecture Overview 1. **User request (input)**: the user submits a task through an entry point (`main.py` or the API). 2. **Planner node**: analyzes the request, generates an initial plan (`Plan`) with task steps and suggested agents, and writes it into the graph state (`PlanningAgentState`). 3. **Supervisor node**: receives the state carrying the plan and decides the next action from the plan state and message history: * start a new task (mark it 'in_progress'); * delegate an 'in_progress' task to a suitable sub-agent (via a handoff tool); * wait for the sub-agent to finish; * judge whether the plan is finally complete; * choose the final output path (summarize itself, or call the Reporter). 4. **Handoff executor**: handles the `transfer_to_` tool calls issued by the Supervisor and passes control and state to the target sub-agent. 5. **Specialist agent nodes**: inherit from `ReactAgent` or `BaseAgent` and carry out the concrete work (research, coding, report/image generation, data analysis), possibly calling their own tools. 6. **Evaluate result node**: receives a sub-agent's output, performs a deterministic evaluation (success/failure), and updates the task's status and the overall plan status. 7. **Loop and finish**: the flow cycles between Evaluator -> Supervisor until the Supervisor judges the plan complete, then routes to `END` or the `ReporterAgent` (a minimal invocation sketch follows below).
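The flow above compiles to a regular LangGraph graph, so driving it looks like driving any compiled graph. A minimal sketch, assuming a hypothetical `build_supervisor_graph()` factory (the real construction lives in `core/agents/state_based_supervisor/supervisor_graph.py`) and the `PlanningAgentState` keys (`messages`, `plan`) used by `api/server.py`:

```python
# Minimal driving sketch, not the project's actual entry point.
from langchain_core.messages import HumanMessage
from langgraph.checkpoint.memory import MemorySaver

from core.agents.state_based_supervisor.supervisor_graph import build_supervisor_graph  # hypothetical name

# Compile the Planner -> Supervisor -> (Handoff -> Agent -> Evaluator) graph with an
# in-memory checkpointer so the Plan persists across steps of the same thread.
graph = build_supervisor_graph(checkpointer=MemorySaver())

config = {"configurable": {"thread_id": "demo-thread-1"}}
initial_state = {"messages": [HumanMessage(content="Write a Python function to calculate factorial and run it for 5.")]}

for node_update in graph.stream(initial_state, config, stream_mode="updates"):
    # Each update is keyed by the node that produced it (planner, supervisor, evaluator, ...).
    print(node_update)
```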
## Getting Started ### 1. Prerequisites * Python 3.11+ * Manage dependencies with `pip`, `uv`, or a similar tool. ### 2. Installation Run from the project root (uv is recommended): ```bash uv venv source .venv/bin/activate uv sync ``` ```bash # pip install -r requirements.txt # or uv pip install -r requirements.txt ``` (The `requirements.txt` is not actively maintained; make sure it contains all the required libraries, such as `langchain`, `langgraph`, `langchain-openai`, `e2b` (if using E2B), `replicate` (if using Replicate), `tavily-python`, `exa-py`, `python-dotenv`, `anyio`, `tiktoken`, etc.) ### 3. Configuration * Copy `.env.example` to `.env`. * Fill in the API keys/tokens you need in `.env`: * `OPENAI_API_KEY` (if using OpenAI models) * `DEEPSEEK_API_KEY` (if using DeepSeek models) * `XAI_API_KEY` (if using XAI Grok; confirm the base URL) * `REPLICATE_API_TOKEN` (if using the Replicate tool) * `E2B_API_KEY` (if using the E2B Code Interpreter, recommended!) * `TAVILY_API_KEY` (if using Tavily search, recommended!) * `EXA_API_KEY` (if using Exa search) * `LANGCHAIN_TRACING_V2="true"` (strongly recommended, for LangSmith debugging) * `LANGCHAIN_API_KEY="ls_..."` (your LangSmith key) * `LANGCHAIN_PROJECT="Your_Project_Name"` (your LangSmith project name) * **LLM configuration**: * If you use `LLMManager` (as the examples do), check and configure the model config file it reads (e.g. `config/models.yaml`; the path may differ). * If you initialize LLMs directly from environment variables in `tools.py`, make sure the corresponding variables are set, e.g. `LLM_PROVIDER`, `LLM_MODEL_NAME`, `LLM_BASE_URL` (for compatible APIs). * **Tool configuration**: make sure the tool pre-registration logic in `core/tools/__init__.py` or `registry.py` can find and initialize the tools you need. ### 4. Running Examples The project ships example scripts that demonstrate the framework: ```bash # Run from the project root (mentis/) python examples/state_based_supervisor_examples/03_multi_agents.py ``` The script prompts for an initial request. Some simple things to try: * `"What is the capital of France?"` (basic test) * `"Write a short, four-line poem about spring."` (tests the Reporter) * `"Generate an image of a cat wearing a top hat, oil painting style."` (tests the Designer) * `"Write a Python function to calculate factorial and run it for 5."` (tests the Coder) ## Project Structure ``` mentis/ ├── api/ # (optional) API service code ├── core/ # Core framework code │ ├── a2a/ # A2A protocol client and server implementation │ ├── agents/ # Agent definitions (base, react, supervisor, sub-agents) │ │ ├── base/ │ │ ├── state_based_supervisor/ # Supervisor internals (graph, node, planner, evaluator) │ │ ├── sub_agents/ # Concrete sub-agent implementations (research, coder, etc.) │ │ └── sb_supervisor_agent.py # SupervisorAgent class definition │ ├── llm/ # (optional) LLM management/configuration │ ├── tools/ # Tool definitions and registry (registry, e2b, replicate, etc.) │ └── utils/ # Shared helpers ├── examples/ # Example and test scripts │ └── state_based_supervisor_examples/ │ └── 03_multi_agents.py # The test script used above ├── super_agents/ # Standalone, end-to-end agent implementations │ └── deep_research/ # DeepResearch agent │ └── a2a_adapter/ # A2A protocol adapter for DeepResearch ├── web/ # (optional) Web client code ├── web_for_a2a/ # A2A-based web UI ├── .env.example # Example environment variables ├── requirements.txt # Python dependencies └── README.md # This file ``` ## Super Agents (Standalone Functional Agents) Besides the single-skill Specialist Agents coordinated by the Supervisor (Coder, Researcher, ...), the framework also supports building and integrating more complex **"Super Agents"**. A Super Agent is a **standalone agent graph with end-to-end capability that can complete a relatively large, self-contained task**. It can carry its own planning, execution, and even internal coordination logic. Super Agents can **run on their own** to finish a specific large task, or be treated by a higher-level coordinator (such as our Supervisor Agent) as a powerful **"capability" or "tool"** to handle one step of a bigger plan. ### DeepResearch Agent (the first instance) https://github.com/user-attachments/assets/2a685709-5be0-43a3-9e2d-934ef5fa3315 The `DeepResearch Agent` is the first Super Agent built on this idea (an early version of it was the foundation on which we developed this multi-agent framework). * **Core function**: automatically runs a **deep research** workflow on **any topic** the user provides. * **Internal workflow**: it has its own complete set of steps, roughly: 1. **Plan Research**: analyze the topic and generate initial search queries and analysis angles. 2. **Multi-Source Search**: call web search (Tavily), academic search (Exa), and other tools to gather information. 3. **(Optional) Perform Analysis**: run first-pass analyses of the search results (sentiment, SWOT, etc.). 4. **Gap Analysis**: assess the collected information and identify knowledge gaps and limitations. 5. **(Optional) Gap Filling**: run additional, more targeted searches against the identified gaps. 6. **Final Synthesis**: integrate all the information and distill key findings and remaining uncertainties. 7. **Report Generation**: turn the synthesis and context into a detailed, cited Markdown research report. * **Current status**: the agent's core logic and nodes are largely in place, and it now supports the A2A protocol and a dedicated web UI. #### A2A Protocol Support We implemented a full A2A protocol adapter for the DeepResearch Agent, so it can: * be discovered and invoked as a standard A2A service * receive research tasks through the `tasks/send` and `tasks/sendSubscribe` endpoints * stream research progress updates in real time * return structured research results * support the push notification mechanism This lets the DeepResearch Agent integrate easily with other A2A-capable systems (such as Google Assistant) or be called from a custom frontend application; a minimal client sketch follows.
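A minimal client sketch for the streaming path, using this repo's `A2AClient`. The payload fields follow the `TaskSendParams` usage seen in `core/a2a/` (`id`, `sessionId`, `message.parts`, `acceptedOutputModes`), but the URL, IDs, and topic are illustrative:

```python
# Sketch: stream a research task from a locally running DeepResearch A2A server.
import asyncio
import uuid

from core.a2a.client.client import A2AClient


async def main():
    client = A2AClient(url="http://localhost:8000/")  # assumed server address
    payload = {
        "id": uuid.uuid4().hex,         # task id
        "sessionId": uuid.uuid4().hex,  # conversation/session id
        "acceptedOutputModes": ["text"],
        "message": {
            "role": "user",
            "parts": [{"type": "text", "text": "State of open-source LLM agents in 2025"}],
        },
    }
    # send_task_streaming corresponds to the tasks/sendSubscribe endpoint.
    async for update in client.send_task_streaming(payload):
        print(update.model_dump(exclude_none=True))


asyncio.run(main())
```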
#### Dedicated Web UI https://github.com/user-attachments/assets/640365c7-839b-4765-b9ac-ee0ac961ceb8 We also built a modern Next.js web UI dedicated to interacting with the DeepResearch A2A service: * an intuitive interface for entering a research topic and starting a research task * live display of research progress and intermediate updates (via Server-Sent Events) * a polished rendering of the final research report * a demonstration of handling A2A streaming responses with native browser APIs in a frontend app **How to try the DeepResearch Agent:** 1. **Standalone mode**: * Check your environment: make sure `.env` contains all the required API keys (e.g. `OPENAI_API_KEY`/`DEEPSEEK_API_KEY`, `TAVILY_API_KEY`, `EXA_API_KEY`). * Run the script from the project root: ```bash python super_agents/deep_research/main.py ``` * Enter a topic and inspect the result: generated reports are usually saved under the `output/` folder. 2. **A2A service mode**: * Start the A2A server: ```bash cd super_agents/deep_research/a2a_adapter python run_server.py ``` * The server starts on the default port (usually 8000) and exposes A2A-compliant API endpoints. 3. **Web UI mode**: * Make sure the A2A server is running. * Start the web UI: ```bash cd web_for_a2a npm install npm run dev ``` * Open http://localhost:3000/deepresearch in a browser to interact with the DeepResearch Agent through the UI. ## Future Work / Contributing * Flesh out the sub-agents' toolsets and prompts. * Strengthen the Evaluator node's evaluation logic. * Add handling for more complex task dependencies. * Improve management of long conversation histories. * Integrate a persistent Checkpointer (SQLite, Redis, ...). * Issues and pull requests are welcome! * You can also reach me on WeChat: brown🩷cony999 ## License This project is licensed under the MIT License - see the LICENSE file for details. ================================================ FILE: __init__.py ================================================ # Project package initialization ================================================ FILE: api/__init__.py ================================================ ================================================ FILE: api/agent/__init__.py ================================================ ================================================ FILE: api/agent/loader.py ================================================ # Agent Loader Module # This module is responsible for loading agents from the web_agents directory import importlib import os import sys from typing import Dict, Optional, Any, List from langgraph.graph import StateGraph from langgraph.graph.graph import CompiledGraph # Add this import # Try to import deep_research_app try: # Adjust this import path based on your project structure from super_agents.deep_research.reason_graph.graph import web_app as deep_research_app except ImportError: print("Warning: Failed to import deep_research_app.
DeepResearchAgent will be unavailable.") deep_research_app = None # Add examples directory to Python path to allow importing web_agents examples_path = os.path.join(os.path.dirname(os.path.dirname(os.path.dirname(__file__))), 'examples') if examples_path not in sys.path: sys.path.append(examples_path) def list_available_agents() -> Dict[str, str]: """List all available agents in the web_agents directory Returns: Dict[str, str]: A dictionary mapping agent names to their descriptions """ agents = {} web_agents_dir = os.path.join(examples_path, 'web_agents') # Check if web_agents directory exists if not os.path.exists(web_agents_dir) or not os.path.isdir(web_agents_dir): pass # Continue with empty agents dict else: # Iterate through subdirectories in web_agents for item in os.listdir(web_agents_dir): agent_dir = os.path.join(web_agents_dir, item) # Skip non-directories and special directories if not os.path.isdir(agent_dir) or item.startswith('__') or item.startswith('.'): continue # Check if the directory contains an __init__.py file with get_graph function init_file = os.path.join(agent_dir, '__init__.py') if os.path.exists(init_file): # Try to get description from README.md readme_file = os.path.join(agent_dir, 'README.md') description = item # Default description is the directory name if os.path.exists(readme_file): try: with open(readme_file, 'r', encoding='utf-8') as f: first_line = f.readline().strip() if first_line.startswith('# '): description = first_line[2:] except Exception: pass agents[item] = description # Add deep_research to available agents if it's imported successfully if deep_research_app is not None: agents["deep_research"] = "Deep Research Agent for in-depth topic exploration" return agents def load_agent(agent_name: str) -> Optional[CompiledGraph]: """Load an agent from the web_agents directory or special agents Args: agent_name (str): The name of the agent to load Returns: Optional[CompiledGraph]: The compiled graph for the agent, or None if the agent could not be loaded """ # Special case for deep_research agent if agent_name == "deep_research": if deep_research_app: return deep_research_app else: print(f"ERROR: DeepResearchAgent requested but not available.") return None # Standard agents from web_agents directory try: # Import the agent module module = importlib.import_module(f'web_agents.{agent_name}') # Check if the module has a get_graph function if hasattr(module, 'get_graph'): # Call the get_graph function to get the compiled graph return module.get_graph() else: print(f"Error: Agent '{agent_name}' does not have a get_graph function") return None except ImportError as e: print(f"Error importing agent '{agent_name}': {e}") return None except Exception as e: print(f"Error loading agent '{agent_name}': {e}") return None # Default agent to use if none is specified DEFAULT_AGENT = 'research_assistant' # DEFAULT_AGENT = 'weather_agent' def get_default_agent() -> Optional[CompiledGraph]: """Get the default agent Returns: Optional[CompiledGraph]: The compiled graph for the default agent, or None if it could not be loaded """ return load_agent(DEFAULT_AGENT) ================================================ FILE: api/server.py ================================================ import uvicorn from langgraph.types import Command, Interrupt from fastapi import FastAPI, Request, HTTPException, Query from fastapi.middleware.cors import CORSMiddleware from sse_starlette.sse import EventSourceResponse from typing import AsyncGenerator, Dict, Optional, Union, Any from api.utils 
import message_chunk_event, interrupt_event, custom_event, checkpoint_event, format_state_snapshot, stream_update_event import asyncio import traceback import json from langchain_core.messages import HumanMessage from langchain_core.runnables import RunnableConfig # Import the agent loader from api.agent.loader import load_agent, list_available_agents, get_default_agent # Load the default agent graph = get_default_agent() # Track active connections active_connections: Dict[str, asyncio.Event] = {} app = FastAPI( title="LangGraph API", description="API for LangGraph interactions", version="0.1.0" ) # Configure CORS app.add_middleware( CORSMiddleware, allow_origins=["*"], # In production, replace with specific origins allow_credentials=True, allow_methods=["*"], allow_headers=["*"], ) @app.get("/agents") async def list_agents(): """Endpoint returning a list of available agents.""" return list_available_agents() @app.get("/state") async def state(thread_id: str | None = None, agent: Optional[str] = Query(None)): """Endpoint returning current graph state.""" if not thread_id: raise HTTPException(status_code=400, detail="thread_id is required") # Load the specified agent if provided current_graph = load_agent(agent) if agent else graph if not current_graph: raise HTTPException(status_code=404, detail=f"Agent '{agent}' not found") config: RunnableConfig = {"configurable": {"thread_id": thread_id}} state = await current_graph.aget_state(config) return format_state_snapshot(state) @app.get("/history") async def history(thread_id: str | None = None, agent: Optional[str] = Query(None)): """Endpoint returning complete state history. Used for restoring graph.""" if not thread_id: raise HTTPException(status_code=400, detail="thread_id is required") # Load the specified agent if provided current_graph = load_agent(agent) if agent else graph if not current_graph: raise HTTPException(status_code=404, detail=f"Agent '{agent}' not found") config: RunnableConfig = {"configurable": {"thread_id": thread_id}} records = [] async for state in current_graph.aget_state_history(config): records.append(format_state_snapshot(state)) return records @app.post("/agent/stop") async def stop_agent(request: Request): """Endpoint for stopping the running agent.""" body = await request.json() thread_id = body.get("thread_id") if not thread_id: raise HTTPException(status_code=400, detail="thread_id is required") if thread_id in active_connections: active_connections[thread_id].set() return {"status": "stopped", "thread_id": thread_id} raise HTTPException(status_code=404, detail="Thread is not running") @app.post("/agent") async def agent(request: Request): """Endpoint for running the agent.""" body = await request.json() request_type = body.get("type") if not request_type: raise HTTPException(status_code=400, detail="type is required") thread_id = body.get("thread_id") if not thread_id: raise HTTPException(status_code=400, detail="thread_id is required") # Get the agent name if provided agent_name = body.get("agent") # Load the specified agent if provided current_graph = load_agent(agent_name) if agent_name else graph if not current_graph: raise HTTPException(status_code=404, detail=f"Agent '{agent_name or 'default'}' not found") stop_event = asyncio.Event() active_connections[thread_id] = stop_event config: RunnableConfig = {"configurable": {"thread_id": thread_id}} initial_graph_state: Dict[str, Any] = {} input_for_astream: Optional[Union[Dict, Command]] = None # input for astream # Get initial state or messages from 
frontend initial_state_input = body.get("state", {"messages": []}) if not isinstance(initial_state_input, dict): raise HTTPException(status_code=400, detail="state must be a dictionary") if agent_name == "deep_research": # --- Prepare state for DeepResearch Agent --- print("Preparing state for DeepResearchAgent...") # Extract topic from the first message in state['messages'] first_message_content = "" try: # Ensure initial_state_input['messages'] is a list and not empty if isinstance(initial_state_input.get('messages'), list) and initial_state_input['messages']: # Assume the first message's content is the topic first_message_content = initial_state_input['messages'][0]['content'] else: # Try to get topic from other fields in state (alternative) first_message_content = initial_state_input.get('topic', '') except Exception as e: print(f"Warning: Could not extract topic from initial state input: {e}") if not first_message_content or not isinstance(first_message_content, str): raise HTTPException(status_code=400, detail="A valid 'topic' string is required for deep_research agent, expected in state.messages[0].content or state.topic") # Build the ResearchState needed by DeepResearch Agent (at least topic and depth) initial_graph_state = { "topic": first_message_content, "depth": initial_state_input.get("depth", "advanced"), # Optional: allow frontend to specify depth "messages": [], # DeepResearch manages its own message history "stream_updates": [], # Initialize stream_updates # Initialize other ResearchState fields to None or default values "plan": None, "research_plan": None, "search_results": [], "gap_analysis": None, "final_synthesis": None, "final_report_markdown": None, } print(f"Initial ResearchState: {{'topic': '{initial_graph_state['topic']}', 'depth': '{initial_graph_state['depth']}', ...}}") # DeepResearch Agent's astream input is the complete initial state if request_type == "run": input_for_astream = initial_graph_state elif request_type == "resume": # DeepResearch Agent might not support or need different resume approach print("Warning: 'resume' might not be fully supported for DeepResearchAgent yet.") # Assume resume Command can be understood by the graph input_for_astream = Command(resume=body.get("resume")) config["configurable"]["checkpoint_id"] = body.get("resume") # Resume usually needs checkpoint ID else: # Fork, Replay typically only need config config_from_request = body.get("config") if not config_from_request: raise HTTPException(status_code=400, detail="config is required for fork/replay") config = config_from_request # Use complete config provided in the request input_for_astream = None else: # For Supervisor or other Agents (assume using PlanningAgentState) print("Preparing state for Supervisor/Other Agent...") # --- Prepare PlanningAgentState --- # Ensure messages list contains correct BaseMessage objects (or let BaseAgent preprocess) initial_messages = initial_state_input.get("messages", []) initial_graph_state = { "messages": initial_messages, "plan": None, # Planner node will create it "error": None # Add other fields needed by PlanningAgentState and set to None or default values } # --- Set astream input (logic similar to before) --- if request_type == "run": # For PlanningAgentState, initial input typically only contains messages input_for_astream = {"messages": initial_messages} elif request_type == "resume": resume_val = body.get("resume") if not resume_val: raise HTTPException(status_code=400, detail="resume value is required") input_for_astream = 
Command(resume=resume_val) # Ensure config includes checkpoint_id for resuming if "configurable" not in config: config["configurable"] = {} config["configurable"]["checkpoint_id"] = resume_val elif request_type == "fork": config_from_request = body.get("config") if not config_from_request: raise HTTPException(status_code=400, detail="config is required for fork") config = config_from_request # Fork uses complete config provided # Fork typically starts from specified checkpoint, no extra state dict input needed input_for_astream = None elif request_type == "replay": config_from_request = body.get("config") if not config_from_request: raise HTTPException(status_code=400, detail="config is required for replay") config = config_from_request input_for_astream = None else: raise HTTPException(status_code=400, detail="invalid request type") # Ensure config always has thread_id (important for all agents) if "configurable" not in config: config["configurable"] = {} config["configurable"]["thread_id"] = thread_id # --- State and Input preparation complete --- async def generate_events() -> AsyncGenerator[dict, None]: try: # Set recursion_limit to 100 to avoid hitting the recursion limit during deep research if agent_name == "deep_research" and "recursion_limit" not in config: config["recursion_limit"] = 100 async for chunk in current_graph.astream( input_for_astream, # Use prepared input config, # Use prepared config stream_mode=["debug", "messages", "updates", "custom"], ): if stop_event.is_set(): break chunk_type, chunk_data = chunk if chunk_type == "debug": # type can be checkpoint, task, task_result if isinstance(chunk_data, dict) and "type" in chunk_data: debug_type = chunk_data["type"] if debug_type == "checkpoint": yield checkpoint_event(chunk_data) elif debug_type == "task_result": interrupts = chunk_data["payload"].get( "interrupts", []) if interrupts and len(interrupts) > 0: yield interrupt_event(interrupts) elif chunk_type == "messages": # Make sure chunk_data is a list/tuple with at least two elements and the second element is a dict containing langgraph_node if isinstance(chunk_data, (list, tuple)) and len(chunk_data) > 1 and isinstance(chunk_data[1], dict) and "langgraph_node" in chunk_data[1]: yield message_chunk_event(chunk_data[1]["langgraph_node"], chunk_data[0]) else: print(f"Warning: Unexpected messages chunk_data format: {chunk_data}") # Fall back to safe defaults node_name = chunk_data[1].get("langgraph_node", "unknown") if isinstance(chunk_data, (list, tuple)) and len(chunk_data) > 1 and isinstance(chunk_data[1], dict) else "unknown" message = chunk_data[0] if isinstance(chunk_data, (list, tuple)) and len(chunk_data) > 0 else None if message is not None: yield message_chunk_event(node_name, message) elif chunk_type == "custom": # Check if this is a StreamUpdate if isinstance(chunk_data, dict) and all(k in chunk_data for k in ['id', 'type', 'status', 'title']): yield stream_update_event(chunk_data) else: yield custom_event(chunk_data) elif chunk_type == "updates": # Handle state update events (e.g., real-time Plan updates) pass # Currently ignore updates events, rely on checkpoint or custom # --- Loop ended --- yield {"event": "end", "data": "{}"} # Send an end event to frontend except Exception as e: print(f"Error during agent execution stream: {e}") traceback.print_exc() # Send error event to frontend yield {"event": "error", "data": json.dumps({"message": f"Agent execution error: {e}"})} finally: if thread_id in active_connections: del active_connections[thread_id] return EventSourceResponse(generate_events()) def main(): uvicorn.run("api.server:app", host="0.0.0.0", port=8000, reload=True) if
__name__ == "__main__": import sys import os # Add the project root to the Python path sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..'))) main() ================================================ FILE: api/utils.py ================================================ import json from typing import Dict, Any, List, Optional from langchain_core.messages import BaseMessage, AIMessage, HumanMessage, ToolMessage from langgraph.types import StateSnapshot def checkpoint_event(value): """Create a checkpoint event for the client.""" def format_values(values: dict): formatted_values = values.copy() if "messages" in formatted_values: formatted_values["messages"] = [ { "type": msg.get("type") if isinstance(msg, dict) else msg.type, "content": msg.get("content") if isinstance(msg, dict) else msg.content, "id": msg.get("id") if isinstance(msg, dict) else msg.id, "tool_calls": msg.get("tool_calls") if isinstance(msg, dict) else (msg.tool_calls if hasattr(msg, 'tool_calls') else None) } for msg in formatted_values["messages"] ] return formatted_values def format_writes(writes: dict): if writes is None: return None formatted_writes = {} for key, value in writes.items(): if isinstance(value, dict): formatted_writes[key] = format_values(value) elif isinstance(value, list): formatted_writes[key] = [format_values(item) if isinstance( item, dict) else item for item in value] else: formatted_writes[key] = value return formatted_writes configurable = value["payload"]["config"]["configurable"] data = { "next": value["payload"]["next"], "values": format_values(value["payload"]["values"]), "config": { "configurable": { "checkpoint_id": configurable["checkpoint_id"], "checkpoint_ns": configurable["checkpoint_ns"], "thread_id": configurable["thread_id"] } }, "metadata": { "source": value["payload"]["metadata"]["source"], "step": value["payload"]["metadata"]["step"], "writes": format_writes(value["payload"]["metadata"]["writes"]), "parents": value["payload"]["metadata"]["parents"] } } return { "event": "checkpoint", "data": json.dumps(data) } def message_chunk_event(node_name, message_chunk): """Create a message chunk event for the client.""" def format_messages(value): """Format message chunk into a serializable dictionary. This is needed because the message class is not serializable.
""" return { "content": value.content, "id": value.id, "tool_calls": value.tool_calls if hasattr(value, 'tool_calls') else None, "tool_call_chunks": value.tool_call_chunks if hasattr(value, 'tool_call_chunks') else None } return { "event": "message_chunk", "data": json.dumps({ "node_name": node_name, "message_chunk": format_messages(message_chunk) }) } def interrupt_event(interrupts): """Create an interrupt event for the client.""" formatted_interrupts = [{"value": interrupt["value"]} for interrupt in interrupts] return { "event": "interrupt", "data": json.dumps(formatted_interrupts) } def custom_event(value): """Create a custom event for the client.""" return { "event": "custom", "data": json.dumps(value) } def format_state_snapshot(snapshot: StateSnapshot): interrupts = [] for task in snapshot.tasks: for interrupt in task.interrupts: interrupts.append({"value": interrupt.value}) return { "values": snapshot.values, "next": snapshot.next, "config": snapshot.config, "interrupts": interrupts, "parent_config": snapshot.parent_config, "metadata": snapshot.metadata } def stream_update_event(data: dict): """为 DeepResearch Agent 的 StreamUpdateData 创建一个 stream_update 事件。 Args: data: 从 add_stream_update 产生的、符合 StreamUpdateData 结构的字典。 Returns: 符合 SSE EventSourceResponse 格式的字典。 """ if not isinstance(data, dict): # 如果传入的不是字典,返回一个错误事件 return { "event": "error", "data": json.dumps({"message": "Internal server error: Invalid stream update data type."}) } return { "event": "stream_update", "data": json.dumps(data, default=str) } ================================================ FILE: core/__init__.py ================================================ # Core module initialization ================================================ FILE: core/a2a/README.md ================================================ # Mentis A2A (Agent2Agent) 协议集成 本目录 (`core/a2a/`) 包含用于实现 Agent2Agent (A2A) 协议的客户端和服务器实现,使 Mentis Agents 能够与其他支持 A2A 协议的代理系统进行通信和协作。 ## 背景 A2A 是由 Google 发起的开放标准,旨在使不同框架(如 LangGraph、CrewAI、Google ADK、Genkit)或不同供应商构建的 AI 代理能够发现彼此的能力,协商交互模式(文本、文件、数据等),并在任务上进行协作。 ## 核心组件 ### 1. A2A 客户端 (`A2AClient`) `A2AClient` 类(位于 `client/client.py`)提供了与支持 A2A 协议的服务器进行交互的功能: * **代理发现:** 支持通过 `.well-known/agent.json` 端点自动发现代理能力(Agent Card)。 * **任务管理:** 提供发送、获取和取消任务的方法。 * **推送通知:** 支持设置和获取任务的推送通知配置。 * **流式响应:** 支持通过流式API接收任务执行的实时更新。 * **异步架构:** 基于 `asyncio` 和 `httpx` 构建,适合异步应用。 ### 2. A2A 服务器 (`A2AServer`) `A2AServer` 类(位于 `server/server.py`)允许将现有的 Mentis Agent 暴露为支持 A2A 协议的服务: * **基于 Starlette:** 使用 Starlette 框架提供 HTTP 和 SSE 端点。 * **任务处理:** 支持任务的创建、执行和状态跟踪。 * **流式更新:** 通过 Server-Sent Events (SSE) 提供任务执行的实时更新。 * **Agent Card:** 通过 `.well-known/agent.json` 端点公开代理能力。 ### 3. 辅助工具 #### 推送通知认证 (`PushNotificationAuth`) `PushNotificationAuth` 类(位于 `utils/push_notification_auth.py`)提供了安全的推送通知机制: * **发送方认证 (`PushNotificationSenderAuth`):** - 生成和管理 JWT 密钥对 - 验证推送通知 URL - 签名并发送推送通知 - 提供 JWKS 端点供接收方获取公钥 * **接收方认证 (`PushNotificationReceiverAuth`):** - 从 JWKS URL 加载公钥 - 验证接收到的推送通知的完整性和时效性 - 防止重放攻击 #### 内存缓存 (`InMemoryCache`) `InMemoryCache` 类(位于 `utils/in_memory_cache.py`)提供了线程安全的内存缓存实现: * **单例模式:** 确保应用中只有一个缓存实例 * **TTL 支持:** 支持设置缓存项的过期时间 * **线程安全:** 使用锁机制确保并发安全 ## 数据类型 A2A 协议定义了几个关键数据类型(位于 `types.py`): * **AgentCard:** 描述代理的元数据,包括名称、描述、URL、能力和技能。 * **Task:** 表示代理执行的任务,包含状态、内容和产物。 * **Part:** 内容的一部分,可以是文本、文件或数据。 * **Artifact:** 代理产生的产物,如结果、生成的文件等。 * **TaskState:** 任务状态枚举(已提交、进行中、需要输入、已完成、已取消、失败)。 * **PushNotificationConfig:** 推送通知配置,包含回调URL和认证信息。 ## 如何使用 ### 1. 
================================================ FILE: core/__init__.py ================================================ # Core module initialization ================================================ FILE: core/a2a/README.md ================================================ # Mentis A2A (Agent2Agent) Protocol Integration This directory (`core/a2a/`) contains the client and server implementations of the Agent2Agent (A2A) protocol, enabling Mentis agents to communicate and collaborate with other agent systems that support A2A. ## Background A2A is an open standard initiated by Google. It lets AI agents built on different frameworks (such as LangGraph, CrewAI, Google ADK, Genkit) or by different vendors discover each other's capabilities, negotiate interaction modes (text, files, data, etc.), and collaborate on tasks. ## Core Components ### 1. A2A Client (`A2AClient`) The `A2AClient` class (in `client/client.py`) interacts with servers that support the A2A protocol: * **Agent discovery:** resolves agent capabilities (the Agent Card) automatically via the `.well-known/agent.json` endpoint. * **Task management:** methods to send, fetch, and cancel tasks. * **Push notifications:** set and get a task's push notification configuration. * **Streaming responses:** receive real-time task updates through the streaming API. * **Async architecture:** built on `asyncio` and `httpx`, suited to async applications. ### 2. A2A Server (`A2AServer`) The `A2AServer` class (in `server/server.py`) exposes an existing Mentis agent as an A2A-compliant service: * **Starlette-based:** serves HTTP and SSE endpoints with the Starlette framework. * **Task handling:** supports task creation, execution, and status tracking. * **Streaming updates:** real-time task updates over Server-Sent Events (SSE). * **Agent Card:** publishes agent capabilities at the `.well-known/agent.json` endpoint. ### 3. Utilities #### Push Notification Auth (`PushNotificationAuth`) The classes in `utils/push_notification_auth.py` provide a secure push notification mechanism: * **Sender auth (`PushNotificationSenderAuth`):** - generates and manages JWT key pairs - verifies push notification URLs - signs and sends push notifications - exposes a JWKS endpoint so receivers can fetch the public key * **Receiver auth (`PushNotificationReceiverAuth`):** - loads public keys from a JWKS URL - verifies the integrity and freshness of incoming push notifications - prevents replay attacks #### In-Memory Cache (`InMemoryCache`) The `InMemoryCache` class (in `utils/in_memory_cache.py`) is a thread-safe in-memory cache: * **Singleton:** guarantees a single cache instance per application * **TTL support:** entries can be given an expiry time * **Thread safety:** uses locking for safe concurrent access ## Data Types The A2A protocol defines several key data types (in `types.py`): * **AgentCard:** agent metadata, including name, description, URL, capabilities, and skills. * **Task:** a task executed by an agent, with status, content, and artifacts. * **Part:** one piece of content; can be text, a file, or data. * **Artifact:** something the agent produced, such as results or generated files. * **TaskState:** the task state enum (submitted, working, input required, completed, canceled, failed). * **PushNotificationConfig:** push notification configuration, with callback URL and auth info. ## How to Use ### 1. Creating and Using the A2A Client ```python import asyncio from core.a2a.types import AgentCard from core.a2a.client.client import A2AClient async def main(): # Option 1: create the client directly from a URL client = A2AClient(url="http://localhost:8000/a2a") # Send a task response = await client.send_task({"text": "Please research artificial intelligence for me"}) task_id = response.result.id # Fetch the task result task_response = await client.get_task({"id": task_id}) # Configure push notifications await client.set_task_callback({ "taskId": task_id, "callbackUrl": "https://your-callback-url.com/webhook" }) # Option 2: create the client from an Agent Card agent_card = AgentCard(name="Example Agent", url="http://localhost:8000/a2a") client = A2AClient(agent_card=agent_card) # Receive real-time updates through the streaming API async for update in client.send_task_streaming({"text": "Analyze the latest AI trends"}): print(update) # Run asyncio.run(main()) ``` ### 2. Creating an A2A Server ```python from core.a2a.server.server import A2AServer from core.a2a.server.task_manager import InMemoryTaskManager from core.a2a.types import AgentCard # Create the agent card agent_card = AgentCard( name="My Agent", description="An example agent", url="http://localhost:5000" ) # Create the task manager task_manager = InMemoryTaskManager() # Create the server server = A2AServer( host="0.0.0.0", port=5000, endpoint="/", agent_card=agent_card, task_manager=task_manager ) # Start the server server.start() ```
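Note that `InMemoryTaskManager` still leaves `on_send_task` and `on_send_task_subscribe` abstract (see `server/task_manager.py` below), so in practice you plug an agent in through `AgentTaskManager`. A sketch, assuming a stand-in agent exposing the `invoke`/`stream` interface and `SUPPORTED_CONTENT_TYPES` attribute that `AgentTaskManager` actually calls; the `AgentCard` field set mirrors the example above and may need more fields depending on `types.py`:

```python
# Sketch: expose a (LangGraph-backed) agent as an A2A service via AgentTaskManager.
from core.a2a.agent_task_manager import AgentTaskManager
from core.a2a.server.server import A2AServer
from core.a2a.types import AgentCard


class EchoAgent:
    """Stand-in agent; replace the bodies with real graph invocations."""
    SUPPORTED_CONTENT_TYPES = ["text"]

    def invoke(self, query: str, session_id: str) -> str:
        return f"echo: {query}"

    async def stream(self, query: str, session_id: str):
        # AgentTaskManager consumes dicts with exactly these three keys.
        yield {"is_task_complete": False, "require_user_input": False, "content": "working..."}
        yield {"is_task_complete": True, "require_user_input": False, "content": f"echo: {query}"}


agent_card = AgentCard(name="Echo Agent", description="A stand-in echo agent", url="http://localhost:5000")
server = A2AServer(
    host="0.0.0.0",
    port=5000,
    agent_card=agent_card,
    task_manager=AgentTaskManager(agent=EchoAgent()),
)
server.start()
```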
### 3. Configuring Push Notifications #### Sender configuration ```python from core.a2a.utils.push_notification_auth import PushNotificationSenderAuth # Create the sender-side auth sender_auth = PushNotificationSenderAuth() # Generate a key pair sender_auth.generate_jwk() # Add the JWKS endpoint to your server app.add_route("/.well-known/jwks.json", sender_auth.handle_jwks_endpoint) # Verify the receiver URL is_valid = await sender_auth.verify_push_notification_url("https://receiver-url.com/webhook") # Send a push notification if is_valid: await sender_auth.send_push_notification( "https://receiver-url.com/webhook", {"event": "task_completed", "taskId": "123"} ) ``` #### Receiver configuration ```python from core.a2a.utils.push_notification_auth import PushNotificationReceiverAuth from starlette.requests import Request # Create the receiver-side auth receiver_auth = PushNotificationReceiverAuth() # Load the sender's public keys await receiver_auth.load_jwks("https://sender-url.com/.well-known/jwks.json") # Verify push notifications inside your webhook handler async def webhook_handler(request: Request): is_valid = await receiver_auth.verify_push_notification(request) if is_valid: # Handle the push notification... data = await request.json() print(f"Received a valid push notification: {data}") ``` ### 4. Using the In-Memory Cache ```python from core.a2a.utils.in_memory_cache import InMemoryCache # Get the cache instance cache = InMemoryCache() # Set a cache entry (with a TTL) cache.set("api_result", {"data": "some_value"}, ttl=300) # expires in 5 minutes # Get a cache entry result = cache.get("api_result") if result: print(f"Fetched result from cache: {result}") else: print("Cache entry expired or missing") # Delete a cache entry cache.delete("api_result") # Clear the whole cache cache.clear() ``` ## Complete Example See `examples/16_a2a_integration_test.py` for a complete integration example, covering: 1. creating an A2A server that exposes an existing agent as an A2A service 2. connecting to the A2A server with an A2A client 3. building an agent that uses the A2A client as a tool Run the examples: ```bash # Start the A2A server python -m examples.16_a2a_integration_test server # Run the A2A client python -m examples.16_a2a_integration_test client # Run the agent with the A2A tool python -m examples.16_a2a_integration_test agent ``` ## Relationship with MCP Mentis supports both MCP (Model Context Protocol) and A2A (Agent2Agent): * **MCP:** focuses on the interaction between AI models and external tools/services, mainly extending a single agent's capabilities. * **A2A:** focuses on communication and collaboration between different agents, letting multiple agents work together. The two protocols are complementary and can be combined to build powerful agent systems. ================================================ FILE: core/a2a/__init__.py ================================================ ================================================ FILE: core/a2a/agent_task_manager.py ================================================ import asyncio import logging import traceback from typing import Dict, Any, Union, AsyncIterable, Optional from core.a2a.types import ( TaskState, TaskStatus, Task, Artifact, Message, TextPart, SendTaskRequest, SendTaskResponse, GetTaskRequest, GetTaskResponse, CancelTaskRequest, CancelTaskResponse, SendTaskStreamingRequest, SendTaskStreamingResponse, SetTaskPushNotificationRequest, SetTaskPushNotificationResponse, GetTaskPushNotificationRequest, GetTaskPushNotificationResponse, TaskResubscriptionRequest, TaskSendParams, JSONRPCResponse, InvalidParamsError, TaskNotFoundError, TaskNotCancelableError, PushNotificationNotSupportedError, TaskArtifactUpdateEvent, TaskStatusUpdateEvent, InternalError, TaskIdParams, PushNotificationConfig ) from core.a2a.server.task_manager import TaskManager, InMemoryTaskManager from core.a2a.server import utils logger = logging.getLogger(__name__) class AgentTaskManager(InMemoryTaskManager): """ AgentTaskManager is the key component that connects a LangGraph agent to the A2A protocol. It manages the task lifecycle, handles streaming responses, updates task status, and sends push notifications. """ def __init__(self, agent, notification_sender_auth=None): """ Initialize the AgentTaskManager Args: agent: the LangGraph agent instance notification_sender_auth: push notification auth (optional) """ super().__init__() self.agent = agent self.notification_sender_auth = notification_sender_auth async def _run_streaming_agent(self, request: SendTaskStreamingRequest): """ Run the streaming agent and handle its responses Args: request: the streaming task request """ task_send_params: TaskSendParams = request.params query = self._get_user_query(task_send_params) try: async for item in self.agent.stream(query, task_send_params.sessionId): is_task_complete = item["is_task_complete"] require_user_input = item["require_user_input"] artifact = None message = None parts = [{"type": "text", "text": item["content"]}] end_stream = False if not is_task_complete and not require_user_input: task_state = TaskState.WORKING message = Message(role="agent", parts=parts) elif require_user_input: task_state = TaskState.INPUT_REQUIRED message = Message(role="agent", parts=parts) end_stream = True else: task_state = TaskState.COMPLETED artifact = Artifact(parts=parts, index=0, append=False) end_stream = True task_status = TaskStatus(state=task_state, message=message) latest_task = await self.update_store( task_send_params.id, task_status, None if artifact is None else [artifact], ) await self.send_task_notification(latest_task) if artifact: task_artifact_update_event = TaskArtifactUpdateEvent( id=task_send_params.id, artifact=artifact ) await self.enqueue_events_for_sse( task_send_params.id, task_artifact_update_event ) task_update_event = TaskStatusUpdateEvent( id=task_send_params.id, status=task_status, final=end_stream ) await self.enqueue_events_for_sse( task_send_params.id, task_update_event ) except Exception as e: logger.error(f"An error occurred while streaming the response: {e}") await
self.enqueue_events_for_sse( task_send_params.id, InternalError(message=f"An error occurred while streaming the response: {e}") ) def _get_user_query(self, task_send_params: TaskSendParams) -> str: """ Extract the user query from the task parameters (using the Google demo's strict approach) Args: task_send_params: the task send parameters Returns: str: the user query text """ if not task_send_params.message or not task_send_params.message.parts: logger.warning(f"[_get_user_query] Message or parts are empty for task {task_send_params.id}") return "" # or raise an error, depending on your design # Grab the first part directly part = task_send_params.message.parts[0] logger.debug(f"[_get_user_query] First part: type={type(part)}, value={part!r}") # keep this debug log # Strictly check that the first part is a TextPart instance if not isinstance(part, TextPart): logger.error(f"[_get_user_query] First part is not a TextPart instance! Type: {type(part)}") # Raise immediately: this aborts the flow with a clear message raise ValueError(f"Expected first message part to be TextPart, but got {type(part)}") # The check passed: return the text logger.debug(f"[_get_user_query] Extracted query from TextPart: '{part.text}'") return part.text def _validate_request( self, request: Union[SendTaskRequest, SendTaskStreamingRequest] ) -> JSONRPCResponse | None: """ Validate the request parameters Args: request: the task request Returns: JSONRPCResponse | None: an error response, or None """ task_send_params: TaskSendParams = request.params if not utils.are_modalities_compatible( task_send_params.acceptedOutputModes, self.agent.SUPPORTED_CONTENT_TYPES ): logger.warning( "Unsupported output mode. Received %s, Support %s", task_send_params.acceptedOutputModes, self.agent.SUPPORTED_CONTENT_TYPES, ) return utils.new_incompatible_types_error(request.id) if task_send_params.pushNotification and not task_send_params.pushNotification.url: logger.warning("Push notification URL is missing") return JSONRPCResponse(id=request.id, error=InvalidParamsError(message="Push notification URL is missing")) return None async def on_send_task(self, request: SendTaskRequest) -> SendTaskResponse: """ Handle a send-task request Args: request: the task request Returns: SendTaskResponse: the task response """ validation_error = self._validate_request(request) if validation_error: return SendTaskResponse(id=request.id, error=validation_error.error) if request.params.pushNotification: if not await self.set_push_notification_info(request.params.id, request.params.pushNotification): return SendTaskResponse(id=request.id, error=InvalidParamsError(message="Push notification URL is invalid")) await self.upsert_task(request.params) task = await self.update_store( request.params.id, TaskStatus(state=TaskState.WORKING), None ) await self.send_task_notification(task) task_send_params: TaskSendParams = request.params query = self._get_user_query(task_send_params) try: agent_response = self.agent.invoke(query, task_send_params.sessionId) # Process the agent response and update the task status parts = [{"type": "text", "text": agent_response}] artifact = Artifact(parts=parts, index=0, append=False) task = await self.update_store( task_send_params.id, TaskStatus(state=TaskState.COMPLETED), [artifact] ) await self.send_task_notification(task) return SendTaskResponse(id=request.id, result=task) except Exception as e: # Log the failure with full context before reporting it logger.error(f"Error during agent invocation or task processing: {e}", exc_info=True) # Record the failed state try: # Make sure the status is updated even inside the exception handler task_failed : Task = await self.update_store( task_send_params.id, TaskStatus(state=TaskState.FAILED, error={"message": str(e)}), None ) await self.send_task_notification(task_failed) except Exception as update_err: # If updating the status also fails, log that too logger.error(f"Failed to update task status to FAILED after initial error: {update_err}", exc_info=True) # Return a more appropriate error type and message # return SendTaskResponse(id=request.id, error=InvalidParamsError(message=f"Error processing task: {e}")) # InternalError fits better, since the failure happened inside the server's own processing
return SendTaskResponse(id=request.id, error=InternalError(message=f"Error processing task: {str(e) or type(e).__name__}")) async def on_send_task_subscribe( self, request: SendTaskStreamingRequest ) -> AsyncIterable[SendTaskStreamingResponse] | JSONRPCResponse: """ Handle a streaming task request Args: request: the streaming task request Returns: AsyncIterable[SendTaskStreamingResponse] | JSONRPCResponse: a stream of responses, or an error """ try: error = self._validate_request(request) if error: return error await self.upsert_task(request.params) if request.params.pushNotification: if not await self.set_push_notification_info(request.params.id, request.params.pushNotification): return JSONRPCResponse(id=request.id, error=InvalidParamsError(message="Push notification URL is invalid")) task_send_params: TaskSendParams = request.params sse_event_queue = await self.setup_sse_consumer(task_send_params.id, False) asyncio.create_task(self._run_streaming_agent(request)) return self.dequeue_events_for_sse( request.id, task_send_params.id, sse_event_queue ) except Exception as e: logger.error(f"Error in SSE stream: {e}") print(traceback.format_exc()) return JSONRPCResponse( id=request.id, error=InternalError( message="An error occurred while streaming the response" ), ) async def _process_agent_response( self, request: SendTaskRequest, agent_response: dict ) -> SendTaskResponse: """Processes the agent's response and updates the task store.""" task_send_params: TaskSendParams = request.params task_id = task_send_params.id history_length = task_send_params.historyLength task_status = None parts = [{"type": "text", "text": agent_response["content"]}] artifact = None if agent_response["require_user_input"]: task_status = TaskStatus( state=TaskState.INPUT_REQUIRED, message=Message(role="agent", parts=parts), ) else: task_status = TaskStatus(state=TaskState.COMPLETED) artifact = Artifact(parts=parts) task = await self.update_store( task_id, task_status, None if artifact is None else [artifact] ) task_result = self.append_task_history(task, history_length) await self.send_task_notification(task) return SendTaskResponse(id=request.id, result=task_result) async def on_resubscribe_to_task( self, request: TaskResubscriptionRequest ) -> AsyncIterable[SendTaskStreamingResponse] | JSONRPCResponse: task_id_params: TaskIdParams = request.params try: sse_event_queue = await self.setup_sse_consumer(task_id_params.id, True) return self.dequeue_events_for_sse(request.id, task_id_params.id, sse_event_queue) except Exception as e: logger.error(f"Error while reconnecting to SSE stream: {e}") return JSONRPCResponse( id=request.id, error=InternalError( message=f"An error occurred while reconnecting to stream: {e}" ), ) async def send_task_notification(self, task: Task): if not await self.has_push_notification_info(task.id): logger.info(f"No push notification info found for task {task.id}") return push_info = await self.get_push_notification_info(task.id) logger.info(f"Notifying for task {task.id} => {task.status.state}") await self.notification_sender_auth.send_push_notification( push_info.url, data=task.model_dump(exclude_none=True) ) async def set_push_notification_info(self, task_id: str, push_notification_config: PushNotificationConfig): # Verify the ownership of notification URL by issuing a challenge request.
if self.notification_sender_auth: is_verified = await self.notification_sender_auth.verify_push_notification_url(push_notification_config.url) if not is_verified: return False await super().set_push_notification_info(task_id, push_notification_config) return True ================================================ FILE: core/a2a/client/__init__.py ================================================ ================================================ FILE: core/a2a/client/card_resolver.py ================================================ import httpx from core.a2a.types import ( AgentCard, A2AClientJSONError, ) import json class A2ACardResolver: def __init__(self, base_url, agent_card_path="/.well-known/agent.json"): self.base_url = base_url.rstrip("/") self.agent_card_path = agent_card_path.lstrip("/") def get_agent_card(self) -> AgentCard: with httpx.Client() as client: response = client.get(self.base_url + "/" + self.agent_card_path) response.raise_for_status() try: return AgentCard(**response.json()) except json.JSONDecodeError as e: raise A2AClientJSONError(str(e)) from e ================================================ FILE: core/a2a/client/client.py ================================================ import httpx from httpx_sse import connect_sse from typing import Any, AsyncIterable from core.a2a.types import ( AgentCard, GetTaskRequest, SendTaskRequest, SendTaskResponse, JSONRPCRequest, GetTaskResponse, CancelTaskResponse, CancelTaskRequest, SetTaskPushNotificationRequest, SetTaskPushNotificationResponse, GetTaskPushNotificationRequest, GetTaskPushNotificationResponse, A2AClientHTTPError, A2AClientJSONError, SendTaskStreamingRequest, SendTaskStreamingResponse, ) import json class A2AClient: def __init__(self, agent_card: AgentCard = None, url: str = None): if agent_card: self.url = agent_card.url elif url: self.url = url else: raise ValueError("Must provide either agent_card or url") async def send_task(self, payload: dict[str, Any]) -> SendTaskResponse: request = SendTaskRequest(params=payload) return SendTaskResponse(**await self._send_request(request)) async def send_task_streaming( self, payload: dict[str, Any] ) -> AsyncIterable[SendTaskStreamingResponse]: request = SendTaskStreamingRequest(params=payload) with httpx.Client(timeout=None) as client: with connect_sse( client, "POST", self.url, json=request.model_dump() ) as event_source: try: for sse in event_source.iter_sse(): yield SendTaskStreamingResponse(**json.loads(sse.data)) except json.JSONDecodeError as e: raise A2AClientJSONError(str(e)) from e except httpx.RequestError as e: raise A2AClientHTTPError(400, str(e)) from e async def _send_request(self, request: JSONRPCRequest) -> dict[str, Any]: async with httpx.AsyncClient() as client: try: # Image generation could take time, adding timeout response = await client.post( self.url, json=request.model_dump(), timeout=30 ) response.raise_for_status() return response.json() except httpx.HTTPStatusError as e: raise A2AClientHTTPError(e.response.status_code, str(e)) from e except json.JSONDecodeError as e: raise A2AClientJSONError(str(e)) from e async def get_task(self, payload: dict[str, Any]) -> GetTaskResponse: request = GetTaskRequest(params=payload) return GetTaskResponse(**await self._send_request(request)) async def cancel_task(self, payload: dict[str, Any]) -> CancelTaskResponse: request = CancelTaskRequest(params=payload) return CancelTaskResponse(**await self._send_request(request)) async def set_task_callback( self, payload: dict[str, Any] ) -> SetTaskPushNotificationResponse: 
request = SetTaskPushNotificationRequest(params=payload) return SetTaskPushNotificationResponse(**await self._send_request(request)) async def get_task_callback( self, payload: dict[str, Any] ) -> GetTaskPushNotificationResponse: request = GetTaskPushNotificationRequest(params=payload) return GetTaskPushNotificationResponse(**await self._send_request(request)) ================================================ FILE: core/a2a/config.json ================================================ { "local_agent": { "url": "http://127.0.0.1:8000/", "auth": { "type": "none" } } } ================================================ FILE: core/a2a/server/__init__.py ================================================ ================================================ FILE: core/a2a/server/server.py ================================================ # core/a2a/server/server.py from starlette.applications import Starlette from starlette.responses import JSONResponse from sse_starlette.sse import EventSourceResponse from starlette.requests import Request from starlette.middleware import Middleware from starlette.middleware.cors import CORSMiddleware # --- import Pydantic's ValidationError --- from pydantic import ValidationError # --- end import --- from core.a2a.types import ( A2ARequest, JSONRPCResponse, JSONRPCError, # referenced by _handle_exception below InvalidRequestError, JSONParseError, GetTaskRequest, CancelTaskRequest, SendTaskRequest, SetTaskPushNotificationRequest, GetTaskPushNotificationRequest, InternalError, AgentCard, TaskResubscriptionRequest, SendTaskStreamingRequest, MethodNotFoundError, # make sure Pydantic's ValidationError is NOT imported from here ) import json from typing import AsyncIterable, Any, Optional, Union from core.a2a.server.task_manager import TaskManager import logging logger = logging.getLogger(__name__) class A2AServer: def __init__( self, host="0.0.0.0", port=5000, endpoint="/", agent_card: AgentCard = None, task_manager: TaskManager = None, allowed_origins: Optional[list[str]] = None, ): self.host = host self.port = port self.endpoint = endpoint self.task_manager = task_manager self.agent_card = agent_card if allowed_origins is None: # Default to localhost:3000 only, for local development allowed_origins = ["http://localhost:3000"] logger.warning("CORS allow_origins set to 'http://localhost:3000' for local development.") else: logger.info(f"CORS allow_origins configured: {allowed_origins}") middleware = [ Middleware( CORSMiddleware, allow_origins=allowed_origins, allow_credentials=True, allow_methods=["*"], allow_headers=["*"], ) ] self.app = Starlette(middleware=middleware, debug=True) self.app.add_route(self.endpoint, self._process_request, methods=["POST"]) self.app.add_route( "/.well-known/agent.json", self._get_agent_card, methods=["GET"] ) logger.info(f"A2AServer initialized.
Endpoint: {self.endpoint}, Agent Card Endpoint: /.well-known/agent.json") def start(self): if self.agent_card is None: raise ValueError("agent_card must be provided to A2AServer") if self.task_manager is None: raise ValueError("task_manager must be provided to A2AServer") import uvicorn logger.info(f"Starting Uvicorn server on {self.host}:{self.port}...") uvicorn.run(self.app, host=self.host, port=self.port) def _get_agent_card(self, request: Request) -> JSONResponse: logger.debug("Received request for /.well-known/agent.json") if not self.agent_card: logger.error("Agent card requested but not configured in A2AServer.") return JSONResponse({"error": "Agent card not configured"}, status_code=500) return JSONResponse(self.agent_card.model_dump(exclude_none=True)) async def _process_request(self, request: Request) -> Union[JSONResponse, EventSourceResponse]: result = None; json_rpc_request = None; request_id_for_error = None try: try: body = await request.json(); logger.debug(f"Received request body: {body}") except json.JSONDecodeError as e: logger.error(f"JSON decoding failed: {e}"); raise JSONParseError() try: json_rpc_request = A2ARequest.validate_python(body); request_id_for_error = getattr(json_rpc_request, 'id', None) logger.info(f"Processing valid A2A request: Method='{json_rpc_request.method}', ID='{request_id_for_error}', TaskID='{getattr(json_rpc_request.params, 'id', 'N/A')}'") except ValidationError as e: logger.error(f"A2A request validation failed: {e}"); req_id_fallback = body.get('id') if isinstance(body, dict) else None # Note: the InvalidRequestError raised here is caught by the except Exception handler below raise InvalidRequestError(data=json.loads(e.json())) from e # Dispatch to the TaskManager if isinstance(json_rpc_request, GetTaskRequest): result = await self.task_manager.on_get_task(json_rpc_request) elif isinstance(json_rpc_request, SendTaskRequest): result = await self.task_manager.on_send_task(json_rpc_request) elif isinstance(json_rpc_request, SendTaskStreamingRequest): result = await self.task_manager.on_send_task_subscribe(json_rpc_request) elif isinstance(json_rpc_request, CancelTaskRequest): result = await self.task_manager.on_cancel_task(json_rpc_request) elif isinstance(json_rpc_request, SetTaskPushNotificationRequest): result = await self.task_manager.on_set_task_push_notification(json_rpc_request) elif isinstance(json_rpc_request, GetTaskPushNotificationRequest): result = await self.task_manager.on_get_task_push_notification(json_rpc_request) elif isinstance(json_rpc_request, TaskResubscriptionRequest): result = await self.task_manager.on_resubscribe_to_task(json_rpc_request) else: logger.warning(f"Unhandled validated request type: {type(json_rpc_request)}"); raise MethodNotFoundError(data={"method": getattr(json_rpc_request, 'method', 'unknown')}) logger.debug(f"[A2AServer] Result from TaskManager method '{json_rpc_request.method}': type={type(result)}") return self._create_response(result) # build the response via _create_response except Exception as e: # Handle every exception raised during request processing (validation and task manager calls) in one place logger.error(f"Exception during request processing: {e}", exc_info=True) return self._handle_exception(e, request_id=request_id_for_error) # delegate to _handle_exception def _handle_exception(self, e: Exception, request_id: Optional[Union[str, int]] = None) -> JSONResponse: status_code = 500; json_rpc_error: Optional[JSONRPCError] = None if isinstance(e, JSONParseError): json_rpc_error = e; status_code = 400 elif isinstance(e, InvalidRequestError): json_rpc_error = e; status_code = 400 elif isinstance(e, MethodNotFoundError):
def _handle_exception(self, e: Exception, request_id: Optional[Union[str, int]] = None) -> JSONResponse: status_code = 500; json_rpc_error: Optional[JSONRPCError] = None if isinstance(e, JSONParseError): json_rpc_error = e; status_code = 400 elif isinstance(e, InvalidRequestError): json_rpc_error = e; status_code = 400 elif isinstance(e, MethodNotFoundError): json_rpc_error = e; status_code = 404 # or 501 # --- Pydantic's ValidationError can now be caught correctly --- elif isinstance(e, ValidationError): logger.warning(f"Pydantic Validation error caught in handler: {e}") error_data = str(e) try: error_data = json.loads(e.json()) except Exception: pass # a Pydantic validation error raised while handling the request is a flavor of InvalidRequestError; # if it happens while building the response it is closer to an InternalError json_rpc_error = InvalidRequestError(message="Request/Response data validation failed", data=error_data) status_code = 400 # treated as a malformed client request or a malformed handler result # --- end catch --- elif isinstance(e, ValueError) and "Unexpected result type" in str(e): logger.error(f"Internal error due to unexpected result type: {e}", exc_info=False) json_rpc_error = InternalError(message="Server error: Unexpected result type from handler.") status_code = 500 elif isinstance(e, NotImplementedError): logger.error(f"Method not implemented: {e}", exc_info=True) json_rpc_error = MethodNotFoundError(message=f"Method not implemented: {e}") status_code = 501 else: logger.error(f"Unhandled internal exception: {e}", exc_info=True) json_rpc_error = InternalError(message=f"An internal server error occurred: {type(e).__name__}") status_code = 500 response = JSONRPCResponse(id=request_id, error=json_rpc_error) logger.debug(f"Returning error response: {response.model_dump(exclude_none=True)}") return JSONResponse(response.model_dump(exclude_none=True), status_code=status_code)
def _create_response(self, result: Any) -> Union[JSONResponse, EventSourceResponse]: if isinstance(result, AsyncIterable): logger.debug("[A2AServer] Creating EventSourceResponse (text/event-stream)") async def event_generator(stream_result: AsyncIterable) -> AsyncIterable[dict[str, str]]: try: async for item in stream_result: if hasattr(item, 'model_dump_json'): json_data = item.model_dump_json(exclude_none=True) logger.debug(f"A2AServer yielding SSE data: {json_data}") yield {"data": json_data} else: logger.warning(f"Yielding non-Pydantic object in event stream: {type(item)}") yield {"data": json.dumps(str(item))} except Exception as gen_err: logger.error(f"Error during SSE event generation: {gen_err}", exc_info=True) try: # try to yield a standard JSON-RPC error event error_payload = JSONRPCResponse(id=None, error=InternalError(message=f"Streaming generation error: {gen_err}")) yield {"event": "error", "data": error_payload.model_dump_json(exclude_none=True)} except Exception as yield_err: logger.error(f"Failed to yield error event to SSE stream: {yield_err}", exc_info=True) return EventSourceResponse(event_generator(result)) elif isinstance(result, JSONRPCResponse): logger.debug("[A2AServer] Creating JSONResponse (application/json)") return JSONResponse(result.model_dump(exclude_none=True)) else: logger.error(f"Unexpected result type received by _create_response: {type(result)}") raise ValueError(f"Unexpected result type: {type(result)}")
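For reference, a full round-trip against this endpoint is a plain JSON-RPC 2.0 POST. A minimal sketch, assuming the server is listening on the URL from config.json; the request id, task id, and message text are illustrative:

    import httpx

    payload = {
        "jsonrpc": "2.0",
        "id": "req-1",            # illustrative request id
        "method": "tasks/send",   # dispatched to TaskManager.on_send_task
        "params": {
            "id": "task-1",       # illustrative task id
            "message": {"role": "user", "parts": [{"type": "text", "text": "Hello"}]},
        },
    }
    resp = httpx.post("http://127.0.0.1:8000/", json=payload)
    # a JSONRPCResponse: a Task under "result" on success, a JSONRPCError under "error" otherwise
    print(resp.json())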
================================================ FILE: core/a2a/server/task_manager.py ================================================
from abc import ABC, abstractmethod from typing import Union, AsyncIterable, List from core.a2a.types import Task from core.a2a.types import ( JSONRPCResponse, TaskIdParams, TaskQueryParams, GetTaskRequest, TaskNotFoundError, SendTaskRequest, CancelTaskRequest, TaskNotCancelableError, SetTaskPushNotificationRequest, GetTaskPushNotificationRequest, GetTaskResponse, CancelTaskResponse, SendTaskResponse, SetTaskPushNotificationResponse, GetTaskPushNotificationResponse, PushNotificationNotSupportedError, TaskSendParams, TaskStatus, TaskState, TaskResubscriptionRequest, SendTaskStreamingRequest, SendTaskStreamingResponse, Artifact, PushNotificationConfig, TaskStatusUpdateEvent, JSONRPCError, TaskPushNotificationConfig, InternalError, ) from core.a2a.server.utils import new_not_implemented_error import asyncio import logging logger = logging.getLogger(__name__)
class TaskManager(ABC):
@abstractmethod async def on_get_task(self, request: GetTaskRequest) -> GetTaskResponse: pass
@abstractmethod async def on_cancel_task(self, request: CancelTaskRequest) -> CancelTaskResponse: pass
@abstractmethod async def on_send_task(self, request: SendTaskRequest) -> SendTaskResponse: pass
@abstractmethod async def on_send_task_subscribe( self, request: SendTaskStreamingRequest ) -> Union[AsyncIterable[SendTaskStreamingResponse], JSONRPCResponse]: pass
@abstractmethod async def on_set_task_push_notification( self, request: SetTaskPushNotificationRequest ) -> SetTaskPushNotificationResponse: pass
@abstractmethod async def on_get_task_push_notification( self, request: GetTaskPushNotificationRequest ) -> GetTaskPushNotificationResponse: pass
@abstractmethod async def on_resubscribe_to_task( self, request: TaskResubscriptionRequest ) -> Union[AsyncIterable[SendTaskResponse], JSONRPCResponse]: pass
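Concrete servers implement this interface; InMemoryTaskManager below supplies the bookkeeping, so a subclass typically only needs on_send_task and on_send_task_subscribe. A minimal echo-style sketch, assuming the InMemoryTaskManager helpers defined below, with Message and TextPart imported from core.a2a.types; the class and its reply logic are illustrative, not part of the repo:

    class EchoTaskManager(InMemoryTaskManager):  # hypothetical example
        async def on_send_task(self, request: SendTaskRequest) -> SendTaskResponse:
            await self.upsert_task(request.params)  # record the incoming message
            # assume the first part is text; real agents would inspect all parts
            text = request.params.message.parts[0].text
            reply = Message(role="agent", parts=[TextPart(text=f"echo: {text}")])
            task = await self.update_store(
                request.params.id,
                TaskStatus(state=TaskState.COMPLETED, message=reply),
                artifacts=[],
            )
            return SendTaskResponse(id=request.id, result=task)

        async def on_send_task_subscribe(self, request):
            return new_not_implemented_error(request.id)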
class InMemoryTaskManager(TaskManager):
def __init__(self): self.tasks: dict[str, Task] = {} self.push_notification_infos: dict[str, PushNotificationConfig] = {} self.lock = asyncio.Lock() self.task_sse_subscribers: dict[str, List[asyncio.Queue]] = {} self.subscriber_lock = asyncio.Lock()
async def on_get_task(self, request: GetTaskRequest) -> GetTaskResponse: logger.info(f"Getting task {request.params.id}") task_query_params: TaskQueryParams = request.params async with self.lock: task = self.tasks.get(task_query_params.id) if task is None: return GetTaskResponse(id=request.id, error=TaskNotFoundError()) task_result = self.append_task_history( task, task_query_params.historyLength ) return GetTaskResponse(id=request.id, result=task_result)
async def on_cancel_task(self, request: CancelTaskRequest) -> CancelTaskResponse: logger.info(f"Cancelling task {request.params.id}") task_id_params: TaskIdParams = request.params async with self.lock: task = self.tasks.get(task_id_params.id) if task is None: return CancelTaskResponse(id=request.id, error=TaskNotFoundError()) return CancelTaskResponse(id=request.id, error=TaskNotCancelableError())
@abstractmethod async def on_send_task(self, request: SendTaskRequest) -> SendTaskResponse: pass
@abstractmethod async def on_send_task_subscribe( self, request: SendTaskStreamingRequest ) -> Union[AsyncIterable[SendTaskStreamingResponse], JSONRPCResponse]: pass
async def set_push_notification_info(self, task_id: str, notification_config: PushNotificationConfig): async with self.lock: task = self.tasks.get(task_id) if task is None: raise ValueError(f"Task not found for {task_id}") self.push_notification_infos[task_id] = notification_config
async def get_push_notification_info(self, task_id: str) -> PushNotificationConfig: async with self.lock: task = self.tasks.get(task_id) if task is None: raise ValueError(f"Task not found for {task_id}") return self.push_notification_infos[task_id]
async def has_push_notification_info(self, task_id: str) -> bool: async with self.lock: return task_id in self.push_notification_infos
async def on_set_task_push_notification( self, request: SetTaskPushNotificationRequest ) -> SetTaskPushNotificationResponse: logger.info(f"Setting task push notification {request.params.id}") task_notification_params: TaskPushNotificationConfig = request.params try: await self.set_push_notification_info(task_notification_params.id, task_notification_params.pushNotificationConfig) except Exception as e: logger.error(f"Error while setting push notification info: {e}") return SetTaskPushNotificationResponse( id=request.id, error=InternalError( message="An error occurred while setting push notification info" ), ) return SetTaskPushNotificationResponse(id=request.id, result=task_notification_params)
async def on_get_task_push_notification( self, request: GetTaskPushNotificationRequest ) -> GetTaskPushNotificationResponse: logger.info(f"Getting task push notification {request.params.id}") task_params: TaskIdParams = request.params try: notification_info = await self.get_push_notification_info(task_params.id) except Exception as e: logger.error(f"Error while getting push notification info: {e}") return GetTaskPushNotificationResponse( id=request.id, error=InternalError( message="An error occurred while getting push notification info" ), ) return GetTaskPushNotificationResponse(id=request.id, result=TaskPushNotificationConfig(id=task_params.id, pushNotificationConfig=notification_info))
async def upsert_task(self, task_send_params: TaskSendParams) -> Task: logger.info(f"Upserting task {task_send_params.id}") async with self.lock: task = self.tasks.get(task_send_params.id) if task is None: task = Task( id=task_send_params.id, sessionId=task_send_params.sessionId, status=TaskStatus(state=TaskState.SUBMITTED), history=[task_send_params.message], ) self.tasks[task_send_params.id] = task else: task.history.append(task_send_params.message) return task
async def on_resubscribe_to_task( self, request: TaskResubscriptionRequest ) -> Union[AsyncIterable[SendTaskStreamingResponse], JSONRPCResponse]: return new_not_implemented_error(request.id)
async def update_store( self, task_id: str, status: TaskStatus, artifacts: list[Artifact] ) -> Task: async with self.lock: try: task = self.tasks[task_id] except KeyError: logger.error(f"Task {task_id} not found for updating the task") raise ValueError(f"Task {task_id} not found") task.status = status if status.message is not None: task.history.append(status.message) if artifacts is not None: if task.artifacts is None: task.artifacts = [] task.artifacts.extend(artifacts) return task
def append_task_history(self, task: Task, historyLength: int | None): new_task = task.model_copy() if historyLength is not None and historyLength > 0: new_task.history = new_task.history[-historyLength:] else: new_task.history = [] return new_task
async def setup_sse_consumer(self, task_id: str, is_resubscribe: bool = False): async with self.subscriber_lock: if task_id not in self.task_sse_subscribers: if is_resubscribe: raise ValueError("Task not found for resubscription") else: self.task_sse_subscribers[task_id] = [] sse_event_queue = asyncio.Queue(maxsize=0) # <=0 is unlimited self.task_sse_subscribers[task_id].append(sse_event_queue) return sse_event_queue
async def enqueue_events_for_sse(self, task_id, task_update_event): async with self.subscriber_lock: if task_id not in self.task_sse_subscribers: return current_subscribers = self.task_sse_subscribers[task_id] for subscriber in current_subscribers: await subscriber.put(task_update_event)
async def dequeue_events_for_sse( self, request_id, task_id, sse_event_queue: asyncio.Queue ) -> AsyncIterable[SendTaskStreamingResponse] | JSONRPCResponse: try: while True: event = await sse_event_queue.get()
if isinstance(event, JSONRPCError): yield SendTaskStreamingResponse(id=request_id, error=event) break yield SendTaskStreamingResponse(id=request_id, result=event) if isinstance(event, TaskStatusUpdateEvent) and event.final: break finally: async with self.subscriber_lock: if task_id in self.task_sse_subscribers: self.task_sse_subscribers[task_id].remove(sse_event_queue)
================================================ FILE: core/a2a/server/utils.py ================================================
from core.a2a.types import ( JSONRPCResponse, ContentTypeNotSupportedError, UnsupportedOperationError, ) from typing import List
def are_modalities_compatible( server_output_modes: List[str], client_output_modes: List[str] ): """Modalities are compatible if either side leaves them unspecified (None or empty) or the two lists share at least one element.""" if client_output_modes is None or len(client_output_modes) == 0: return True if server_output_modes is None or len(server_output_modes) == 0: return True return any(x in server_output_modes for x in client_output_modes)
def new_incompatible_types_error(request_id): return JSONRPCResponse(id=request_id, error=ContentTypeNotSupportedError())
def new_not_implemented_error(request_id): return JSONRPCResponse(id=request_id, error=UnsupportedOperationError())
================================================ FILE: core/a2a/types.py ================================================
from typing import Union, Any from pydantic import BaseModel, Field, TypeAdapter from typing import Literal, List, Annotated, Optional from datetime import datetime from pydantic import model_validator, ConfigDict, field_serializer from uuid import uuid4 from enum import Enum from typing_extensions import Self
class TaskState(str, Enum): SUBMITTED = "submitted" WORKING = "working" INPUT_REQUIRED = "input-required" COMPLETED = "completed" CANCELED = "canceled" FAILED = "failed" UNKNOWN = "unknown"
class TextPart(BaseModel): type: Literal["text"] = "text" text: str metadata: dict[str, Any] | None = None
class FileContent(BaseModel): name: str | None = None mimeType: str | None = None bytes: str | None = None uri: str | None = None @model_validator(mode="after") def check_content(self) -> Self: if not (self.bytes or self.uri): raise ValueError("Either 'bytes' or 'uri' must be present in the file data") if self.bytes and self.uri: raise ValueError( "Only one of 'bytes' or 'uri' can be present in the file data" ) return self
class FilePart(BaseModel): type: Literal["file"] = "file" file: FileContent metadata: dict[str, Any] | None = None
class DataPart(BaseModel): type: Literal["data"] = "data" data: dict[str, Any] metadata: dict[str, Any] | None = None
Part = Annotated[Union[TextPart, FilePart, DataPart], Field(discriminator="type")]
class Message(BaseModel): role: Literal["user", "agent"] parts: List[Part] metadata: dict[str, Any] | None = None
class TaskStatus(BaseModel): state: TaskState message: Message | None = None timestamp: datetime = Field(default_factory=datetime.now) @field_serializer("timestamp") def serialize_dt(self, dt: datetime, _info): return dt.isoformat()
class Artifact(BaseModel): name: str | None = None description: str | None = None parts: List[Part] metadata: dict[str, Any] | None = None index: int = 0 append: bool | None = None lastChunk: bool | None = None
class Task(BaseModel): id: str sessionId: str | None = None status: TaskStatus artifacts: List[Artifact] | None = None history: List[Message] | None = None metadata: dict[str, Any] | None = None
class TaskStatusUpdateEvent(BaseModel): id:
str status: TaskStatus final: bool = False metadata: dict[str, Any] | None = None class TaskArtifactUpdateEvent(BaseModel): id: str artifact: Artifact metadata: dict[str, Any] | None = None class AuthenticationInfo(BaseModel): model_config = ConfigDict(extra="allow") schemes: List[str] credentials: str | None = None class PushNotificationConfig(BaseModel): url: str token: str | None = None authentication: AuthenticationInfo | None = None class TaskIdParams(BaseModel): id: str metadata: dict[str, Any] | None = None class TaskQueryParams(TaskIdParams): historyLength: int | None = None class TaskSendParams(BaseModel): id: str sessionId: str = Field(default_factory=lambda: uuid4().hex) message: Message acceptedOutputModes: Optional[List[str]] = None pushNotification: PushNotificationConfig | None = None historyLength: int | None = None metadata: dict[str, Any] | None = None class TaskPushNotificationConfig(BaseModel): id: str pushNotificationConfig: PushNotificationConfig ## RPC Messages class JSONRPCMessage(BaseModel): jsonrpc: Literal["2.0"] = "2.0" id: int | str | None = Field(default_factory=lambda: uuid4().hex) class JSONRPCRequest(JSONRPCMessage): method: str params: dict[str, Any] | None = None class JSONRPCError(BaseModel): code: int message: str data: Any | None = None class JSONRPCResponse(JSONRPCMessage): result: Any | None = None error: JSONRPCError | None = None class SendTaskRequest(JSONRPCRequest): method: Literal["tasks/send"] = "tasks/send" params: TaskSendParams class SendTaskResponse(JSONRPCResponse): result: Task | None = None class SendTaskStreamingRequest(JSONRPCRequest): method: Literal["tasks/sendSubscribe"] = "tasks/sendSubscribe" params: TaskSendParams class SendTaskStreamingResponse(JSONRPCResponse): result: TaskStatusUpdateEvent | TaskArtifactUpdateEvent | None = None class GetTaskRequest(JSONRPCRequest): method: Literal["tasks/get"] = "tasks/get" params: TaskQueryParams class GetTaskResponse(JSONRPCResponse): result: Task | None = None class CancelTaskRequest(JSONRPCRequest): method: Literal["tasks/cancel",] = "tasks/cancel" params: TaskIdParams class CancelTaskResponse(JSONRPCResponse): result: Task | None = None class SetTaskPushNotificationRequest(JSONRPCRequest): method: Literal["tasks/pushNotification/set",] = "tasks/pushNotification/set" params: TaskPushNotificationConfig class SetTaskPushNotificationResponse(JSONRPCResponse): result: TaskPushNotificationConfig | None = None class GetTaskPushNotificationRequest(JSONRPCRequest): method: Literal["tasks/pushNotification/get",] = "tasks/pushNotification/get" params: TaskIdParams class GetTaskPushNotificationResponse(JSONRPCResponse): result: TaskPushNotificationConfig | None = None class TaskResubscriptionRequest(JSONRPCRequest): method: Literal["tasks/resubscribe",] = "tasks/resubscribe" params: TaskIdParams A2ARequest = TypeAdapter( Annotated[ Union[ SendTaskRequest, GetTaskRequest, CancelTaskRequest, SetTaskPushNotificationRequest, GetTaskPushNotificationRequest, TaskResubscriptionRequest, SendTaskStreamingRequest, ], Field(discriminator="method"), ] ) ## Error types class JSONParseError(JSONRPCError): code: int = -32700 message: str = "Invalid JSON payload" data: Any | None = None class InvalidRequestError(JSONRPCError): code: int = -32600 message: str = "Request payload validation error" data: Any | None = None class MethodNotFoundError(JSONRPCError): code: int = -32601 message: str = "Method not found" data: None = None class InvalidParamsError(JSONRPCError): code: int = -32602 message: str = "Invalid 
parameters" data: Any | None = None class InternalError(JSONRPCError): code: int = -32603 message: str = "Internal error" data: Any | None = None class TaskNotFoundError(JSONRPCError): code: int = -32001 message: str = "Task not found" data: None = None class TaskNotCancelableError(JSONRPCError): code: int = -32002 message: str = "Task cannot be canceled" data: None = None class PushNotificationNotSupportedError(JSONRPCError): code: int = -32003 message: str = "Push Notification is not supported" data: None = None class UnsupportedOperationError(JSONRPCError): code: int = -32004 message: str = "This operation is not supported" data: None = None class ContentTypeNotSupportedError(JSONRPCError): code: int = -32005 message: str = "Incompatible content types" data: None = None class AgentProvider(BaseModel): organization: str url: str | None = None class AgentCapabilities(BaseModel): streaming: bool = False pushNotifications: bool = False stateTransitionHistory: bool = False class AgentAuthentication(BaseModel): schemes: List[str] credentials: str | None = None class AgentSkill(BaseModel): id: str name: str description: str | None = None tags: List[str] | None = None examples: List[str] | None = None inputModes: List[str] | None = None outputModes: List[str] | None = None class AgentCard(BaseModel): name: str description: str | None = None url: str provider: AgentProvider | None = None version: str documentationUrl: str | None = None capabilities: AgentCapabilities authentication: AgentAuthentication | None = None defaultInputModes: List[str] = ["text"] defaultOutputModes: List[str] = ["text"] skills: List[AgentSkill] class A2AClientError(Exception): pass class A2AClientHTTPError(A2AClientError): def __init__(self, status_code: int, message: str): self.status_code = status_code self.message = message super().__init__(f"HTTP Error {status_code}: {message}") class A2AClientJSONError(A2AClientError): def __init__(self, message: str): self.message = message super().__init__(f"JSON Error: {message}") class MissingAPIKeyError(Exception): """Exception for missing API key.""" pass ================================================ FILE: core/a2a/utils/__init__.py ================================================ ================================================ FILE: core/a2a/utils/in_memory_cache.py ================================================ """In Memory Cache utility.""" import threading import time from typing import Any, Dict, Optional class InMemoryCache: """A thread-safe Singleton class to manage cache data. Ensures only one instance of the cache exists across the application. """ _instance: Optional["InMemoryCache"] = None _lock: threading.Lock = threading.Lock() _initialized: bool = False def __new__(cls): """Override __new__ to control instance creation (Singleton pattern). Uses a lock to ensure thread safety during the first instantiation. Returns: The singleton instance of InMemoryCache. """ if cls._instance is None: with cls._lock: if cls._instance is None: cls._instance = super().__new__(cls) return cls._instance def __init__(self): """Initialize the cache storage. Uses a flag (_initialized) to ensure this logic runs only on the very first creation of the singleton instance. 
""" if not self._initialized: with self._lock: if not self._initialized: # print("Initializing SessionCache storage") self._cache_data: Dict[str, Dict[str, Any]] = {} self._ttl: Dict[str, float] = {} self._data_lock: threading.Lock = threading.Lock() self._initialized = True def set(self, key: str, value: Any, ttl: Optional[int] = None) -> None: """Set a key-value pair. Args: key: The key for the data. value: The data to store. ttl: Time to live in seconds. If None, data will not expire. """ with self._data_lock: self._cache_data[key] = value if ttl is not None: self._ttl[key] = time.time() + ttl else: if key in self._ttl: del self._ttl[key] def get(self, key: str, default: Any = None) -> Any: """Get the value associated with a key. Args: key: The key for the data within the session. default: The value to return if the session or key is not found. Returns: The cached value, or the default value if not found. """ with self._data_lock: if key in self._ttl and time.time() > self._ttl[key]: del self._cache_data[key] del self._ttl[key] return default return self._cache_data.get(key, default) def delete(self, key: str) -> None: """Delete a specific key-value pair from a cache. Args: key: The key to delete. Returns: True if the key was found and deleted, False otherwise. """ with self._data_lock: if key in self._cache_data: del self._cache_data[key] if key in self._ttl: del self._ttl[key] return True return False def clear(self) -> bool: """Remove all data. Returns: True if the data was cleared, False otherwise. """ with self._data_lock: self._cache_data.clear() self._ttl.clear() return True return False ================================================ FILE: core/a2a/utils/push_notification_auth.py ================================================ from jwcrypto import jwk import uuid from starlette.responses import JSONResponse from starlette.requests import Request from typing import Any import jwt import time import json import hashlib import httpx import logging from jwt import PyJWK, PyJWKClient logger = logging.getLogger(__name__) AUTH_HEADER_PREFIX = 'Bearer ' class PushNotificationAuth: def _calculate_request_body_sha256(self, data: dict[str, Any]): """Calculates the SHA256 hash of a request body. This logic needs to be same for both the agent who signs the payload and the client verifier. """ body_str = json.dumps( data, ensure_ascii=False, allow_nan=False, indent=None, separators=(",", ":"), ) return hashlib.sha256(body_str.encode()).hexdigest() class PushNotificationSenderAuth(PushNotificationAuth): def __init__(self): self.public_keys = [] self.private_key_jwk: PyJWK = None @staticmethod async def verify_push_notification_url(url: str) -> bool: async with httpx.AsyncClient(timeout=10) as client: try: validation_token = str(uuid.uuid4()) response = await client.get( url, params={"validationToken": validation_token} ) response.raise_for_status() is_verified = response.text == validation_token logger.info(f"Verified push-notification URL: {url} => {is_verified}") return is_verified except Exception as e: logger.warning(f"Error during sending push-notification for URL {url}: {e}") return False def generate_jwk(self): key = jwk.JWK.generate(kty='RSA', size=2048, kid=str(uuid.uuid4()), use="sig") self.public_keys.append(key.export_public(as_dict=True)) self.private_key_jwk = PyJWK.from_json(key.export_private()) def handle_jwks_endpoint(self, _request: Request): """Allow clients to fetch public keys. 
""" return JSONResponse({ "keys": self.public_keys }) def _generate_jwt(self, data: dict[str, Any]): """JWT is generated by signing both the request payload SHA digest and time of token generation. Payload is signed with private key and it ensures the integrity of payload for client. Including iat prevents from replay attack. """ iat = int(time.time()) return jwt.encode( {"iat": iat, "request_body_sha256": self._calculate_request_body_sha256(data)}, key=self.private_key_jwk, headers={"kid": self.private_key_jwk.key_id}, algorithm="RS256" ) async def send_push_notification(self, url: str, data: dict[str, Any]): jwt_token = self._generate_jwt(data) headers = {'Authorization': f"Bearer {jwt_token}"} async with httpx.AsyncClient(timeout=10) as client: try: response = await client.post( url, json=data, headers=headers ) response.raise_for_status() logger.info(f"Push-notification sent for URL: {url}") except Exception as e: logger.warning(f"Error during sending push-notification for URL {url}: {e}") class PushNotificationReceiverAuth(PushNotificationAuth): def __init__(self): self.public_keys_jwks = [] self.jwks_client = None async def load_jwks(self, jwks_url: str): self.jwks_client = PyJWKClient(jwks_url) async def verify_push_notification(self, request: Request) -> bool: auth_header = request.headers.get("Authorization") if not auth_header or not auth_header.startswith(AUTH_HEADER_PREFIX): print("Invalid authorization header") return False token = auth_header[len(AUTH_HEADER_PREFIX):] signing_key = self.jwks_client.get_signing_key_from_jwt(token) decode_token = jwt.decode( token, signing_key, options={"require": ["iat", "request_body_sha256"]}, algorithms=["RS256"], ) actual_body_sha256 = self._calculate_request_body_sha256(await request.json()) if actual_body_sha256 != decode_token["request_body_sha256"]: # Payload signature does not match the digest in signed token. raise ValueError("Invalid request body") if time.time() - decode_token["iat"] > 60 * 5: # Do not allow push-notifications older than 5 minutes. # This is to prevent replay attack. raise ValueError("Token is expired") return True ================================================ FILE: core/agents/__init__.py ================================================ # Agents module initialization ================================================ FILE: core/agents/base/base_agent.py ================================================ import json from typing import List, Dict, Any, Optional, Union, Callable, Sequence, TypeVar, cast from langchain_core.language_models.chat_models import BaseChatModel from langchain_core.language_models import LanguageModelLike from langchain_core.messages import BaseMessage, SystemMessage, HumanMessage, AIMessage, ToolMessage from langchain_core.tools import BaseTool from langchain_core.runnables import RunnableConfig from langgraph.graph import StateGraph from langgraph.types import Checkpointer from langgraph.graph.graph import CompiledGraph from langgraph.graph.state import CompiledStateGraph import logging try: import tiktoken TIKTOKEN_AVAILABLE = True except ImportError: TIKTOKEN_AVAILABLE = False print("Warning: Tiktoken not installed. 
Using naive token estimation.") logger = logging.getLogger(__name__) DEFAULT_MODEL_NAME = "gpt-4o-mini" StateSchema = TypeVar("StateSchema", bound=Union[dict, Any]) class BaseAgent: def __init__( self, name: str, model: Union[BaseChatModel, LanguageModelLike], tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[Union[str, SystemMessage, Callable]] = None, checkpointer: Optional[Checkpointer] = None, max_context_messages: Optional[int] = None, # Limit number of recent messages max_context_tokens: Optional[int] = None, # Limit total estimated tokens model_name: Optional[str] = "gpt-4o-mini", # Optional, used for future token estimation improvements description: str = "No description provided." ): if max_context_messages and max_context_tokens: raise ValueError("Only one of max_context_messages or max_context_tokens should be set.") if name is None or name == "LangGraph": raise ValueError("Agent name must be specified.") self.name = name self.model = model self.tools = tools or [] self.base_prompt = prompt self.checkpointer = checkpointer self.max_context_messages = max_context_messages self.max_context_tokens = max_context_tokens self.model_name = model_name or getattr(model, "model_name", DEFAULT_MODEL_NAME) self.description = description self._workflow: Optional[StateGraph] = None self._compiled_agent: Optional[CompiledGraph] = None # Stores the final compiled graph self._tokenizer = None if TIKTOKEN_AVAILABLE: try: self._tokenizer = tiktoken.encoding_for_model(self.model_name) except KeyError: try: self._tokenizer = tiktoken.get_encoding("cl100k_base") # print(f"Warning: Tiktoken encoding for model '{self.model_name}' not found. Using 'cl100k_base'.") except Exception as e: print(f"Error getting tiktoken encoding 'cl100k_base': {e}.") except Exception as e: print(f"Error initializing tiktoken for model '{self.model_name}': {e}.") def _estimate_tokens(self, message: BaseMessage) -> int: content_to_encode = "" if isinstance(message, (HumanMessage, SystemMessage, AIMessage)): if isinstance(message.content, str): content_to_encode = message.content elif isinstance(message.content, list): for block in message.content: if isinstance(block, dict) and block.get("type") == "text": content_to_encode += block.get("text", "") + "\n" elif isinstance(message, ToolMessage): content_to_encode = message.content if isinstance(message.content, str) else json.dumps(message.content) else: content_to_encode = str(message) if self._tokenizer: try: return len(self._tokenizer.encode(content_to_encode, disallowed_special=())) except Exception: pass return len(content_to_encode) // 2 def _truncate_by_tokens(self, messages: Sequence[BaseMessage]) -> List[BaseMessage]: if not self.max_context_tokens: return list(messages) truncated_messages: List[BaseMessage] = [] total_tokens = 0 preserved_system_message: Optional[SystemMessage] = None # Check if the first message is a SystemMessage, preserve it if so # Note: This assumes only ONE leading SystemMessage should be preserved. if messages and isinstance(messages[0], SystemMessage): preserved_system_message = messages[0] messages_to_truncate = messages[1:] try: system_tokens = self._estimate_tokens(preserved_system_message) # Only count if it doesn't exceed limit by itself if system_tokens <= self.max_context_tokens: total_tokens += system_tokens else: print(f"Warning: System message alone ({system_tokens} tokens) exceeds token limit ({self.max_context_tokens}). 
def _truncate_by_tokens(self, messages: Sequence[BaseMessage]) -> List[BaseMessage]: if not self.max_context_tokens: return list(messages) truncated_messages: List[BaseMessage] = [] total_tokens = 0 preserved_system_message: Optional[SystemMessage] = None # Check if the first message is a SystemMessage, preserve it if so # Note: This assumes only ONE leading SystemMessage should be preserved. if messages and isinstance(messages[0], SystemMessage): preserved_system_message = messages[0] messages_to_truncate = messages[1:] try: system_tokens = self._estimate_tokens(preserved_system_message) # Only count if it doesn't exceed limit by itself if system_tokens <= self.max_context_tokens: total_tokens += system_tokens else: print(f"Warning: System message alone ({system_tokens} tokens) exceeds token limit ({self.max_context_tokens}). It might be truncated if context grows.") # Don't add to total_tokens yet, let truncation logic handle it. preserved_system_message = None # Don't preserve if it's too big initially except Exception: pass # Ignore errors estimating system message else: messages_to_truncate = messages # Iterate backwards from the most recent message for msg in reversed(messages_to_truncate): try: msg_tokens = self._estimate_tokens(msg) # Check if adding this message exceeds the limit if total_tokens + msg_tokens <= self.max_context_tokens: truncated_messages.append(msg) total_tokens += msg_tokens else: print(f"Context Token Limit ({self.max_context_tokens}) reached. Truncating older messages.") break # Limit reached except Exception as e: print(f"Warning: Failed to estimate tokens for message, skipping: {e}") continue # Re-add the system message at the beginning if it was preserved final_list = list(reversed(truncated_messages)) if preserved_system_message: try: system_tokens = self._estimate_tokens(preserved_system_message) except Exception: system_tokens = 0 # Ensure adding system message doesn't push over limit *again* (edge case) if total_tokens - (msg_tokens if 'msg_tokens' in locals() and total_tokens + msg_tokens > self.max_context_tokens else 0) + system_tokens <= self.max_context_tokens: final_list.insert(0, preserved_system_message) elif not final_list: # If only system message fits return [preserved_system_message] # Else: System message doesn't fit with the truncated history, omit it. return final_list
def _truncate_messages(self, messages: Sequence[BaseMessage]) -> List[BaseMessage]: """Truncate the message history according to configuration (token budget first, then message count).""" if self.max_context_tokens is not None: return self._truncate_by_tokens(messages) elif self.max_context_messages is not None: if messages and isinstance(messages[0], SystemMessage): # Keep system message + last N-1 messages keep_count = self.max_context_messages - 1 return [messages[0]] + list(messages[-keep_count:]) if keep_count > 0 and len(messages) > 1 else [messages[0]] else: return list(messages[-self.max_context_messages:]) return list(messages)
def _get_state_value(self, state: StateSchema, key: str, default: Any = None) -> Any: return state.get(key, default) if isinstance(state, dict) else getattr(state, key, default)
def _format_tools_for_prompt(self, tools: List[Union[BaseTool, Callable]]) -> str: """Formats the tool list for inclusion in the prompt.""" if not tools: return "No tools available for use." # use getattr to access name and description safely return "\n".join([ f"- **{getattr(t, 'name', 'Unnamed Tool')}**: {getattr(t, 'description', 'No description available.')}" for t in tools ])
# --- build/compile/get_agent ---
def build(self) -> Optional[StateGraph]: """Build the agent's LangGraph workflow definition. Subclasses should implement this.""" raise NotImplementedError("Subclasses must implement build() or override compile() directly.")
) print(f"Compiling graph for agent: {self.name}") try: # 编译 StateGraph 并存储结果 self._compiled_agent = workflow.compile( checkpointer=self.checkpointer, debug=getattr(self, 'debug', False) # 传递 debug 标志 ) print(f"Graph compiled successfully for agent: {self.name}") return self._compiled_agent except Exception as e: print(f"!!! Error compiling graph for agent {self.name}: {e}") import traceback traceback.print_exc() raise e def get_agent(self) -> CompiledGraph: """获取编译后的核心图实例,如果未编译则先编译。""" if self._compiled_agent is None: print(f"Agent '{self.name}' not compiled yet. Compiling now.") self.compile() if self._compiled_agent is None: raise RuntimeError(f"Failed to get compiled agent for '{self.name}'.") return self._compiled_agent # --- invoke/ainvoke: 标准入口点,调用编译后的图 --- def invoke(self, state: Dict[str, Any], config: Optional[RunnableConfig] = None) -> Dict[str, Any]: """同步调用编译后的 Agent 图。""" try: compiled_agent = self.get_agent() # 获取 (或编译) 图 print(f"--- Invoking Agent: {self.name} ---") # 直接调用编译后的图,预处理由图内部的 prompt callable 处理 (如果使用 ReactAgent) # 或由 Supervisor 节点逻辑处理 (如果使用自定义 Supervisor) result = compiled_agent.invoke(state, config=config) print(f"--- Agent Invocation Complete: {self.name} ---") return cast(Dict[str, Any], result) # 假设返回字典 except Exception as e: print(f"!!! Error during {self.name} agent invocation: {e}") import traceback traceback.print_exc() # 返回带错误标记的状态 (可能是输入状态) state["error"] = f"Agent invocation failed: {e}" return state async def ainvoke(self, state: Dict[str, Any], config: Optional[RunnableConfig] = None) -> Dict[str, Any]: """异步调用编译后的 Agent 图。""" try: compiled_agent = self.get_agent() # 获取 (或编译) 图 print(f"--- Invoking Agent Async: {self.name} ---") # 直接调用编译后的图 result = await compiled_agent.ainvoke(state, config=config) print(f"--- Agent Invocation Complete Async: {self.name} ---") return cast(Dict[str, Any], result) # 假设返回字典 except Exception as e: print(f"!!! Error during {self.name} agent async invocation: {e}") import traceback traceback.print_exc() state["error"] = f"Agent async invocation failed: {e}" return state def run(self, state: Dict[str, Any]) -> Dict[str, Any]: """Run the supervisor workflow synchronously. Args: state: The input state for the workflow Returns: The output state from the workflow """ return self.invoke(state) async def arun(self, state: Dict[str, Any]) -> Dict[str, Any]: """Run the supervisor workflow asynchronously. Args: state: The input state for the workflow Returns: The output state from the workflow """ return await self.ainvoke(state) def reset(self): """重置编译状态,强制下次重新编译。""" print(f"Resetting compiled graph for agent '{self.name}'. Will recompile on next use.") self._compiled_agent = None self._workflow = None def add_tools(self, tools: List[Union[BaseTool, Callable]]) -> None: """添加工具到 Agent 的工具列表。""" print(f"Warning: Adding tools to {self.name} post-initialization. 
Agent needs recompilation.") self.tools.extend(tools) self.reset() ================================================ FILE: core/agents/base/create_react_agent_wrapper.py ================================================ import logging from typing import Optional, Callable, Dict from langgraph.utils.runnable import RunnableCallable from langchain_core.runnables.config import RunnableConfig logger = logging.getLogger(__name__) class CreateReactAgentWrapper(RunnableCallable): def __init__( self, agent, name: str = "agent", before_invoke: Optional[Callable[[dict], dict]] = None, before_ainvoke: Optional[Callable[[dict], dict]] = None, after_invoke: Optional[Callable[[dict, dict], None]] = None, after_ainvoke: Optional[Callable[[dict, dict], None]] = None ): """ :param agent: The underlying compiled graph or runnable :param name: Unique name for this wrapper (avoid duplicates) :param before_invoke: A sync callback that modifies the state before the wrapped agent call :param before_ainvoke: An async callback that modifies the state before the wrapped agent call :param after_invoke: A sync callback that inspects (state, output) after the wrapped call :param after_ainvoke: An async callback that inspects (state, output) after the wrapped call """ self._agent = agent self.name = name or getattr(agent, "name", "agent") self.before_invoke = before_invoke self.after_invoke = after_invoke self.before_ainvoke = before_ainvoke self.after_ainvoke = after_ainvoke # We define the sync/async "call" functions for RunnableCallable def call(state: Dict, config: Optional[RunnableConfig] = None, **kwargs) -> Dict: logger.info(f"[{self.name}] (sync) call() - started. State keys: {list(state.keys())}") # Or use print if you prefer # print(f"🟢 [Sync] Invoking wrapper: {self.name}, state keys: {list(state.keys())}") # before_invoke callback if self.before_invoke: state = self.before_invoke(state) # Call the underlying agent output = self._agent.invoke(state, config, **kwargs) # after_invoke callback if self.after_invoke: self.after_invoke(state, output) logger.info(f"[{self.name}] (sync) call() - finished. Output keys: {list(output.keys())}") return output async def acall(state: Dict, config: Optional[RunnableConfig] = None, **kwargs) -> Dict: logger.info(f"[{self.name}] (async) acall() - started. State keys: {list(state.keys())}") # print(f"🟢 [Async] Invoking wrapper: {self.name}, state keys: {list(state.keys())}") if self.before_ainvoke: state = await self.before_ainvoke(state) output = await self._agent.ainvoke(state, config, **kwargs) if self.after_ainvoke: await self.after_ainvoke(state, output) logger.info(f"[{self.name}] (async) acall() - finished. 
================================================ FILE: core/agents/base/react_agent.py ================================================
from typing import Any, Callable, Dict, List, Optional, Type, Union, Literal, Sequence from langchain_core.language_models import LanguageModelLike, LanguageModelInput from langchain_core.tools import BaseTool from langgraph.graph import StateGraph from langgraph.graph.graph import CompiledGraph from langgraph.types import Checkpointer from langgraph.store.base import BaseStore from langchain_core.messages import BaseMessage, SystemMessage # import SystemMessage from langgraph.prebuilt import create_react_agent from langgraph.prebuilt.chat_agent_executor import ( AgentState, StateSchemaType, StructuredResponseSchema, ) from core.agents.base.base_agent import BaseAgent import logging logger = logging.getLogger(__name__)
class ReactAgent(BaseAgent):
"""ReAct Agent class for reasoning and acting with tools. This class provides a high-level interface for creating a ReAct agent workflow that can perform multi-step reasoning and tool calling. """
def __init__( self, model: LanguageModelLike, tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[str] = None, response_format: Optional[ Union[StructuredResponseSchema, tuple[str, StructuredResponseSchema]] ] = None, state_schema: StateSchemaType = AgentState, config_schema: Type[Any] = None, checkpointer: Optional[Checkpointer] = None, store: Optional[BaseStore] = None, interrupt_before: Optional[List[str]] = None, interrupt_after: Optional[List[str]] = None, debug: bool = False, version: Literal["v1", "v2"] = "v1", name: str = "react_agent", description: str = "ReAct agent for reasoning and acting with tools.", max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = None, model_name: Optional[str] = "gpt-4o-mini", ):
"""Initialize a ReAct agent. Args: model: Language model to use for the agent tools: Optional list of tools available to the agent prompt: Optional prompt to use for the agent response_format: Optional schema for structured output state_schema: State schema to use for the agent graph config_schema: Optional schema for configuration interrupt_before: Optional list of nodes to interrupt before execution interrupt_after: Optional list of nodes to interrupt after execution debug: Whether to enable debug mode version: Version of the ReAct agent ("v1" or "v2") name: Name of the agent max_context_messages: Optional limit on number of recent messages max_context_tokens: Optional limit on total estimated tokens model_name: Optional model name for token estimation """
# Call BaseAgent's __init__ to initialize parent class attributes
super().__init__( name=name, model=model, tools=tools or [], prompt=prompt, description=description, checkpointer=checkpointer, max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, model_name=model_name )
# Initialize ReactAgent specific attributes
self.response_format = response_format self.react_state_schema = state_schema self.react_config_schema = config_schema self.react_store = store self.react_interrupt_before = interrupt_before self.react_interrupt_after = interrupt_after self.react_debug = debug self.react_version = version
def _prepare_llm_input(self, state: Dict[str, Any]) -> LanguageModelInput: """Prepare the LLM input: truncate the message history and prepend the base system prompt (if any). Passed as the prompt callable to create_react_agent.""" # 1. read messages from state (BaseAgent helper) messages = self._get_state_value(state, "messages", []) # 2. truncate messages (BaseAgent helper); only the list sent to the LLM is truncated here -- the full history in the checkpointer is unaffected # (optional debug prints of the history before/after truncation omitted) truncated_messages = self._truncate_messages(messages) # 3. prepend the base system prompt (if any) final_messages: List[BaseMessage] = [] if self.base_prompt: if isinstance(self.base_prompt, str): final_messages.append(SystemMessage(content=self.base_prompt)) elif isinstance(self.base_prompt, SystemMessage): final_messages.append(self.base_prompt) # if self.base_prompt were some other Runnable or Callable it would need handling here, but create_react_agent prompts are normally str or SystemMessage final_messages.extend(truncated_messages) # return the final message list to the LLM return final_messages
Build returns None.") self._workflow = None return None def compile(self) -> CompiledGraph: """使用 create_react_agent 构建并编译核心 ReAct 工作流,存储在 _compiled_agent。""" if self._compiled_agent is not None: return self._compiled_agent print(f"[[DEBUG]] Compiling core ReAct agent for: {self.name} using create_react_agent") try: # 使用 create_react_agent 创建编译后的图 # 将 self._prepare_llm_input 作为 prompt callable 传入 compiled_agent = create_react_agent( model=self.model, tools=self.tools, prompt=self._prepare_llm_input, # <--- 关键改动:传入准备函数 state_schema=self.react_state_schema, config_schema=self.react_config_schema, checkpointer=self.checkpointer, store=self.react_store, interrupt_before=self.react_interrupt_before, interrupt_after=self.react_interrupt_after, debug=self.react_debug, version=self.react_version, name=self.name, ) # 存储编译好的图 self._compiled_agent = compiled_agent print(f"Core ReAct graph compiled successfully for agent: {self.name}") return self._compiled_agent except Exception as e: print(f"!!! Error compiling graph for agent {self.name} using create_react_agent: {e}") import traceback traceback.print_exc() self._compiled_agent = None raise e ================================================ FILE: core/agents/react_based_supervisor/__init__.py ================================================ # 从当前目录导入create_supervisor函数 from .supervisor import create_supervisor __all__ = ["create_supervisor"] ================================================ FILE: core/agents/react_based_supervisor/agent_name.py ================================================ import re from typing import Literal from langchain_core.language_models import LanguageModelLike from langchain_core.messages import AIMessage, BaseMessage from langchain_core.runnables import RunnableLambda NAME_PATTERN = re.compile(r"(.*?)", re.DOTALL) CONTENT_PATTERN = re.compile(r"(.*?)", re.DOTALL) AgentNameMode = Literal["inline"] def _is_content_blocks_content(content: list[dict] | str) -> bool: return ( isinstance(content, list) and len(content) > 0 and isinstance(content[0], dict) and "type" in content[0] ) def add_inline_agent_name(message: BaseMessage) -> BaseMessage: """Add name and content XML tags to the message content. Examples: >>> add_inline_agent_name(AIMessage(content="Hello", name="assistant")) AIMessage(content="assistantHello", name="assistant") >>> add_inline_agent_name(AIMessage(content=[{"type": "text", "text": "Hello"}], name="assistant")) AIMessage(content=[{"type": "text", "text": "assistantHello"}], name="assistant") """ if not isinstance(message, AIMessage) or not message.name: return message formatted_message = message.model_copy() if _is_content_blocks_content(formatted_message.content): text_blocks = [block for block in message.content if block["type"] == "text"] non_text_blocks = [block for block in message.content if block["type"] != "text"] content = text_blocks[0]["text"] if text_blocks else "" formatted_content = f"{message.name}{content}" formatted_message.content = non_text_blocks + [{"type": "text", "text": formatted_content}] else: formatted_message.content = ( f"{message.name}{formatted_message.content}" ) return formatted_message def remove_inline_agent_name(message: BaseMessage) -> BaseMessage: """Remove explicit name and content XML tags from the AI message content. 
================================================ FILE: core/agents/react_based_supervisor/agent_name.py ================================================
import re from typing import Literal from langchain_core.language_models import LanguageModelLike from langchain_core.messages import AIMessage, BaseMessage from langchain_core.runnables import RunnableLambda
NAME_PATTERN = re.compile(r"<name>(.*?)</name>", re.DOTALL) CONTENT_PATTERN = re.compile(r"<content>(.*?)</content>", re.DOTALL) AgentNameMode = Literal["inline"]
def _is_content_blocks_content(content: list[dict] | str) -> bool: return ( isinstance(content, list) and len(content) > 0 and isinstance(content[0], dict) and "type" in content[0] )
def add_inline_agent_name(message: BaseMessage) -> BaseMessage: """Add name and content XML tags to the message content. Examples: >>> add_inline_agent_name(AIMessage(content="Hello", name="assistant")) AIMessage(content="<name>assistant</name><content>Hello</content>", name="assistant") >>> add_inline_agent_name(AIMessage(content=[{"type": "text", "text": "Hello"}], name="assistant")) AIMessage(content=[{"type": "text", "text": "<name>assistant</name><content>Hello</content>"}], name="assistant") """ if not isinstance(message, AIMessage) or not message.name: return message formatted_message = message.model_copy() if _is_content_blocks_content(formatted_message.content): text_blocks = [block for block in message.content if block["type"] == "text"] non_text_blocks = [block for block in message.content if block["type"] != "text"] content = text_blocks[0]["text"] if text_blocks else "" formatted_content = f"<name>{message.name}</name><content>{content}</content>" formatted_message.content = non_text_blocks + [{"type": "text", "text": formatted_content}] else: formatted_message.content = ( f"<name>{message.name}</name><content>{formatted_message.content}</content>" ) return formatted_message
def remove_inline_agent_name(message: BaseMessage) -> BaseMessage: """Remove explicit name and content XML tags from the AI message content. Examples: >>> remove_inline_agent_name(AIMessage(content="<name>assistant</name><content>Hello</content>", name="assistant")) AIMessage(content="Hello", name="assistant") >>> remove_inline_agent_name(AIMessage(content=[{"type": "text", "text": "<name>assistant</name><content>Hello</content>"}], name="assistant")) AIMessage(content=[{"type": "text", "text": "Hello"}], name="assistant") """ if not isinstance(message, AIMessage) or not message.name: return message is_content_blocks_content = _is_content_blocks_content(message.content) if is_content_blocks_content: text_blocks = [block for block in message.content if block["type"] == "text"] if not text_blocks: return message non_text_blocks = [block for block in message.content if block["type"] != "text"] content = text_blocks[0]["text"] else: content = message.content name_match: re.Match | None = NAME_PATTERN.search(content) content_match: re.Match | None = CONTENT_PATTERN.search(content) if not name_match or not content_match: return message if name_match.group(1) != message.name: return message parsed_content = content_match.group(1) parsed_message = message.model_copy() if is_content_blocks_content: content_blocks = non_text_blocks if parsed_content: content_blocks.append({"type": "text", "text": parsed_content}) parsed_message.content = content_blocks else: parsed_message.content = parsed_content return parsed_message
def with_agent_name( model: LanguageModelLike, agent_name_mode: AgentNameMode, ) -> LanguageModelLike: """Attach formatted agent names to the messages passed to and from a language model. This is useful for making a message history with multiple agents more coherent. NOTE: agent name is consumed from the message.name field. If you're using an agent built with create_react_agent, name is automatically set. If you're building a custom agent, make sure to set the name on the AI message returned by the LLM. Args: model: Language model to add agent name formatting to. agent_name_mode: Use to specify how to expose the agent name to the LLM. - "inline": Add the agent name directly into the content field of the AI message using XML-style tags. Example: "How can I help you?" -> "<name>agent_name</name><content>How can I help you?</content>". """ if agent_name_mode == "inline": process_input_message = add_inline_agent_name process_output_message = remove_inline_agent_name else: raise ValueError( f"Invalid agent name mode: {agent_name_mode}. Needs to be one of: {AgentNameMode.__args__}" ) def process_input_messages(messages: list[BaseMessage]) -> list[BaseMessage]: return [process_input_message(message) for message in messages] model = ( process_input_messages | model | RunnableLambda(process_output_message, name="process_output_message") ) return model
================================================ FILE: core/agents/react_based_supervisor/handoff.py ================================================
import re import uuid from langchain_core.messages import AIMessage, ToolCall, ToolMessage from langchain_core.tools import BaseTool, InjectedToolCallId, tool from langgraph.prebuilt import InjectedState from langgraph.types import Command from typing_extensions import Annotated
WHITESPACE_RE = re.compile(r"\s+")
def _normalize_agent_name(agent_name: str) -> str: """Normalize an agent name to be used inside the tool name.""" return WHITESPACE_RE.sub("_", agent_name.strip()).lower()
def create_handoff_tool(*, agent_name: str) -> BaseTool: """Create a tool that can hand off control to the requested agent. Args: agent_name: The name of the agent to hand control to, i.e. the name of the agent node in the multi-agent graph. Agent names should be simple, clear and unique, preferably in snake_case; the only hard limits are the node names accepted by LangGraph and the tool names accepted by LLM providers (the tool name will look like this: `transfer_to_<agent_name>`). """ tool_name = f"transfer_to_{_normalize_agent_name(agent_name)}" @tool(tool_name) def handoff_to_agent( state: Annotated[dict, InjectedState], tool_call_id: Annotated[str, InjectedToolCallId], ): """Ask another agent for help.""" tool_message = ToolMessage( content=f"Successfully transferred to {agent_name}", name=tool_name, tool_call_id=tool_call_id, ) return Command( goto=agent_name, graph=Command.PARENT, update={"messages": state["messages"] + [tool_message]}, ) return handoff_to_agent
def create_handoff_back_messages( agent_name: str, supervisor_name: str ) -> tuple[AIMessage, ToolMessage]: """Create a pair of (AIMessage, ToolMessage) to add to the message history when returning control to the supervisor.""" tool_call_id = str(uuid.uuid4()) tool_name = f"transfer_back_to_{_normalize_agent_name(supervisor_name)}" tool_calls = [ToolCall(name=tool_name, args={}, id=tool_call_id)] return ( AIMessage( content=f"Transferring back to {supervisor_name}", tool_calls=tool_calls, name=agent_name, ), ToolMessage( content=f"Successfully transferred back to {supervisor_name}", name=tool_name, tool_call_id=tool_call_id, ), )
================================================ FILE: core/agents/react_based_supervisor/planning_handler.py ================================================
import uuid import datetime from typing import List, Dict, Optional
class PlanningStateHandler:
""" Manages a project plan. A plan is a dict with: - title (str) - description (str) - status (str): "planning", "in_progress", or "completed" - tasks (list): each task is a dict with: id, description, status, agent, notes, evaluation - current_task_id (str or None) - created_at (str) - updated_at (str) """
@staticmethod def _now() -> str: return datetime.datetime.now().isoformat()
@staticmethod def _gen_id() -> str: return str(uuid.uuid4())
@staticmethod def create_plan(title: str, description: str) -> Dict: now = PlanningStateHandler._now() return { "title": title, "description": description, "status": "planning", # initial status "tasks": [], "current_task_id": None, "created_at": now, "updated_at": now }
@staticmethod def create_task(description: str, status: str = "pending", agent: str = "", notes: str = "", evaluation: str = "") -> Dict: return { "id": PlanningStateHandler._gen_id(), "description": description.strip(), "status": status.strip() if status else "pending", "agent": agent.strip(), "notes": notes.strip(), "evaluation": evaluation.strip() }
@staticmethod def add_tasks(plan: Dict, tasks_data: List[Dict]) -> Dict: for tinfo in tasks_data: desc = tinfo.get("description", "Untitled Task") status = tinfo.get("status", "pending") agent = tinfo.get("agent", "") notes = tinfo.get("notes", "") eval_ = tinfo.get("evaluation", "") task = PlanningStateHandler.create_task(desc, status, agent, notes, eval_) plan["tasks"].append(task) plan["updated_at"] = PlanningStateHandler._now() return plan
""" if not by_id: raise ValueError("Must provide 'by_id' to update a task.") task = next((t for t in plan["tasks"] if t["id"] == by_id), None) if not task: raise ValueError("No matching task found with the given ID.") if new_desc is not None: task["description"] = new_desc.strip() if new_status is not None: task["status"] = new_status.strip() if new_agent is not None: task["agent"] = new_agent.strip() if new_notes is not None: task["notes"] = new_notes.strip() if new_evaluation is not None: task["evaluation"] = new_evaluation.strip() plan["updated_at"] = PlanningStateHandler._now() # Determine overall plan status if any(t["status"] == "in_progress" for t in plan["tasks"]): plan["status"] = "in_progress" if all(t["status"] == "completed" for t in plan["tasks"]) and plan["tasks"]: plan["status"] = "completed" return plan @staticmethod def set_current_task(plan: Dict, task_id: str) -> Dict: found = any(t["id"] == task_id for t in plan["tasks"]) if not found: raise ValueError("Task ID not found in plan.") plan["current_task_id"] = task_id plan["updated_at"] = PlanningStateHandler._now() return plan @staticmethod def finish_plan(plan: Dict) -> Dict: """ Forcefully mark the plan as completed. """ plan["status"] = "completed" plan["updated_at"] = PlanningStateHandler._now() return plan ================================================ FILE: core/agents/react_based_supervisor/simple_planning_tool.py ================================================ import json from typing import Dict, List, Optional from langchain_core.tools import BaseTool from core.agents.supervisor.planning_handler import PlanningStateHandler class SimplePlanningTool(BaseTool): """ A tool that manages a single project plan in memory. It supports creating, viewing, adding tasks, updating tasks, setting the current task, and finishing the plan. All operations return a JSON string. """ name: str = "planning" description: str = ("Manage a project plan with actions to create, view, add tasks, update tasks, " "set current task, and finish the plan. 
All data is stored in JSON.") def __init__(self): super().__init__() self._plan: Optional[Dict] = None def _run(self, action: str, **kwargs) -> str: try: if action == "create_plan": return self._handle_create_plan(**kwargs) elif action == "view_plan": return self._handle_view_plan() elif action == "add_tasks": return self._handle_add_tasks(**kwargs) elif action == "update_task": return self._handle_update_task(**kwargs) elif action == "set_current_task": return self._handle_set_current_task(**kwargs) elif action == "finish_plan": return self._handle_finish_plan() else: return self._json_error(f"Unknown action: {action}") except Exception as e: return self._json_error(str(e)) async def _arun(self, action: str, **kwargs) -> str: return self._run(action, **kwargs) def _handle_create_plan(self, **kwargs) -> str: title = kwargs.get("title", "Untitled Plan") description = kwargs.get("description", "") tasks_data = kwargs.get("tasks", []) new_plan = PlanningStateHandler.create_plan(title, description) PlanningStateHandler.add_tasks(new_plan, tasks_data) self._plan = new_plan return self._json_ok(self._plan) def _handle_view_plan(self) -> str: if not self._plan: self._plan = PlanningStateHandler.create_plan("Untitled", "") return self._json_ok(self._plan) def _handle_add_tasks(self, **kwargs) -> str: if not self._plan: self._plan = PlanningStateHandler.create_plan("Untitled", "") tasks_data = kwargs.get("tasks", []) PlanningStateHandler.add_tasks(self._plan, tasks_data) return self._json_ok(self._plan) def _handle_update_task(self, **kwargs) -> str: if not self._plan: raise ValueError("No plan exists. Please create a plan first.") # Use 'by_id' instead of 'task_id' by_id = kwargs.get("by_id") new_desc = kwargs.get("description") new_status = kwargs.get("status") new_agent = kwargs.get("agent") new_notes = kwargs.get("notes") new_evaluation = kwargs.get("evaluation") updated = PlanningStateHandler.update_task( self._plan, by_id=by_id, new_desc=new_desc, new_status=new_status, new_agent=new_agent, new_notes=new_notes, new_evaluation=new_evaluation ) self._plan = updated return self._json_ok(self._plan) def _handle_set_current_task(self, **kwargs) -> str: if not self._plan: raise ValueError("No plan available to set current task.") tid = kwargs.get("task_id") if not tid: raise ValueError("Must provide 'task_id' for set_current_task.") PlanningStateHandler.set_current_task(self._plan, tid) return self._json_ok(self._plan) def _handle_finish_plan(self) -> str: if not self._plan: raise ValueError("No plan exists to finish.") finished_plan = PlanningStateHandler.finish_plan(self._plan) self._plan = finished_plan return self._json_ok(finished_plan) def _json_ok(self, plan_data: Dict) -> str: return json.dumps({"ok": True, "plan": plan_data}, ensure_ascii=False, indent=2) def _json_error(self, message: str) -> str: return json.dumps({"ok": False, "error": message}, ensure_ascii=False, indent=2) ================================================ FILE: core/agents/react_based_supervisor/state_schema.py ================================================ from typing import Dict, List, Optional, Any, Literal, TypedDict, Union from langchain_core.messages import BaseMessage from langgraph.prebuilt.chat_agent_executor import AgentState # 定义计划状态类型 PlanningStatus = Literal["not_started", "planning", "executing", "completed", "failed"] # 定义任务状态类型 TaskStatus = Literal["pending", "in_progress", "completed", "failed"] # 定义任务项 class Task(TypedDict, total=False): """任务项定义 表示计划中的一个任务项,包含任务描述、状态、分配的代理等信息 """ id: str # 任务唯一标识符 
description: str # 任务描述 status: TaskStatus # 任务状态 agent: Optional[str] # 分配的代理名称 created_at: str # 创建时间 updated_at: str # 更新时间 completed_at: Optional[str] # 完成时间 dependencies: Optional[List[str]] # 依赖的任务ID列表 notes: Optional[str] # 任务备注 # 定义计划 class Plan(TypedDict, total=False): """计划定义 表示一个完整的计划,包含计划状态、任务列表等信息 """ status: PlanningStatus # 计划状态 tasks: List[Task] # 任务列表 current_task_id: Optional[str] # 当前执行的任务ID created_at: str # 创建时间 updated_at: str # 更新时间 completed_at: Optional[str] # 完成时间 title: Optional[str] # 计划标题 description: Optional[str] # 计划描述 # 扩展AgentState以支持计划功能 class PlanningAgentState(AgentState): """支持计划功能的代理状态 扩展了AgentState,添加了plan字段用于存储计划信息 """ plan: Optional[Plan] = None ================================================ FILE: core/agents/react_based_supervisor/supervisor.py ================================================ import inspect from typing import Any, Callable, Literal, Optional, Type, Union, Dict, Optional from langchain_core.language_models import BaseChatModel, LanguageModelLike from langchain_core.tools import BaseTool from langgraph.graph import END, START, StateGraph from langgraph.prebuilt.chat_agent_executor import ( create_react_agent, AgentState, Prompt, StateSchemaType, StructuredResponseSchema, ) from langgraph.pregel import Pregel from langgraph.utils.runnable import RunnableCallable from core.agents.base.react_agent import ReactAgent from core.agents.supervisor.agent_name import AgentNameMode, with_agent_name from core.agents.supervisor.handoff import ( create_handoff_back_messages, create_handoff_tool, ) OutputMode = Literal["full_history", "last_message"] """Mode for adding agent outputs to the message history in the multi-agent workflow - `full_history`: add the entire agent message history - `last_message`: add only the last message """ MODELS_NO_PARALLEL_TOOL_CALLS = {"o3-mini"} def _supports_disable_parallel_tool_calls(model: LanguageModelLike) -> bool: if not isinstance(model, BaseChatModel): return False if hasattr(model, "model_name") and model.model_name in MODELS_NO_PARALLEL_TOOL_CALLS: return False if not hasattr(model, "bind_tools"): return False if "parallel_tool_calls" not in inspect.signature(model.bind_tools).parameters: return False return True def _make_call_agent( agent: Pregel, output_mode: OutputMode, add_handoff_back_messages: bool, supervisor_name: str, ) -> Callable[[dict], dict] | RunnableCallable: if output_mode not in OutputMode.__args__: raise ValueError( f"Invalid agent output mode: {output_mode}. Needs to be one of {OutputMode.__args__}" ) def _process_output(output: dict) -> dict: messages = output["messages"] if output_mode == "full_history": pass elif output_mode == "last_message": messages = messages[-1:] else: raise ValueError( f"Invalid agent output mode: {output_mode}. 
" f"Needs to be one of {OutputMode.__args__}" ) if add_handoff_back_messages: messages.extend(create_handoff_back_messages(agent.name, supervisor_name)) return { **output, "messages": messages, } def call_agent(state: dict) -> dict: #print(f"🟡 [Sync invoke] Handoff to agent '{agent.name}' with state keys: {list(state.keys())}") output = agent.invoke(state) #print(f"✅ [Sync invoke] Agent '{agent.name}' completed.") return _process_output(output) async def acall_agent(state: dict) -> dict: #print(f"🟡 [Async invoke] Handoff to agent '{agent.name}' with state keys: {list(state.keys())}") output = await agent.ainvoke(state) #print(f"✅ [Async invoke] Agent '{agent.name}' completed.") return _process_output(output) return RunnableCallable(call_agent, acall_agent) def create_supervisor( agents: list[Pregel], *, model: LanguageModelLike, tools: list[BaseTool | Callable] | None = None, prompt: Prompt | None = None, response_format: Optional[ Union[StructuredResponseSchema, tuple[str, StructuredResponseSchema]] ] = None, state_schema: StateSchemaType = AgentState, config_schema: Type[Any] | None = None, output_mode: OutputMode = "last_message", add_handoff_back_messages: bool = True, supervisor_name: str = "supervisor", include_agent_name: AgentNameMode | None = None, ) -> StateGraph: """Create a multi-agent supervisor. Args: agents: List of agents to manage model: Language model to use for the supervisor tools: Tools to use for the supervisor prompt: Optional prompt to use for the supervisor. Can be one of: - str: This is converted to a SystemMessage and added to the beginning of the list of messages in state["messages"]. - SystemMessage: this is added to the beginning of the list of messages in state["messages"]. - Callable: This function should take in full graph state and the output is then passed to the language model. - Runnable: This runnable should take in full graph state and the output is then passed to the language model. response_format: An optional schema for the final supervisor output. If provided, output will be formatted to match the given schema and returned in the 'structured_response' state key. If not provided, `structured_response` will not be present in the output state. Can be passed in as: - an OpenAI function/tool schema, - a JSON Schema, - a TypedDict class, - or a Pydantic class. - a tuple (prompt, schema), where schema is one of the above. The prompt will be used together with the model that is being used to generate the structured response. !!! Important `response_format` requires the model to support `.with_structured_output` !!! Note `response_format` requires `structured_response` key in your state schema. You can use the prebuilt `langgraph.prebuilt.chat_agent_executor.AgentStateWithStructuredResponse`. state_schema: State schema to use for the supervisor graph. config_schema: An optional schema for configuration. Use this to expose configurable parameters via supervisor.config_specs. output_mode: Mode for adding managed agents' outputs to the message history in the multi-agent workflow. Can be one of: - `full_history`: add the entire agent message history - `last_message`: add only the last message (default) add_handoff_back_messages: Whether to add a pair of (AIMessage, ToolMessage) to the message history when returning control to the supervisor to indicate that a handoff has occurred. supervisor_name: Name of the supervisor node. include_agent_name: Use to specify how to expose the agent name to the underlying supervisor LLM. 
            - None: Relies on the LLM provider using the name attribute on the AI message.
              Currently, only OpenAI supports this.
            - "inline": Add the agent name directly into the content field of the AI message
              using XML-style tags.
              Example: "How can I help you" -> "<name>agent_name</name><content>How can I help you?</content>"
    """
    agent_names = set()
    for agent in agents:
        if agent.name is None or agent.name == "LangGraph":
            raise ValueError(
                "Please specify a name when you create your agent, either via `create_react_agent(..., name=agent_name)` "
                "or via `graph.compile(name=name)`."
            )
        if agent.name in agent_names:
            raise ValueError(
                f"Agent with name '{agent.name}' already exists. Agent names must be unique."
            )
        agent_names.add(agent.name)

    handoff_tools = [create_handoff_tool(agent_name=agent.name) for agent in agents]
    all_tools = (tools or []) + handoff_tools
    if _supports_disable_parallel_tool_calls(model):
        model = model.bind_tools(all_tools, parallel_tool_calls=False)
    else:
        model = model.bind_tools(all_tools)
    if include_agent_name:
        model = with_agent_name(model, include_agent_name)

    supervisor = create_react_agent(
        name=supervisor_name,
        model=model,
        tools=all_tools,
        prompt=prompt,
        state_schema=state_schema,
        response_format=response_format,
        debug=False,
    )

    # Build the multi-agent supervisor graph using the langgraph StateGraph setup
    builder = StateGraph(state_schema, config_schema=config_schema)
    builder.add_node(supervisor, destinations=tuple(agent_names) + (END,))
    builder.add_edge(START, supervisor.name)
    for agent in agents:
        # If agent is a "ReactAgent" or similar
        if hasattr(agent, "get_agent") and callable(agent.get_agent):
            agent = agent.get_agent()  # retrieve the compiled subgraph
        builder.add_node(
            agent.name,
            _make_call_agent(
                agent,
                output_mode,
                add_handoff_back_messages,
                supervisor_name,
            ),
        )
        builder.add_edge(agent.name, supervisor.name)
    return builder

================================================
FILE: core/agents/react_supervisor_agent.py
================================================
from typing import Any, Callable, Dict, List, Optional, Union
import re
from langchain_core.language_models import LanguageModelLike
from langchain_core.tools import BaseTool
from langgraph.graph import StateGraph
from langgraph.graph.state import CompiledStateGraph
from langgraph.types import Checkpointer
from langgraph.prebuilt.chat_agent_executor import (
    AgentState,
    StateSchemaType,
)
from langgraph.utils.runnable import RunnableCallable
from core.agents.react_based_supervisor import create_supervisor
from core.agents.react_based_supervisor.simple_planning_tool import SimplePlanningTool
from core.agents.base.base_agent import BaseAgent
from core.agents.react_based_supervisor.state_schema import PlanningAgentState
import logging

logger = logging.getLogger(__name__)


class SupervisorAgent(BaseAgent):
    """Supervisor class for managing multiple agents with planning capabilities.

    This class provides a high-level interface for creating a supervisor workflow
    that can manage and coordinate multiple agents. It also includes planning
    capabilities to create and manage a plan for complex tasks using a
    state-driven approach. The planning functionality is implemented using
    PlanningStateHandler and PlanningTool, which provide a more structured and
    flexible way to manage tasks compared to the previous TodolistTool approach.
    """

    _PROMPT_TEMPLATE = """You are a Supervisor Agent. Your job is to analyze user requests and coordinate multiple agents to complete tasks.
## Task Approach Methodology ### Understanding Requirements - Analyzing user requests to identify core needs - Asking clarifying questions when requirements are ambiguous - Breaking down complex requests into manageable components - Identifying potential challenges before beginning work ### Coordination - Identifying appropriate agents for each task - Delegating tasks to specialized agents - Tracking progress and ensuring task completion - Synthesizing information from multiple agents Remember: Effective coordination is essential for successful task completion. Take time to understand the request and delegate appropriately. {tools} """ _PLANNING_PROMPT_TEMPLATE = """You are a Supervisor agent. Your role is to analyze user requests, break them down into actionable tasks, and coordinate specialized agents (e.g., research_expert, coder_expert, reporter_expert) to complete them. # Working with Complex Requests 1. FIRST, carefully analyze the user's request and break it down into clear, actionable tasks 2. Identify which agent is best suited for each part of the task 3. Use the handoff tools to delegate tasks to appropriate agents ONE AT A TIME 4. WAIT for each agent to COMPLETELY FINISH their assigned task before proceeding 5. Review the output from each agent before delegating the next task 6. Maintain a sequential workflow - never delegate multiple tasks simultaneously 7. Synthesize the results and provide a coherent response to the user 8. Provide a final summary when all tasks are done """ _PLANNING_TOOL_TEMPLATE = """ # Planning Tool Instructions You have access to a "planning" tool that uses JSON for all operations. Do NOT include any "state" field in your calls. Use the following actions exactly as defined: 1. "create_plan": Create a new plan. - Required fields: - title (string) - description (string) - tasks (list of task objects). Each task object must include: "description": string, "status": "pending" (all tasks must have "status": "pending" initially), "agent": string (empty if not assigned), "notes": string (empty if none), "evaluation": string (empty if none) - Example: { "action": "create_plan", "title": "Python Scraper for Tech News", "description": "Build a Python scraper to fetch the latest tech news and save it as CSV", "tasks": [ {"description": "Research Python scraping libraries", "status": "pending", "agent": "", "notes": "", "evaluation": ""}, {"description": "Implement the scraper", "status": "pending", "agent": "", "notes": "", "evaluation": ""}, {"description": "Test the code", "status": "pending", "agent": "", "notes": "", "evaluation": ""} ] } 2. "view_plan": Retrieve the current plan. - Example: { "action": "view_plan" } 3. "add_tasks": Add additional tasks to the plan. - Required: - tasks: list of task objects (same format as above) - Example: { "action": "add_tasks", "tasks": [ {"description": "Write documentation", "status": "pending", "agent": "", "notes": "", "evaluation": ""} ] } 4. "update_task": Update an existing task. - Identify the task by "by_id" (the task's unique ID from the plan). - You may update any of: "description", "status", "agent", "notes", "evaluation". - Example: { "action": "update_task", "by_id": "TASK-UUID", "status": "completed", "evaluation": "The scraper works perfectly." } 5. "set_current_task": Set the current task by its ID. - Example: { "action": "set_current_task", "task_id": "TASK-UUID" } 6. "finish_plan": Mark the entire plan as completed. 
- Example: { "action": "finish_plan" } Important: - Always produce valid JSON for your tool calls. - Continuously update and monitor the plan until every task's status is "completed" before delivering your final answer. - If the plan is not fully completed, do not stop; keep updating the plan with appropriate calls. """ def __init__( self, agents: List[BaseAgent], model: LanguageModelLike, tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[str] = None, state_schema: StateSchemaType = AgentState, supervisor_name: str = "supervisor", checkpointer: Optional[Checkpointer] = None, output_mode: str = "last_message", # * full_history or last_message * enable_planning: bool = True, # * True or False * ): """Initialize a supervisor. Args: agents: List of agents to manage model: Language model to use for the supervisor tools: Optional list of tools available to the supervisor prompt: Optional prompt to use for the supervisor state_schema: State schema to use for the supervisor graph supervisor_name: Name of the supervisor node checkpointer: Optional checkpointer to use for the supervisor output_mode: Mode for adding agent outputs to the message history ("full_history" or "last_message") enable_planning: Whether to enable planning capabilities auto_planning: Whether to automatically generate plans for complex tasks """ # 设置规划相关属性 self._enable_planning = enable_planning # 如果启用规划功能,设置状态模式为PlanningAgentState if self._enable_planning and state_schema == AgentState: state_schema = PlanningAgentState # Store agent-specific attributes before super().__init__ self.agents = agents self.output_mode = output_mode self.supervisor_name = supervisor_name self.state_schema = state_schema self.checkpointer = checkpointer self.tools = tools or [] self._workflow = None # 生成基础提示词 # _agents_prompt = self._generate_agents_prompt() _final_prompt = self._PLANNING_PROMPT_TEMPLATE + "/n/n" + self._PLANNING_TOOL_TEMPLATE if self._enable_planning else self._PROMPT_TEMPLATE if tools is None: tools = [] # 如果启用规划功能,添加规划提示模板并添加规划工具 if self._enable_planning: tools.append(SimplePlanningTool()) # 初始化BaseAgent父类 super().__init__( name=supervisor_name, model=model, tools=tools, checkpointer=checkpointer, prompt=_final_prompt, ) def build(self) -> StateGraph: """Build the supervisor workflow. 
Returns: The built StateGraph """ if self._workflow is not None: return self._workflow self._workflow = create_supervisor( agents=self.agents, model=self.model, tools=self.tools, prompt=self.base_prompt, state_schema=self.state_schema, supervisor_name=self.supervisor_name, output_mode=self.output_mode, ) return self._workflow ================================================ FILE: core/agents/sb_supervisor_agent.py ================================================ # reason_graph/supervisor_agent.py from typing import Callable, List, Optional, Union, cast, Literal from langchain_core.language_models import LanguageModelLike from langchain_core.tools import BaseTool from langgraph.graph import StateGraph from langgraph.types import Checkpointer # 内部导入 from core.agents.base.base_agent import BaseAgent from core.agents.state_based_supervisor.state_schema import PlanningAgentState, StateSchemaType # 导入 PlanningAgentState # 导入重构后的 create_supervisor 函数 from core.agents.state_based_supervisor.supervisor_graph import create_supervisor from core.agents.state_based_supervisor.agent_name import AgentNameMode import logging logger = logging.getLogger(__name__) class SupervisorAgent(BaseAgent): """ Supervisor Agent 类 (最终版) 负责协调子 Agent 并管理规划 (使用状态驱动方法)。 invoke/ainvoke 继承自 BaseAgent,负责完整流程。 """ def __init__( self, agents: List[BaseAgent], # 子 Agent 实例列表 model: LanguageModelLike, # Supervisor 使用的 LLM tools: Optional[List[Union[BaseTool, Callable]]] = None, # Supervisor 特有工具 state_schema: StateSchemaType = PlanningAgentState, supervisor_name: str = "supervisor", checkpointer: Optional[Checkpointer] = None, output_mode: str = "last_message", # enable_planning: bool = True, # 不再需要,强制使用 Planning include_agent_name: Optional[str] = "inline", # BaseAgent 参数 max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = None, model_name: Optional[str] = None, ): """初始化 Supervisor Agent""" if state_schema != PlanningAgentState: print("Warning: SupervisorAgent forces state_schema to PlanningAgentState.") state_schema = PlanningAgentState self.sub_agents = agents self.output_mode = output_mode self.include_agent_name = cast(Optional[AgentNameMode], include_agent_name) # 初始化 BaseAgent 父类 super().__init__( name=supervisor_name, model=model, tools=tools or [], checkpointer=checkpointer, prompt=None, # 核心 Prompt 在 supervisor_node_logic 中处理 max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, model_name=model_name, ) # _workflow_definition 和 _executable_agent 由 BaseAgent 管理 def build(self) -> Optional[StateGraph]: """构建 Supervisor 的 LangGraph 工作流图定义。""" # 调用重构后的 create_supervisor 函数来获取 StateGraph 定义 # 这个 StateGraph 包含了手写的 supervisor_node_logic if self._workflow: return self._workflow print(f"Building supervisor graph definition for '{self.name}'...") try: graph_definition = create_supervisor( model=self.model, sub_agents=self.sub_agents, state_schema=PlanningAgentState, # 强制使用 tools=self.tools, output_mode=cast(Literal["full_history", "last_message"], self.output_mode), supervisor_name=self.name, include_agent_name=self.include_agent_name, ) self._workflow = graph_definition # 存储图定义 print(f"Supervisor graph definition built for '{self.name}'.") return self._workflow except Exception as e: print(f"!!! 
Error building supervisor graph definition '{self.name}': {e}")
            import traceback
            traceback.print_exc()
            self._workflow = None
            raise e

    # compile() is inherited from BaseAgent: it calls build() above to get the
    # StateGraph definition, compiles it, and creates the final
    # _executable_agent, including the preprocessing steps.
    # invoke, ainvoke, get_agent, and reset are inherited from BaseAgent.

================================================
FILE: core/agents/state_based_supervisor/__init__.py
================================================

================================================
FILE: core/agents/state_based_supervisor/agent_name.py
================================================
import re
from typing import Literal
from langchain_core.language_models import LanguageModelLike
from langchain_core.messages import AIMessage, BaseMessage
from langchain_core.runnables import RunnableLambda

NAME_PATTERN = re.compile(r"<name>(.*?)</name>", re.DOTALL)
CONTENT_PATTERN = re.compile(r"<content>(.*?)</content>", re.DOTALL)

AgentNameMode = Literal["inline"]


def _is_content_blocks_content(content: list[dict] | str) -> bool:
    return (
        isinstance(content, list)
        and len(content) > 0
        and isinstance(content[0], dict)
        and "type" in content[0]
    )


def add_inline_agent_name(message: BaseMessage) -> BaseMessage:
    """Add name and content XML tags to the message content.

    Examples:
        >>> add_inline_agent_name(AIMessage(content="Hello", name="assistant"))
        AIMessage(content="<name>assistant</name><content>Hello</content>", name="assistant")

        >>> add_inline_agent_name(AIMessage(content=[{"type": "text", "text": "Hello"}], name="assistant"))
        AIMessage(content=[{"type": "text", "text": "<name>assistant</name><content>Hello</content>"}], name="assistant")
    """
    if not isinstance(message, AIMessage) or not message.name:
        return message

    formatted_message = message.model_copy()
    if _is_content_blocks_content(formatted_message.content):
        text_blocks = [block for block in message.content if block["type"] == "text"]
        non_text_blocks = [block for block in message.content if block["type"] != "text"]
        content = text_blocks[0]["text"] if text_blocks else ""
        formatted_content = f"<name>{message.name}</name><content>{content}</content>"
        formatted_message.content = non_text_blocks + [{"type": "text", "text": formatted_content}]
    else:
        formatted_message.content = (
            f"<name>{message.name}</name><content>{formatted_message.content}</content>"
        )
    return formatted_message


def remove_inline_agent_name(message: BaseMessage) -> BaseMessage:
    """Remove explicit name and content XML tags from the AI message content.

    Examples:
        >>> remove_inline_agent_name(AIMessage(content="<name>assistant</name><content>Hello</content>", name="assistant"))
        AIMessage(content="Hello", name="assistant")

        >>> remove_inline_agent_name(AIMessage(content=[{"type": "text", "text": "<name>assistant</name><content>Hello</content>"}], name="assistant"))
        AIMessage(content=[{"type": "text", "text": "Hello"}], name="assistant")
    """
    if not isinstance(message, AIMessage) or not message.name:
        return message

    is_content_blocks_content = _is_content_blocks_content(message.content)
    if is_content_blocks_content:
        text_blocks = [block for block in message.content if block["type"] == "text"]
        if not text_blocks:
            return message
        non_text_blocks = [block for block in message.content if block["type"] != "text"]
        content = text_blocks[0]["text"]
    else:
        content = message.content

    name_match: re.Match | None = NAME_PATTERN.search(content)
    content_match: re.Match | None = CONTENT_PATTERN.search(content)
    if not name_match or not content_match:
        return message
    if name_match.group(1) != message.name:
        return message

    parsed_content = content_match.group(1)
    parsed_message = message.model_copy()
    if is_content_blocks_content:
        content_blocks = non_text_blocks
        if parsed_content:
            content_blocks.append({"type": "text", "text": parsed_content})
        parsed_message.content = content_blocks
    else:
        parsed_message.content = parsed_content
    return parsed_message


def with_agent_name(
    model: LanguageModelLike,
    agent_name_mode: AgentNameMode,
) -> LanguageModelLike:
    """Attach formatted agent names to the messages passed to and from a language model.

    This is useful for making a message history with multiple agents more coherent.

    NOTE: agent name is consumed from the message.name field.
        If you're using an agent built with create_react_agent, name is automatically set.
        If you're building a custom agent, make sure to set the name on the AI message
        returned by the LLM.

    Args:
        model: Language model to add agent name formatting to.
        agent_name_mode: Use to specify how to expose the agent name to the LLM.
            - "inline": Add the agent name directly into the content field of the AI message
              using XML-style tags.
              Example: "How can I help you" -> "<name>agent_name</name><content>How can I help you?</content>".
    """
    if agent_name_mode == "inline":
        process_input_message = add_inline_agent_name
        process_output_message = remove_inline_agent_name
    else:
        raise ValueError(
            f"Invalid agent name mode: {agent_name_mode}. 
Needs to be one of: {AgentNameMode.__args__}" ) def process_input_messages(messages: list[BaseMessage]) -> list[BaseMessage]: return [process_input_message(message) for message in messages] model = ( process_input_messages | model | RunnableLambda(process_output_message, name="process_output_message") ) return model ================================================ FILE: core/agents/state_based_supervisor/evaluate_result_node.py ================================================ # reason_graph/evaluate_result_node.py import json import time import copy import traceback import anyio from typing import Dict, Any, List, Optional, Union from langchain_core.messages import BaseMessage, AIMessage, ToolMessage from langchain_core.runnables import RunnableConfig # 内部导入 (确保路径正确) try: from .state_schema import PlanningAgentState, TaskStatus, Plan, Task from .planning_handler import PlanningStateHandler except ImportError as e: print(f"Error importing modules in evaluate_result_node.py: {e}") # Fallbacks class PlanningAgentState(Dict): pass; class Plan(Dict): pass; class Task(Dict): pass TaskStatus = str class PlanningStateHandler: # Dummy @staticmethod def update_task(plan, by_id, **kwargs): return plan @staticmethod def set_current_task(plan, task_id): return plan @staticmethod def get_task(plan, task_id): return None @staticmethod def update_plan_status(plan): return plan async def evaluate_result_node_logic(state: PlanningAgentState, config: Optional[RunnableConfig] = None) -> Dict[str, Any]: """ 评估子 Agent 返回结果并更新计划状态的节点逻辑 (异步, 优化评估逻辑)。 """ print(f"--- Entering Evaluate Result Node ---") messages: List[BaseMessage] = state.get('messages', []) plan: Optional[Plan] = state.get('plan') last_message = messages[-1] if messages else None error_message: Optional[str] = None plan_updated: bool = False updated_plan: Optional[Plan] = copy.deepcopy(plan) if plan else None if not updated_plan: print("Evaluate Result Node: No plan found in state. Skipping.") return {} current_task_id = updated_plan.get("current_task_id") if not current_task_id: # Fallback logic for finding current task (不变) print("Warning: Evaluate Result Node - No current_task_id found in plan...") in_progress_tasks = [t for t in updated_plan.get('tasks', []) if t.get('status') == 'in_progress'] if len(in_progress_tasks) == 1: current_task_id = in_progress_tasks[0].get('id'); print(f" Fallback: Found task {current_task_id}") else: error_message = "Evaluation failed: Cannot determine finished task."; print(f"ERROR: {error_message}"); return {"plan": updated_plan, "error": error_message, "messages": []} agent_result_content: Optional[str] = None agent_name: Optional[str] = None if isinstance(last_message, AIMessage): agent_result_content = str(last_message.content) if last_message.content is not None else "" # Ensure string agent_name = last_message.name or "SubAgent" print(f" Evaluating result from: {agent_name} for task ID: {current_task_id}") else: agent_result_content = f"Error: Expected AIMessage result, got {type(last_message).__name__}." agent_name = "System/Error" print(f"Warning: Last message not AIMessage. Assuming task failed for {current_task_id}.") # --- 优化的评估逻辑 --- new_status: TaskStatus = "completed" # 默认成功 evaluation_notes = f"Result received from {agent_name}." # 1. 检查是否为空内容 (或只有空白符) if agent_result_content is None or not agent_result_content.strip(): new_status = "failed" evaluation_notes = f"Task failed: Agent {agent_name} returned empty content." print(f" Task {current_task_id} evaluated as FAILED (Empty Result).") # 2. 
检查是否以明确的错误标识开头 (需要工具配合) # 假设工具出错时会在返回字符串前加上 "Error: " 或 "Execution Failed: " elif agent_result_content.strip().startswith(("Error:", "Execution Failed:", "Tool Error:")): new_status = "failed" evaluation_notes = f"Task failed: Agent {agent_name} reported an error: {agent_result_content[:150]}..." print(f" Task {current_task_id} evaluated as FAILED (Explicit Error Signal).") # 3. (可选) 添加其他特定检查,例如检查是否只是"我不明白"之类的回复 elif len(agent_result_content) < 50 and any(kw in agent_result_content.lower() for kw in ["don't know", "cannot fulfill", "无法回答", "不明白"]): new_status = "failed" # 或 "pending_review" ? 暂时设为 failed evaluation_notes = f"Task likely failed: Agent {agent_name} indicated inability to fulfill request." print(f" Task {current_task_id} evaluated as FAILED (Agent Indicated Inability).") else: # 如果以上都不是,则认为是成功 new_status = "completed" print(f" Task {current_task_id} evaluated as COMPLETED.") # --- 评估逻辑结束 --- # --- 更新 Plan 状态 (逻辑不变) --- try: update_kwargs = { "new_status": new_status, "new_evaluation": evaluation_notes, "new_notes": agent_result_content[:1000] + "..." if agent_result_content and len(agent_result_content) > 1000 else agent_result_content } print(f" Updating task {current_task_id} with: {{'status': '{new_status}', ...}}") if updated_plan and PlanningStateHandler.get_task(updated_plan, current_task_id): updated_plan = PlanningStateHandler.update_task(updated_plan, by_id=current_task_id, **update_kwargs) updated_plan = PlanningStateHandler.set_current_task(updated_plan, None) updated_plan = PlanningStateHandler.update_plan_status(updated_plan) print(f" Plan status after evaluation update: {updated_plan.get('status')}") plan_updated = True else: raise ValueError(f"Task ID '{current_task_id}' not found or plan invalid before update.") except ValueError as ve: error_message = f"Error updating plan: {ve}"; print(f"ERROR: {error_message}"); traceback.print_exc() except Exception as e: error_message = f"Unexpected error updating plan: {e}"; print(f"ERROR: {error_message}"); traceback.print_exc() # --- 准备返回字典 (逻辑不变) --- updates: Dict[str, Any] = {} if updated_plan is not None: updates["plan"] = updated_plan elif plan is not None: updates["plan"] = plan # 记录本节点错误,或清除旧错误 current_state_error = state.get("error") if error_message: updates["error"] = error_message elif current_state_error: updates["error"] = None updates["messages"] = [] # Evaluator 不添加消息 print(f"--- Exiting Evaluate Result Node. 
Plan updated: {plan_updated} ---") return updates # --- 同步包装器 (保持不变) --- def evaluate_result_node_logic_sync(state: PlanningAgentState, config: Optional[RunnableConfig] = None) -> Dict[str, Any]: """evaluate_result_node_logic 的同步包装器""" print(f"--- Entering Evaluate Result Node (Sync Wrapper) ---") try: import anyio return anyio.run(evaluate_result_node_logic, state, config) # type: ignore except Exception as e: print(f"Error running evaluate_result_node_logic synchronously: {e}") traceback.print_exc() return {"error": f"Evaluate Result sync execution failed: {e}", "plan": state.get("plan"), "messages": []} ================================================ FILE: core/agents/state_based_supervisor/handoff.py ================================================ # reason_graph/handoff.py # (Paste the code user provided for handoff.py here) import re import uuid from typing import List, Tuple # Import Tuple from langchain_core.messages import AIMessage, ToolCall, ToolMessage, BaseMessage # Import BaseMessage from langchain_core.tools import BaseTool, InjectedToolCallId, tool from langgraph.prebuilt import InjectedState from langgraph.types import Command from typing_extensions import Annotated WHITESPACE_RE = re.compile(r"\s+") def _normalize_agent_name(agent_name: str) -> str: """Normalize an agent name to be used inside the tool name.""" if not agent_name: return "unknown_agent" return WHITESPACE_RE.sub("_", agent_name.strip()).lower() # Note: The original code uses @tool decorator which requires function arguments. # To inject state, the decorated function needs the Annotated state argument. # Let's define the function first and then apply the decorator, or use functools.partial. # Using the function approach first for clarity. def _handoff_to_agent_implementation( state: Annotated[dict, InjectedState], # Inject state here tool_call_id: Annotated[str, InjectedToolCallId], # Inject tool_call_id target_agent_name: str, # Pass the target agent name tool_name: str # Pass the specific tool name for the ToolMessage ) -> Command: """Ask another agent for help. This is the core logic.""" # Create the ToolMessage confirming the handoff BEFORE generating the Command """Handoff 核心逻辑,添加日志""" print(f"\n--- DEBUG: Entering _handoff_to_agent_implementation ---") print(f" - Target Agent: {target_agent_name}") print(f" - Tool Name: {tool_name}") print(f" - Tool Call ID: {tool_call_id}") # print(f" - Current State Keys: {list(state.keys())}") # 可选:打印状态键 tool_message = ToolMessage( content=f"Okay, handing off to {target_agent_name}. 
The current state and task context have been passed.", name=tool_name, tool_call_id=tool_call_id, ) print(f" - Created ToolMessage: ID={tool_message.tool_call_id}, Name={tool_message.name}") # The Command tells LangGraph to route to the target agent node # It also includes the ToolMessage in the state update for the next step command_obj = Command( goto=target_agent_name, # graph=Command.PARENT, # PARENT is default, usually not needed unless nested graphs update={"messages": [tool_message]}, # Return only the NEW message to be added ) print(f" - Created Command: goto='{command_obj.goto}', update contains {len(command_obj.update.get('messages',[]))} message(s)") print(f"--- DEBUG: Exiting _handoff_to_agent_implementation ---") return command_obj def create_handoff_tool(*, agent_name: str) -> BaseTool: """Create a tool that can handoff control to the requested agent.""" if not agent_name: raise ValueError("agent_name cannot be empty for create_handoff_tool") normalized_name = _normalize_agent_name(agent_name) tool_name = f"transfer_to_{normalized_name}" # Use functools.partial to fix the target_agent_name and tool_name arguments import functools specific_handoff_logic = functools.partial( _handoff_to_agent_implementation, target_agent_name=agent_name, tool_name=tool_name ) # Decorate the partial function # The arguments 'state' and 'tool_call_id' will be automatically injected by LangGraph # when the tool is called due to the Annotations used in _handoff_to_agent_implementation @tool(tool_name) def handoff_tool_wrapper( state: Annotated[dict, InjectedState], tool_call_id: Annotated[str, InjectedToolCallId] ) -> Command: """Dynamically generated tool description: Ask the '{agent_name}' agent for help with the current task or question.""" # --- 添加 Debug 日志 --- print(f"\n--- DEBUG: Handoff Tool '{tool_name}' (wrapper) CALLED ---") # --- return specific_handoff_logic(state=state, tool_call_id=tool_call_id) # type: ignore # Set a more descriptive description handoff_tool_wrapper.description = f"Use this tool to delegate the current task or ask a question to the '{agent_name}' agent. Pass the necessary context or instructions in your reasoning before calling this tool." return handoff_tool_wrapper def create_handoff_back_messages( agent_name: str, supervisor_name: str ) -> Tuple[AIMessage, ToolMessage]: """Create a pair of (AIMessage, ToolMessage) to add to the message history when returning control to the supervisor.""" tool_call_id = str(uuid.uuid4()) # Although no tool exists for transferring back, we simulate the pattern # The AIMessage signals intent, the ToolMessage confirms the transition occurred in the graph logic simulated_tool_name = f"transfer_back_to_{_normalize_agent_name(supervisor_name)}" # The AIMessage contains the *final output* of the sub-agent in its content field # It should also indicate the intent to hand back, though the graph logic forces this anyway. # The content here is just a placeholder - the actual content comes from the agent's final response. ai_message_content = f"Task completed. Transferring back to {supervisor_name}." # We still generate a ToolCall structure for consistency in the AIMessage, even if no real tool is called on supervisor side for hand-back. 
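    # For illustration, the pair assembled below looks roughly like this
    # (agent names and IDs hypothetical):
    #   AIMessage(name="research_expert",
    #             content="Task completed. Transferring back to supervisor.",
    #             tool_calls=[ToolCall(name="transfer_back_to_supervisor", args={}, id="<uuid>")])
    #   ToolMessage(name="transfer_back_to_supervisor", tool_call_id="<uuid>",
    #               content="Successfully transferred back to supervisor from research_expert.")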
tool_calls = [ToolCall(name=simulated_tool_name, args={}, id=tool_call_id)] # Create the AIMessage - crucial to include the sub-agent's name ai_message = AIMessage( content=ai_message_content, # Placeholder - see note below tool_calls=tool_calls, name=agent_name, # Identify which agent is responding ) # The ToolMessage confirms the transition happened from the graph's perspective tool_message = ToolMessage( content=f"Successfully transferred back to {supervisor_name} from {agent_name}.", name=simulated_tool_name, tool_call_id=tool_call_id, ) # IMPORTANT NOTE: The `_make_call_agent` helper function should populate the # `ai_message.content` with the *actual* final response message(s) from the sub-agent, # replacing the placeholder content above. It keeps the tool_calls structure. # The code provided for `_make_call_agent` seems to handle extracting `output['messages']`. # We need to ensure it correctly structures the AIMessage part of the tuple returned here. # Let's refine create_handoff_back_messages to just create the ToolMessage, # as the AIMessage content comes from the sub-agent's actual final output. # Refined approach: _make_call_agent gets the final AI response, we only need the ToolMessage here? # No, the pattern expects both. Let's assume _make_call_agent takes the *last* message from the # sub-agent's output and packages it into this AIMessage structure. return ai_message, tool_message # Return both for the standard pattern ================================================ FILE: core/agents/state_based_supervisor/planner_node.py ================================================ import re import json import time import copy import ast import traceback import anyio # <--- 导入 anyio from typing import Dict, Any, List, Optional, Union from datetime import datetime from langchain_core.messages import BaseMessage, AIMessage, SystemMessage, HumanMessage from langchain_core.runnables import RunnableConfig # 内部导入 try: from .state_schema import PlanningAgentState, Plan from .planning_handler import PlanningStateHandler from .prompt import PLANNER_SYSTEM_PROMPT_TEMPLATE except ImportError as e: print(f"Error importing modules in planner_node.py: {e}") class PlanningAgentState(Dict): pass; class Plan(Dict): pass; class PlanningStateHandler: pass PLANNER_SYSTEM_PROMPT_TEMPLATE = "Fallback Planner Prompt: Error loading template. Args: {agent_descriptions}" # --- Planner 节点核心逻辑 (异步) --- async def planner_node_logic( state: PlanningAgentState, config: Optional[RunnableConfig], model: Any, # Planner 使用的 LLM agent_description_map: Dict[str, str] # 需要 Agent 描述来分配任务 ) -> Dict[str, Any]: """Planner 节点逻辑:分析请求,生成初始计划""" print(f"--- Entering Planner Node ---") messages: List[BaseMessage] = state.get('messages', []) # Planner 通常在 plan 为空时运行 plan: Optional[Plan] = state.get('plan') if plan: print("Planner Node: Plan already exists. Skipping plan creation.") # 如果计划已存在,Planner 不应再执行,直接返回当前状态? # 或者返回一个空更新,让图流向 Supervisor? # 返回空更新更安全,让 Supervisor 继续 return {} # 返回空字典,状态不变 if not messages: print("Planner Node: No messages found to create a plan from.") return {"error": "Planner received no messages."} # --- 1. 准备 Planner Prompt --- # Planner 只需要 Agent 描述,不需要 plan_json 或 current_date? # 可以让它知道日期 desc_list = [f"- {name}: {desc}" for name, desc in agent_description_map.items()] agent_descriptions_str = "\n".join(desc_list) current_date_str = datetime.now().strftime("%a, %b %d, %Y") # Planner 也可能需要日期 system_prompt_text = "Error: Planner prompt template could not be loaded/formatted." 
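    # Format the planner template (loaded in the try block below) with the agent
    # descriptions and date assembled above; the template is expected to expose
    # {agent_descriptions} and {current_date} placeholders. On any failure,
    # system_prompt_text keeps the fallback error string.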
try: # 加载 Planner 的模板 from .prompt import PLANNER_SYSTEM_PROMPT_TEMPLATE system_prompt_text = PLANNER_SYSTEM_PROMPT_TEMPLATE.format( agent_descriptions=agent_descriptions_str, # 如果 Planner Prompt 需要日期: current_date=current_date_str ) except ImportError: print("ERROR: Could not import PLANNER_SYSTEM_PROMPT_TEMPLATE") except KeyError as e: print(f"ERROR: Missing key in planner prompt formatting: {e}") except Exception as e: print(f"ERROR: Unexpected error loading/formatting planner prompt: {e}") # Planner 的输入只需要 System Prompt 和用户的初始请求(通常是第一条) # 或者传递最后几条消息?为了简单,先只用第一条 HumanMessage initial_user_request = next((m for m in messages if isinstance(m, HumanMessage)), None) if not initial_user_request: print("Planner Node: No HumanMessage found in initial state.") return {"error": "Planner did not find initial user request."} llm_input_messages = [SystemMessage(content=system_prompt_text), initial_user_request] # --- 2. 调用 Planner LLM --- print("--- Calling Planner LLM ---") response: Optional[AIMessage] = None llm_error_msg: Optional[str] = None try: response = await model.ainvoke(llm_input_messages, config=config) if not isinstance(response, AIMessage): raise TypeError("Planner LLM returned non-AIMessage.") # Planner 的回复主要是指令,可以不设置 name print(f"Planner LLM Raw Response Content: {response.content[:300]}...") # Planner 不应该调用工具 if response.tool_calls: print("Warning: Planner LLM unexpectedly generated tool calls!") messages_to_add: List[BaseMessage] = [response] # 可以选择是否将 Planner 的思考过程加入 history except Exception as e: print(f"!!! Error invoking Planner LLM: {e}"); traceback.print_exc() llm_error_msg = f"Planner LLM invocation failed: {e}" messages_to_add = [] response = None # --- 3. 处理 Planner LLM 回复 (解析 CREATE_PLAN) --- new_plan: Optional[Plan] = None plan_updated: bool = False # 标记计划是否在本节点成功创建 directive_error_msg: Optional[str] = None if response and isinstance(response.content, str): try: plan_match = re.search(r"PLAN_UPDATE:\s*CREATE_PLAN\s*(\{.*?\})\s*$", response.content, re.IGNORECASE | re.DOTALL | re.MULTILINE) if plan_match: args_json_str = plan_match.group(1) print(f"Planner directive found: CREATE_PLAN with args: {args_json_str[:100]}...") try: args = json.loads(args_json_str) if not isinstance(args, dict): raise ValueError("Args JSON not a dict.") title=args.get("title", "Plan"); desc=args.get("description",""); tasks=args.get("tasks",[]) if isinstance(tasks, list) and all(isinstance(t, dict) and 'description' in t for t in tasks): for task_data in tasks: task_data['status'] = 'pending' # 强制状态 new_plan = PlanningStateHandler.create_plan(title, desc) new_plan = PlanningStateHandler.add_tasks(new_plan, tasks); plan_updated = True print("DEBUG: Plan successfully created by Planner node.") else: raise ValueError("Invalid 'tasks' format (must be list of dicts with 'description').") except (json.JSONDecodeError, ValueError, KeyError, TypeError) as e: err_msg = f"Error processing CREATE_PLAN directive: {type(e).__name__} - {e}" print(err_msg); traceback.print_exc(); directive_error_msg = err_msg except Exception as e: err_msg = f"Unexpected error processing CREATE_PLAN: {type(e).__name__} - {e}" print(err_msg); traceback.print_exc(); directive_error_msg = err_msg else: directive_error_msg = "Planner LLM did not output a valid PLAN_UPDATE: CREATE_PLAN directive." 
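            # For reference, a well-formed planner reply is expected to end with a
            # directive shaped like this (values hypothetical):
            #   PLAN_UPDATE: CREATE_PLAN {"title": "...", "description": "...",
            #     "tasks": [{"description": "...", "agent": "research_expert", "status": "pending"}]}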
print(f"Warning: {directive_error_msg}") # 即使没有指令,也可能需要返回 Planner 的回复消息 # 但如果没有 plan,流程可能无法继续,所以记录错误 except Exception as outer_e: directive_error_msg = f"Error searching for PLAN_UPDATE directive: {outer_e}" print(f"ERROR: {directive_error_msg}"); traceback.print_exc() # --- 4. 准备返回的状态更新 --- updates: Dict[str, Any] = {"messages": messages_to_add} # 添加 Planner 的回复消息 if plan_updated and new_plan: updates["plan"] = new_plan # 返回新创建的 Plan final_error = llm_error_msg or directive_error_msg if final_error: # 记录 Planner 步骤中遇到的第一个错误 updates["error"] = final_error print(f"--- Exiting Planner Node. Plan created: {plan_updated} ---") return updates # --- Planner 节点的同步包装器 (使用 anyio) --- def planner_node_logic_sync( state: PlanningAgentState, config: Optional[RunnableConfig], model: Any, agent_description_map: Dict[str, str] ) -> Dict[str, Any]: """planner_node_logic 的同步包装器""" print(f"--- Entering Planner Node (Sync Wrapper) ---") try: # 使用 anyio 在同步函数中运行异步函数 return anyio.run( # type: ignore planner_node_logic, state, config, model, agent_description_map ) except Exception as e: print(f"Error running planner_node_logic synchronously: {e}") traceback.print_exc() return {"error": f"Planner sync execution failed: {e}", "messages": state.get("messages",[])} ================================================ FILE: core/agents/state_based_supervisor/planning_handler.py ================================================ # reason_graph/planning_handler.py import uuid import datetime from typing import List, Dict, Optional, Any from .state_schema import TaskStatus, PlanningStatus, Task, Plan # 从 state_schema 导入类型 class PlanningStateHandler: """ 使用静态方法管理一个表示项目计划的字典。 计划现在存储在 LangGraph 的状态中,此类提供操作该字典的函数。 """ @staticmethod def _now() -> str: return datetime.datetime.now(datetime.timezone.utc).isoformat() @staticmethod def _gen_id() -> str: # 生成更易读的任务 ID (可选) # return f"task_{str(uuid.uuid4())[:8]}" return str(uuid.uuid4()) @staticmethod def create_plan(title: str, description: str) -> Plan: """创建一个新的 Plan 字典""" now = PlanningStateHandler._now() return Plan( title=title, description=description, status="planning", # 初始状态为规划中 tasks=[], current_task_id=None, created_at=now, updated_at=now, completed_at=None, ) @staticmethod def create_task(description: str, agent: Optional[str] = None, dependencies: Optional[List[str]] = None) -> Task: """创建一个新的 Task 字典""" now = PlanningStateHandler._now() return Task( id=PlanningStateHandler._gen_id(), description=description.strip(), status="pending", # 初始状态为待处理 agent=agent.strip() if agent else None, created_at=now, updated_at=now, completed_at=None, dependencies=dependencies or [], notes=None, evaluation=None, result=None, ) @staticmethod def add_tasks(plan: Plan, tasks_data: List[Dict[str, Any]]) -> Plan: """向 Plan 字典中添加任务""" if not isinstance(plan, dict) or "tasks" not in plan: raise ValueError("Invalid plan structure provided.") if not isinstance(tasks_data, list): raise ValueError("tasks_data must be a list of task dictionaries.") for tinfo in tasks_data: desc = tinfo.get("description") if not desc: continue # 跳过没有描述的任务 agent = tinfo.get("agent") deps = tinfo.get("dependencies") task = PlanningStateHandler.create_task(desc, agent, deps) plan["tasks"].append(task) # 如果添加任务时计划仍在 planning 阶段,可以转为 ready if plan.get("status") == "planning": plan["status"] = "ready" plan["updated_at"] = PlanningStateHandler._now() return plan @staticmethod def update_task(plan: Plan, by_id: Optional[str] = None, new_desc: Optional[str] = None, new_status: Optional[TaskStatus] = None, new_agent: 
Optional[str] = None, new_notes: Optional[str] = None, new_evaluation: Optional[str] = None, new_result: Optional[Any] = None) -> Plan: """更新 Plan 字典中指定 ID 的任务""" if not isinstance(plan, dict) or "tasks" not in plan: raise ValueError("Invalid plan structure provided.") if not by_id: raise ValueError("Must provide 'by_id' to update a task.") task = next((t for t in plan["tasks"] if t.get("id") == by_id), None) if not task: raise ValueError(f"No matching task found with ID: {by_id}") updated = False if new_desc is not None and task.get("description") != new_desc.strip(): task["description"] = new_desc.strip() updated = True if new_status is not None and task.get("status") != new_status.strip(): task["status"] = new_status.strip() if new_status.strip() == "completed": task["completed_at"] = PlanningStateHandler._now() updated = True if new_agent is not None and task.get("agent") != new_agent.strip(): task["agent"] = new_agent.strip() updated = True if new_notes is not None and task.get("notes") != new_notes.strip(): task["notes"] = new_notes.strip() updated = True if new_evaluation is not None and task.get("evaluation") != new_evaluation.strip(): task["evaluation"] = new_evaluation.strip() updated = True if new_result is not None: # 直接更新结果(谨慎使用,可能很大) task["result"] = new_result updated = True if updated: task["updated_at"] = PlanningStateHandler._now() plan["updated_at"] = PlanningStateHandler._now() # 更新整个计划的更新时间 # 检查并更新整个计划的状态 plan = PlanningStateHandler.update_plan_status(plan) return plan @staticmethod def update_plan_status(plan: Plan) -> Plan: """根据任务状态自动更新计划状态""" if not isinstance(plan, dict) or "tasks" not in plan: return plan # Return as is if invalid tasks = plan["tasks"] if not tasks: # 没有任务 if plan.get("status") not in ["completed", "failed", "error"]: plan["status"] = "ready" # 或 "completed" 如果没有任务就算完成? 
设为 ready 似乎更合理
            return plan

        all_completed = all(t.get("status") == "completed" for t in tasks)
        any_failed = any(t.get("status") == "failed" for t in tasks)
        any_in_progress = any(t.get("status") in ["in_progress", "pending_review"] for t in tasks)
        any_pending = any(t.get("status") == "pending" for t in tasks)

        current_status = plan.get("status")
        new_status = current_status
        if any_failed:
            new_status = "failed"  # or "error"
        elif all_completed:
            new_status = "completed"
            plan["completed_at"] = PlanningStateHandler._now()
        elif any_in_progress:
            new_status = "executing"
        elif any_pending or not any_in_progress:
            # still pending tasks, or everything finished but not completed/failed
            if current_status not in ["completed", "failed", "error"]:  # don't overwrite a terminal status
                new_status = "ready"  # ready to execute or waiting for new tasks

        if new_status != current_status:
            plan["status"] = new_status
            plan["updated_at"] = PlanningStateHandler._now()
        return plan

    @staticmethod
    def set_current_task(plan: Plan, task_id: Optional[str]) -> Plan:
        """Set the current task ID in the Plan dict."""
        if not isinstance(plan, dict):
            raise ValueError("Invalid plan structure provided.")
        if task_id is None:
            plan["current_task_id"] = None
            plan["updated_at"] = PlanningStateHandler._now()
            return plan
        found = any(t.get("id") == task_id for t in plan.get("tasks", []))
        if not found:
            raise ValueError(f"Task ID '{task_id}' not found in plan.")
        if plan.get("current_task_id") != task_id:
            plan["current_task_id"] = task_id
            plan["updated_at"] = PlanningStateHandler._now()
        return plan

    @staticmethod
    def get_task(plan: Plan, task_id: str) -> Optional[Task]:
        """Get a task dict by its ID."""
        if not isinstance(plan, dict) or "tasks" not in plan:
            return None
        return next((t for t in plan["tasks"] if t.get("id") == task_id), None)

    @staticmethod
    def get_next_pending_task(plan: Plan) -> Optional[Task]:
        """Get the next pending task whose dependencies are all completed."""
        if not isinstance(plan, dict) or "tasks" not in plan:
            return None
        completed_task_ids = {t["id"] for t in plan["tasks"] if t.get("status") == "completed"}
        for task in plan["tasks"]:
            if task.get("status") == "pending":
                dependencies = task.get("dependencies", [])
                if not dependencies or all(dep_id in completed_task_ids for dep_id in dependencies):
                    return task
        return None  # no suitable next task found

    @staticmethod
    def finish_plan(plan: Plan) -> Plan:
        """Force-mark the plan as completed."""
        if not isinstance(plan, dict):
            raise ValueError("Invalid plan structure provided.")
        if plan.get("status") != "completed":
            plan["status"] = "completed"
            plan["completed_at"] = PlanningStateHandler._now()
        plan["updated_at"] = PlanningStateHandler._now()
        return plan

================================================
FILE: core/agents/state_based_supervisor/prompt.py
================================================
# # --- Planner Agent System Prompt (earlier draft) ---
# PLANNER_SYSTEM_PROMPT_TEMPLATE = """You are an expert planning agent. Your sole responsibility is to analyze a user request and create a detailed, step-by-step plan to fulfill it by coordinating specialized agents.
# The current date is {current_date}.
# ## Agent Descriptions:
# {agent_descriptions}
# *(This list includes the capabilities of available specialist agents.)*
# ## Task:
# Analyze the user request provided in the message history. Break it down into a sequence of logical tasks. For each task, determine the most suitable agent from the descriptions provided.
# ## Output Format:
# You MUST output **ONLY** a single `PLAN_UPDATE: CREATE_PLAN <json_args>` directive in your response content. The JSON arguments MUST be valid and contain:
# - "title": A concise title for the overall plan.
# - "description": A brief description summarizing the user's goal.
# - "tasks": A list of task objects. Each task object MUST contain:
#   - "description": A clear and actionable description of the specific sub-task.
#   - "agent": The name of the MOST SUITABLE agent from the Agent Descriptions to perform this task. Leave empty ("") if unsure or if it's a general task.
#   - "status": Set **all** initial tasks to **"pending"**.
#   - (Optional) "dependencies": A list of task IDs (UUIDs that will be generated later) this task depends on, if any (usually empty for initial plan).
# **Example JSON Args:**
# `{{"title": "Research and Report on AI Ethics", "description": "User wants a report on AI ethics, including research and writing.", "tasks": [{{"description": "Research current trends in AI ethics using web search", "agent": "research_expert", "status": "pending"}}, {{"description": "Write a structured report summarizing the findings", "agent": "reporter_expert", "status": "pending", "dependencies": [""]}}]}}`
# *(Note: Actual IDs are UUIDs generated later, dependencies often added via UPDATE_TASK)*
# **CRITICAL**: Output **ONLY** the `PLAN_UPDATE: CREATE_PLAN <json_args>` directive and nothing else. Do not add conversational text. Make sure the JSON is valid.
# """

# SUPERVISOR_PLANNING_PROMPT_TEMPLATE = """You are a meticulous top-level Supervisor agent responsible for executing an existing plan, coordinating specialist agents, and managing task execution based on the provided state. You rely on an external evaluator node to assess task completion after agents run.
# The current date is {current_date}.
# ## Current Plan State:
# ```json
# {plan_json}
# ```
# *(Review plan status and individual task statuses and IDs (UUIDs). Your main goal is to drive the plan status to 'completed'.)*
# ## Agent Descriptions:
# {agent_descriptions}
# ## Your Goal:
# Execute the **existing plan** strictly step-by-step towards 'completed' status. Make **exactly one** logical primary decision per turn. **Do NOT evaluate agent results or mark tasks 'completed'/'failed' yourself.**
# ## Workflow & Decision Process (Strict Sequence):
# 1. **Analyze State**: Review the latest messages and the 'Current Plan State'. (Note: If the last message is from a sub-agent, an evaluator node has already processed it and updated the plan state before your turn).
# 2. **Determine ONE Next Action**: Execute the FIRST matching condition below and **IMMEDIATELY END YOUR TURN**:
#     * **A. Initiate Next Task**: If the plan is 'ready' or 'executing', AND no task is currently 'in_progress', AND a 'pending' task is ready (dependencies met):
#         * **Action**: Find the FIRST such task. Output **ONLY** `PLAN_UPDATE: UPDATE_TASK <json_args>`. **CRITICAL: Use the exact UUID for `by_id`!** JSON Args should be `{{"by_id": "<task_uuid>", "status": "in_progress"}}`.
#     * **B. Delegate In-Progress Task**: If a task **currently has status 'in_progress'** (check plan state):
#         * **Action**: Identify the best agent. Output **ONLY** the `transfer_to_<agent_name>` tool call. **CRITICAL**: Tool call args **MUST** include `"task_id": "<task_uuid>"` and clear `"instructions"`.
#     * **C. Finish Plan**: If **ALL** tasks in the plan now have status 'completed' AND the plan status is NOT 'completed' yet (check plan state provided):
#         * **Action**: Output **ONLY** `PLAN_UPDATE: FINISH_PLAN {{}}`.
#     * **D. Generate Final Output**: If the **Plan Status IS 'completed'** (check plan state provided):
#         * **Action**: Decide final output format based on original request. EITHER call `transfer_to_reporter_expert` (passing context in args, like relevant task IDs) OR generate the final `AIMessage` content yourself summarizing the overall result.
#     * **E. Waiting/Blocked/Failed**: If no other action is appropriate (e.g., plan status 'failed', or waiting for dependencies):
#         * **Action**: Output a brief waiting or status message explaining the situation.
# ## Output Constraints:
# - Your response MUST contain exactly ONE primary action (ONE PLAN_UPDATE directive OR ONE transfer_to tool call OR the final answer OR a status message).
# - `PLAN_UPDATE:` directives MUST be in the text content with **valid JSON arguments**.
# - **CRITICAL**: `UPDATE_TASK` **MUST** use the correct Task UUID string for `"by_id"`.
# ## Planning Directives Format (Mandatory - JSON Args in text):
# - `PLAN_UPDATE: ADD_TASKS {{"tasks": [...]}}` # You can still add tasks if needed mid-plan
# - `PLAN_UPDATE: UPDATE_TASK {{"by_id": "<task_uuid>", "status": "in_progress", "notes": ""}}` (**UUID!** Only use non-terminal statuses).
# - `PLAN_UPDATE: FINISH_PLAN {{}}`
# ## Tool Usage:
# - Only `transfer_to_<agent_name>` tools. Args **MUST** include `"task_id"` and `"instructions"`.
# Now, analyze the current state (which reflects any recent evaluations) and the LAST message, and determine the single next action based strictly on the workflow for **executing the existing plan**. Remember, you do **not** evaluate results or mark tasks complete/failed.
# """

# --- Planner Agent System Prompt ---
PLANNER_SYSTEM_PROMPT_TEMPLATE = """You are an expert planning agent. Your sole responsibility is to analyze a user request and create a detailed, step-by-step plan to fulfill it by coordinating specialized agents.
The current date is {current_date}.

## Agent Descriptions:
{agent_descriptions}
*(This list includes the capabilities of available specialist agents.)*

## Task:
Analyze the user request provided in the message history. Break it down into a sequence of logical tasks. For each task, determine the most suitable agent from the descriptions provided.

## Task Granularity Guidelines:
- **IMPORTANT**: Maintain appropriate task granularity based on complexity:
  - For simple requests, create just 1-2 tasks that can be completed by a single agent
  - For complex requests, break down into 3-5 logical steps
  - Avoid excessive fragmentation of simple tasks
  - Each task should represent a meaningful unit of work

## Output Format:
You MUST output **ONLY** a single `PLAN_UPDATE: CREATE_PLAN <json_args>` directive in your response content. The JSON arguments MUST be valid and contain:
- "title": A concise title for the overall plan.
- "description": A brief description summarizing the user's goal.
- "tasks": A list of task objects. Each task object MUST contain:
  - "description": A clear and actionable description of the specific sub-task.
  - "agent": The name of the MOST SUITABLE agent from the Agent Descriptions to perform this task. Leave empty ("") if unsure or if it's a general task.
  - "status": Set **all** initial tasks to **"pending"**.
  - (Optional) "dependencies": Usually empty for initial plan.

**Example JSON Args for SIMPLE request:**
`{{"title": "Answer Question About Python", "description": "User wants to know how to use list comprehensions in Python", "tasks": [{{"description": "Provide a comprehensive explanation of Python list comprehensions with examples", "agent": "coder_expert", "status": "pending"}}]}}`

**Example JSON Args for COMPLEX request:**
`{{"title": "Research and Report on AI Ethics", "description": "User wants a detailed report on AI ethics", "tasks": [{{"description": "Research current trends in AI ethics using web search", "agent": "research_expert", "status": "pending"}}, {{"description": "Write a structured report summarizing the findings", "agent": "reporter_expert", "status": "pending"}}]}}`

**CRITICAL**: Output **ONLY** the `PLAN_UPDATE: CREATE_PLAN <json_args>` directive and nothing else. Do not add conversational text. Make sure the JSON is valid.
"""

# --- Supervisor Planning Prompt (allows combined actions + enforces UUID/JSON) ---
SUPERVISOR_PLANNING_PROMPT_TEMPLATE = """You are a meticulous top-level Supervisor agent responsible for executing an existing plan, coordinating specialist agents, and managing task execution based on the provided state.
The current date is {current_date}.

## Current Plan State:
```json
{plan_json}
```
*(Review plan status and individual task statuses and IDs (UUIDs). Your main goal is to drive the plan status to 'completed'.)*

## Agent Descriptions:
{agent_descriptions}
*(This list includes specialist agents and yourself.)*

## Your Goal:
Execute the **existing plan** step-by-step towards 'completed' status by making logical decisions and issuing appropriate directives and tool calls.

## Workflow & Decision Guidelines:
1. **Analyze State**: Review the latest messages (especially agent results) and the 'Current Plan State'.
2. **Determine Next Action(s)**: Based on the analysis, decide the next logical step(s).
    * **If a sub-agent just returned results**:
        a. Evaluate the result against the task.
        b. Issue the `PLAN_UPDATE: UPDATE_TASK <json_args>`. **CRITICAL: Use the exact Task UUID for `by_id`!** Include `evaluation` and `notes`.
        c. **After** the update directive, **if** more tasks are pending and ready, you **CAN** identify the next task, issue `PLAN_UPDATE: UPDATE_TASK <json_args>` (using its UUID), **AND** issue the corresponding `transfer_to_<agent_name>` tool call **in the same response**.
    * **If no agent just returned, AND a 'pending' task is ready**:
        a. Identify the *next* suitable 'pending' task.
        b. Issue `PLAN_UPDATE: UPDATE_TASK <json_args>` (using its UUID).
        c. **Immediately following** the directive in the same response, issue the corresponding `transfer_to_<agent_name>` tool call with instructions (including Task UUID).
    * **If ALL tasks are 'completed' AND plan status is NOT 'completed' yet**:
        a. Issue `PLAN_UPDATE: FINISH_PLAN {{}}`.
        b. **In the same response**, decide the final output: EITHER call `transfer_to_reporter_expert` OR generate the final `AIMessage` content yourself.
    * **If Plan Status IS 'completed'**:
        a. Your job is done. Generate the final `AIMessage` content if you didn't call the reporter in the previous step.
    * **If Waiting/Blocked/Failed**: Output a status message explaining the situation.

## Output Constraints:
- Your response **CAN** contain **both** a `PLAN_UPDATE:` directive (in content) and a `transfer_to_<agent_name>` tool call if logically appropriate (e.g., completing one task and starting the next).
- Your response **CAN** contain **both** `PLAN_UPDATE: FINISH_PLAN` and the final action (call reporter or final answer).
- **NEVER** delegate to more than one agent simultaneously (only one `transfer_to_` tool call per response).
- `PLAN_UPDATE:` directives MUST be in the text content with **valid JSON arguments**.
- **CRITICAL**: `UPDATE_TASK` **MUST** use the correct Task UUID string for `"by_id"`.

## Planning Directives Format (Mandatory - JSON Args in text):
Use these exact formats **within your response content**. Arguments **MUST** be a valid JSON string.
- `PLAN_UPDATE: ADD_TASKS {{"tasks": [...]}}`
- `PLAN_UPDATE: UPDATE_TASK {{"by_id": "<task_uuid>", "status": "<new_status>", "evaluation": "<evaluation>", "notes": "<notes>"}}` (**UUID!**)
- `PLAN_UPDATE: FINISH_PLAN {{}}`
*(Note: CREATE_PLAN is handled by the Planner Agent)*

## Tool Usage:
- Only `transfer_to_<agent_name>` tools are callable by you. Args **MUST** include `"task_id"` and `"instructions"`.

Now, analyze the current state and messages, and determine the necessary action(s) for this turn.
"""

# **Key adjustments:**
# 1. **Combined actions allowed**: The Workflow and Output Constraints now explicitly allow the Supervisor to both
#    update the plan state (via a `PLAN_UPDATE:` directive) and delegate a task (via a `transfer_to_` tool call)
#    within one turn, or to finish the plan and produce the final output in the same response. This gives the LLM
#    more flexibility and may better match its "thinking habits".
# 2. **Core requirements kept**: `PLAN_UPDATE` arguments must still be valid JSON, and `UPDATE_TASK` **must** use
#    the correct Task UUID. Delegating to more than one agent at a time is still forbidden.
# 3. **Strict `STOP` instruction removed**: The LLM is no longer forced to end its turn immediately after emitting
#    a `PLAN_UPDATE` directive.
# **Expected effects:**
# * After processing a sub-agent's result and updating the task status, the Supervisor LLM can issue the
#   `transfer_to_` call for the next ready task in the same reply, saving one interaction round.
# * Once all tasks are done, it can emit `FINISH_PLAN` and decide the final output (call the Reporter or
#   summarize itself) in a single step.
# * **Potential risk**: this flexibility may make the LLM more error-prone in complex situations (e.g., delegating
#   without updating the status first, or combining actions incorrectly). Given that the strict step-by-step
#   version also ran into problems, this approach is worth trying.

================================================
FILE: core/agents/state_based_supervisor/state_schema.py
================================================
# reason_graph/state_schema.py
import operator
from typing import Dict, List, Optional, Any, Literal, TypedDict, Sequence, Annotated, Union

from langchain_core.messages import BaseMessage
from langgraph.graph.message import add_messages
from langgraph.managed import IsLastStep, RemainingSteps

# Plan-level status values
PlanningStatus = Literal["not_started", "planning", "ready", "executing", "completed", "failed", "error"]

# Task-level status values
TaskStatus = Literal["pending", "ready", "in_progress", "completed", "failed", "skipped", "pending_review", "revision_needed"]


class Task(TypedDict, total=False):
    """A single task item in a plan: description, status, assigned agent, and bookkeeping fields."""
    id: str                            # unique task identifier
    description: str                   # task description
    status: TaskStatus                 # task status
    agent: Optional[str]               # name of the (suggested) executing agent
    created_at: str                    # creation time (ISO format)
    updated_at: str                    # last update time (ISO format)
    completed_at: Optional[str]        # completion time (ISO format)
    dependencies: Optional[List[str]]  # IDs of tasks this task depends on
    notes: Optional[str]               # execution notes (updated by the agent or the Supervisor)
    evaluation: Optional[str]          # result assessment (by the Supervisor LLM or the Evaluator agent)
    result: Optional[Any]              # (optional) summary of the task's direct output


class Plan(TypedDict, total=False):
    """A complete plan: overall status, task list, and bookkeeping timestamps."""
    status: PlanningStatus             # plan status
    tasks: List[Task]                  # task list
    current_task_id: Optional[str]     # task the Supervisor is currently focused on / processing
    created_at: str                    # creation time (ISO format)
    updated_at: str                    # last update time (ISO format)
    completed_at: Optional[str]        # completion time (ISO format)
    title: Optional[str]               # plan title
    description: Optional[str]         # plan description (usually the original user request)


# Extended base AgentState with planning support for the Supervisor graph.
# Note: TypedDict fields cannot carry runtime defaults, so optionality is
# expressed via Optional[...] rather than `= None` assignments.
class PlanningAgentState(TypedDict):
    """State schema for the Supervisor graph, with planning support."""
    messages: Annotated[Sequence[BaseMessage], add_messages]  # message history
    plan: Optional[Plan]               # the plan object
    # last_agent_result: Optional[Dict[str, Any]]  # {name: ..., content: ...} of the sub-agent that just finished
    is_last_step: IsLastStep           # LangGraph internal flag
    remaining_steps: RemainingSteps    # LangGraph internal counter, guards against infinite loops
    error: Optional[str]               # records errors raised during execution
    # Additional globally shared state fields can be added here as needed,
    # e.g.: shared_context: Optional[Dict]


# A slightly slimmer state for sub-agents that do not need the plan.
class BasicAgentState(TypedDict):
    """Basic agent state: message history only."""
    messages: Annotated[Sequence[BaseMessage], add_messages]
    is_last_step: IsLastStep
    remaining_steps: RemainingSteps
    error: Optional[str]


# Convenience alias for type hints
StateSchemaType = Union[Dict[str, Any], PlanningAgentState, BasicAgentState]

================================================
FILE: core/agents/state_based_supervisor/supervisor_graph.py
================================================
# reason_graph/supervisor_graph.py
import inspect
import re
import functools
import uuid
import asyncio
import anyio
import traceback
from typing import Any, Callable, List, Optional, Type, Union, Dict, Literal, Sequence, cast  # cast used below

from langchain_core.language_models import BaseChatModel, LanguageModelLike
from langchain_core.tools import BaseTool
from langchain_core.messages import AIMessage, ToolMessage, BaseMessage, ToolCall, SystemMessage
from langchain_core.runnables import RunnableConfig
from langgraph.utils.runnable import RunnableCallable
from langgraph.graph import END, START, StateGraph
from langgraph.graph.state import CompiledStateGraph
from langgraph.prebuilt import ToolNode
from langgraph.pregel import Pregel

# Internal imports
try:
    from core.agents.base.base_agent import BaseAgent
    from .handoff import create_handoff_tool, _normalize_agent_name
    from .state_schema import PlanningAgentState, Plan
    from .supervisor_node import supervisor_node_logic                  # async node logic
    from .planner_node import planner_node_logic, planner_node_logic_sync
    from .evaluate_result_node import evaluate_result_node_logic, evaluate_result_node_logic_sync
    from .agent_name import AgentNameMode, with_agent_name
except ImportError as e:
    print(f"Error importing modules in supervisor_graph.py: {e}")
    # Dummy fallbacks so type hints still resolve
    class BaseAgent: pass
    class PlanningAgentState(Dict): pass
    class Plan(Dict): pass
    class Pregel: pass
    AgentNameMode = Literal["inline"]
    def create_handoff_tool(*args, **kwargs): return None  # type: ignore
    def _normalize_agent_name(s: str) -> str: return s
    async def supervisor_node_logic(*args, **kwargs): return {}
    async def planner_node_logic(*args, **kwargs): return {}
    def planner_node_logic_sync(*args, **kwargs): return {}
    async def evaluate_result_node_logic(*args, **kwargs): return {}
    def evaluate_result_node_logic_sync(*args, **kwargs): return {}
    def with_agent_name(model, mode): return model

# OutputMode, MODELS_NO_PARALLEL_TOOL_CALLS, _supports_disable_parallel_tool_calls (unchanged)
OutputMode = Literal["full_history", "last_message"]
MODELS_NO_PARALLEL_TOOL_CALLS = {"o3-mini"}

def _supports_disable_parallel_tool_calls(model: LanguageModelLike) -> bool:
    if not isinstance(model, BaseChatModel):
        return False
    if hasattr(model, "model_name") and model.model_name in MODELS_NO_PARALLEL_TOOL_CALLS:
        return False
    if not hasattr(model, "bind_tools"):
        return False
    if "parallel_tool_calls" not in inspect.signature(model.bind_tools).parameters:
        return False
    return True

# _make_call_agent (unchanged -- already supports sync and async invocation)
def _make_call_agent(
    agent_graph: Pregel,
    output_mode: OutputMode,
    add_handoff_back_messages: bool,
supervisor_name: str, ) -> RunnableCallable: if output_mode not in ["full_history", "last_message"]: raise ValueError(...) async def acall_agent(state: Dict, config: Optional[RunnableConfig] = None) -> Dict: agent_name = getattr(agent_graph, 'name', 'sub_agent') print(f"🟡 [Async invoke] Handoff to agent '{agent_name}'") sub_agent_input = {"messages": state.get("messages", [])} output: Dict[str, Any] = {} agent_error: Optional[str] = None try: output = await agent_graph.ainvoke(sub_agent_input, config=config) print(f"✅ [Async invoke] Agent '{agent_name}' completed.") except Exception as e: print(f"!!! Error during sub-agent {agent_name} ainvoke: {e}"); traceback.print_exc() agent_error = f"Error executing agent '{agent_name}': {type(e).__name__}" sub_agent_messages: List[BaseMessage] = output.get("messages", []) returned_messages: List[BaseMessage] = [] if not sub_agent_messages and not agent_error: returned_messages = [AIMessage(content="(No output received from agent)", name=agent_name)] elif output_mode == "last_message": last_ai_message = next((m for m in reversed(sub_agent_messages) if isinstance(m, AIMessage)), None) returned_messages = [last_ai_message] if last_ai_message else sub_agent_messages[-1:] else: returned_messages = sub_agent_messages last_content = agent_error if not last_content and returned_messages: last_content = str(returned_messages[-1].content) if hasattr(returned_messages[-1], 'content') else "(No textual content)" return { "messages": returned_messages, "last_agent_result": { "agent_name": agent_name, "content": last_content or "(Agent execution finished without specific output or error)" } } def call_agent(state: Dict, config: Optional[RunnableConfig] = None) -> Dict: agent_name = getattr(agent_graph, 'name', 'sub_agent') print(f"🟡 [Sync invoke] Handoff to agent '{agent_name}'") sub_agent_input = {"messages": state.get("messages", [])} output: Dict[str, Any] = {} agent_error: Optional[str] = None try: output = agent_graph.invoke(sub_agent_input, config=config); print(f"✅ [Sync invoke] Agent '{agent_name}' completed.") except NotImplementedError: agent_error = f"Error: Sync invoke not supported by agent '{agent_name}'."; print(agent_error) except Exception as e: agent_error = f"Error during sub-agent {agent_name} invoke: {e}"; print(f"!!! 
{agent_error}") sub_agent_messages: List[BaseMessage] = output.get("messages", []) returned_messages: List[BaseMessage] = [] if not sub_agent_messages and not agent_error: returned_messages = [AIMessage(content="(No output received)", name=agent_name)] elif output_mode == "last_message": last_ai_message = next((m for m in reversed(sub_agent_messages) if isinstance(m, AIMessage)), None) returned_messages = [last_ai_message] if last_ai_message else sub_agent_messages[-1:] else: returned_messages = sub_agent_messages last_content = agent_error if not last_content and returned_messages: last_content = str(returned_messages[-1].content) if hasattr(returned_messages[-1], 'content') else "(No content)" return { "messages": returned_messages, "last_agent_result": { "agent_name": agent_name, "content": last_content or "(Agent sync execution finished)" } } return RunnableCallable(func=call_agent, afunc=acall_agent, name=f"Call_{getattr(agent_graph, 'name', 'sub_agent')}") def supervisor_node_logic_sync( state: PlanningAgentState, config: Optional[RunnableConfig], model: Any, supervisor_name: str, agent_description_map: Dict[str, str] ) -> Dict[str, Any]: print(f"--- Entering Supervisor Node (Sync Wrapper) ---") try: return anyio.run( supervisor_node_logic, state, config, model, supervisor_name, agent_description_map ) except Exception as e: print(f"Error running supervisor_node_logic synchronously using anyio: {e}") import traceback traceback.print_exc() return {"error": f"Sync execution wrapper failed: {e}", "messages": state.get("messages",[])} def create_supervisor( model: LanguageModelLike, sub_agents: List[BaseAgent], state_schema: Type[PlanningAgentState] = PlanningAgentState, config_schema: Type[Any] | None = None, tools: list[BaseTool | Callable] | None = None, output_mode: OutputMode = "last_message", add_handoff_back_messages: bool = False, supervisor_name: str = "supervisor", planner_node_name: str = "planner", evaluator_node_name: str = "evaluate_result", handoff_executor_name: str = "handoff_executor", include_agent_name: AgentNameMode | None = "inline", ) -> StateGraph: agent_graphs: Dict[str, Pregel] = {} agent_names: List[str] = [] agent_description_map: Dict[str, str] = {} # --- 1. 提取 Agent 信息 --- for agent in sub_agents: if not isinstance(agent, BaseAgent): raise TypeError(...) if not agent.name or agent.name == "LangGraph": raise ValueError(...) if agent.name in agent_graphs: raise ValueError(...) agent_names.append(agent.name) agent_description_map[agent.name] = getattr(agent, 'description', '...') try: compiled_graph = agent.get_agent() if not isinstance(compiled_graph, Pregel): core_graph = getattr(compiled_graph, 'last', None) if isinstance(core_graph, Pregel): compiled_graph = core_graph else: raise TypeError(f"Could not retrieve Pregel instance from agent '{agent.name}'.get_agent()") agent_graphs[agent.name] = compiled_graph except Exception as e: raise e # --- 2. 创建 Handoff 工具 --- handoff_tools = [create_handoff_tool(agent_name=name) for name in agent_names] supervisor_callable_tools = (tools or []) + handoff_tools print(f"Supervisor '{supervisor_name}' bound with tools: {[t.name for t in supervisor_callable_tools]}") # --- 3. 
    # Bind tools to the supervisor model ---
    bound_supervisor_model: LanguageModelLike
    if not supervisor_callable_tools:
        print(f"Warning: Supervisor '{supervisor_name}' has no tools bound.")
        bound_supervisor_model = model
    elif _supports_disable_parallel_tool_calls(model):
        bound_supervisor_model = model.bind_tools(supervisor_callable_tools, parallel_tool_calls=False)
    else:
        bound_supervisor_model = model.bind_tools(supervisor_callable_tools)
    if include_agent_name:
        bound_supervisor_model = with_agent_name(bound_supervisor_model, include_agent_name)

    # --- 4. Build the StateGraph ---
    builder = StateGraph(state_schema, config_schema=config_schema)

    # --- 5. Add the Planner node (sync/async wrappers) ---
    planner_logic_partial_async = functools.partial(
        planner_node_logic,
        model=model,
        agent_description_map=agent_description_map,
    )
    planner_logic_partial_sync = functools.partial(
        planner_node_logic_sync,
        model=model,
        agent_description_map=agent_description_map,
    )
    planner_runnable = RunnableCallable(
        func=planner_logic_partial_sync,
        afunc=planner_logic_partial_async,
        name=planner_node_name
    )
    builder.add_node(planner_node_name, planner_runnable)

    # --- 6. Add the Supervisor node (sync/async wrappers) ---
    supervisor_logic_partial_async = functools.partial(
        supervisor_node_logic,
        model=bound_supervisor_model,
        supervisor_name=supervisor_name,
        agent_description_map=agent_description_map,
    )
    supervisor_logic_partial_sync = functools.partial(
        supervisor_node_logic_sync,
        model=bound_supervisor_model,
        supervisor_name=supervisor_name,
        agent_description_map=agent_description_map,
    )
    supervisor_runnable = RunnableCallable(
        func=supervisor_logic_partial_sync,
        afunc=supervisor_logic_partial_async,
        name=supervisor_name
    )
    builder.add_node(supervisor_name, supervisor_runnable)

    # --- 7. Add the sub-agent nodes; each one routes to the Evaluator when finished ---
    for name, compiled_graph in agent_graphs.items():
        builder.add_node(name, _make_call_agent(compiled_graph, output_mode, add_handoff_back_messages, supervisor_name))
        builder.add_edge(name, evaluator_node_name)

    # --- 8. Add the handoff tool execution node ---
    handoff_executor_node = ToolNode(handoff_tools, name=handoff_executor_name)
    builder.add_node(handoff_executor_name, handoff_executor_node)

    # --- 9. Add the evaluate-result node ---
    # The Evaluator does not need the model or the agent descriptions as direct parameters.
    evaluator_runnable = RunnableCallable(func=evaluate_result_node_logic_sync, afunc=evaluate_result_node_logic, name=evaluator_node_name)
    builder.add_node(evaluator_node_name, evaluator_runnable)  # type: ignore

    # --- 10. Wire up the graph's entry point and edges ---
    builder.set_entry_point(planner_node_name)
    builder.add_edge(planner_node_name, supervisor_name)

    def route_from_supervisor(state: PlanningAgentState) -> str:
        messages = state.get('messages', [])
        plan = state.get('plan')
        last_message = messages[-1] if messages else None
        if not isinstance(last_message, AIMessage):
            print("Routing: Last message not AIMessage, looping supervisor.")
            return supervisor_name
        if last_message.tool_calls:
            tool_call = last_message.tool_calls[0]
            agent_name_match = re.match(r"transfer_to_(\w+)", tool_call["name"])
            if agent_name_match and agent_name_match.group(1) in agent_names:
                extracted_name = agent_name_match.group(1)
                print(f"DEBUG route_from_supervisor: Tool Call Name = {repr(tool_call['name'])}")
                print(f"DEBUG route_from_supervisor: Extracted Target Name = {repr(extracted_name)}")
                print(f"DEBUG route_from_supervisor: Available Agent Names = {repr(agent_names)}")
                print(f"Routing: Supervisor -> HandoffExecutor (for {extracted_name})")
                return handoff_executor_name
            else:
                # `agent_name_match` may be None here, so avoid referencing its groups.
                print(f"DEBUG route_from_supervisor: Membership check failed for tool {repr(tool_call['name'])} against {repr(agent_names)}.")
                print(f"Warning: Supervisor called unknown/invalid tool: {tool_call['name']}. Looping supervisor.")
                return supervisor_name
        if plan and plan.get("status") == "completed":
            print("Routing: Plan completed -> END")
            return END
        print(f"Routing: No tool call and plan not completed (status: {plan.get('status') if plan else 'None'}). Looping supervisor.")
        return supervisor_name

    builder.add_conditional_edges(
        supervisor_name,
        route_from_supervisor,
        {
            handoff_executor_name: handoff_executor_name,
            supervisor_name: supervisor_name,
            END: END,
        }
    )

    # After the Handoff Executor runs, LangGraph follows the Command(goto=...) emitted by
    # the handoff tool straight to the target sub-agent, so no explicit edge is needed here.
    # Sub-agent -> Evaluator edges were added in step 7; the Evaluator hands control back
    # to the Supervisor:
    builder.add_edge(evaluator_node_name, supervisor_name)

    print("Supervisor graph definition created with Planner and Evaluator nodes.")
    return builder  # return the StateGraph definition

================================================
FILE: core/agents/state_based_supervisor/supervisor_node.py
================================================
# reason_graph/supervisor_node.py
import re
import json
import time
import copy
import ast
import traceback
from typing import Dict, Any, List, Optional, Union, cast
from datetime import datetime

from langchain_core.messages import BaseMessage, AIMessage, SystemMessage, HumanMessage, ToolMessage
from langchain_core.messages import ToolCall
from langchain_core.runnables import RunnableConfig
from langgraph.graph import END

# Internal imports (make sure the paths are correct)
try:
    from .state_schema import PlanningAgentState, TaskStatus, Plan
    from .planning_handler import PlanningStateHandler
    from .prompt import SUPERVISOR_PLANNING_PROMPT_TEMPLATE
except ImportError as e:
    print(f"Error importing modules in supervisor_node.py: {e}")
    # Fallbacks
    class PlanningAgentState(Dict): pass
    class Plan(Dict): pass
    class PlanningStateHandler:
        @staticmethod
        def update_task(*args, **kwargs): return kwargs.get('plan')
        @staticmethod
        def create_plan(*args, **kwargs): return {}
        @staticmethod
        def add_tasks(*args, **kwargs): return kwargs.get('plan')
        @staticmethod
        def finish_plan(*args, **kwargs): return kwargs.get('plan')
        @staticmethod
        def get_task(*args, **kwargs): return None
        @staticmethod
        def update_plan_status(*args, **kwargs): return kwargs.get('plan')
        @staticmethod
        def set_current_task(*args, **kwargs): return kwargs.get('plan')
    SUPERVISOR_PLANNING_PROMPT_TEMPLATE = "Fallback Prompt: Error loading template."
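# Illustrative note (a sketch, not part of the original module): the helper below,
# parse_directive_args, expects a directive string whose first token is the command
# word and whose tail is a JSON object, matching the formats mandated by
# SUPERVISOR_PLANNING_PROMPT_TEMPLATE. Hypothetical inputs and outputs (the UUID
# fragment is made up):
#
#   parse_directive_args('UPDATE_TASK {"by_id": "9b2e7c1a-...", "status": "in_progress"}')
#     -> {"by_id": "9b2e7c1a-...", "status": "in_progress"}
#   parse_directive_args("ADD_TASKS {'tasks': [{'description': 'x'}]}")
#     -> {'tasks': [{'description': 'x'}]}   # single quotes: ast.literal_eval fallback
#   parse_directive_args('FINISH_PLAN {}')
#     -> {}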
# --- Directive argument parsing (JSON, with ast.literal_eval fallback) ---
def parse_directive_args(directive_str: str) -> Dict[str, Any]:
    """Parse the JSON arguments out of a directive string."""
    args = {}
    # Treat everything from the first '{' to the trailing '}' as the JSON payload.
    json_match = re.search(
        r"(\{.*?\})\s*$",
        directive_str.split(maxsplit=1)[1] if len(directive_str.split(maxsplit=1)) > 1 else "",
        re.DOTALL,
    )
    if json_match:
        args_json_str = json_match.group(1)
        try:
            args = json.loads(args_json_str)
            if not isinstance(args, dict):
                raise ValueError("Args JSON not a dict.")
            print(f"DEBUG: Parsed args via JSON: {args}")
            return args
        except json.JSONDecodeError as json_err:
            print(f"Warning: JSON parsing failed ({json_err}), trying ast.literal_eval...")
            try:
                args = ast.literal_eval(args_json_str)
                if not isinstance(args, dict):
                    raise ValueError("ast.literal_eval didn't return dict.")
                print(f"DEBUG: Parsed args via ast.literal_eval: {args}")
                return args
            except Exception as ast_err:
                raise ValueError(f"Failed to parse args: {ast_err}. Raw: '{args_json_str}'") from ast_err
    elif directive_str.strip().upper().endswith("{}"):
        # Handles the FINISH_PLAN {} case
        return {}
    else:
        # No valid JSON arguments found; warn and return empty args.
        print(f"Warning: Could not find valid JSON arguments in directive: '{directive_str}'. Returning empty args.")
        return {}


# --- Supervisor node core logic (result handling removed; sets current_task_id) ---
async def supervisor_node_logic(
    state: PlanningAgentState,
    config: Optional[RunnableConfig],
    model: Any,
    supervisor_name: str,
    agent_description_map: Dict[str, str]
) -> Dict[str, Any]:
    """Supervisor node core logic (no longer updates task status from agent results)."""
    print(f"--- Entering Supervisor Node ({supervisor_name}) ---")
    messages: List[BaseMessage] = state.get('messages', [])
    plan: Optional[Plan] = state.get('plan')
    current_error = state.get('error'); state['error'] = None
    if current_error:
        print(f" Supervisor saw previous error: {current_error}")

    # --- 0. Check that a plan exists (unchanged) ---
    if not plan:
        print("ERROR: Supervisor node requires a plan, but none found in state.")
        return {"error": "Plan is missing.", "messages": []}

    # --- 1. Prepare the prompt (unchanged) ---
    plan_json_str = json.dumps(plan, indent=2, ensure_ascii=False)
    desc_list = [f"- {name}: {desc}" for name, desc in agent_description_map.items()]
    desc_list.append(f"- {supervisor_name}: Coordinates tasks...")
    agent_descriptions_str = "\n".join(desc_list)
    system_prompt_text = "Error loading/formatting prompt"
    try:
        current_date_str = datetime.now().strftime("%a, %b %d, %Y")
        system_prompt_text = SUPERVISOR_PLANNING_PROMPT_TEMPLATE.format(
            plan_json=plan_json_str,
            agent_descriptions=agent_descriptions_str,
            current_date=current_date_str
        )
    except Exception as e:
        print(f"ERROR loading/formatting prompt: {e}")
    llm_input_messages = [SystemMessage(content=system_prompt_text)] + messages

    # --- 2. Call the Supervisor LLM (unchanged) ---
    print("--- Calling Supervisor LLM ---"); response = None; llm_error_msg = None
    try:
        response = await model.ainvoke(llm_input_messages, config=config)
        if not isinstance(response, AIMessage):
            raise TypeError(f"LLM returned non-AIMessage: {type(response)}")
        if not response.name:
            response.name = supervisor_name
        print(f"Supervisor LLM Raw Response Content: {response.content[:300]}...")
        if response.tool_calls:
            print(f"Supervisor LLM Tool Calls: {response.tool_calls}")
        messages_to_add = [response]
    except Exception as e:
        print(f"!!! Error invoking Supervisor LLM: {e}"); traceback.print_exc()
        llm_error_msg = f"LLM failed: {e}"; messages_to_add = []; response = None

    # --- 3. Process the LLM reply ---
    plan_updated: bool = False
    updated_plan: Optional[Plan] = copy.deepcopy(plan)  # start from the current plan
    directive_error_msg: Optional[str] = None
    task_id_to_delegate: Optional[str] = None  # task ID to delegate this turn

    if response and isinstance(response.content, str):
        # --- A. First parse and apply all PLAN_UPDATE directives
        #        (handling of status='completed'/'failed' has been removed) ---
        try:
            plan_directives = re.findall(r"PLAN_UPDATE:\s*(\w+)\s*(\{.*?\})\s*$", response.content, re.IGNORECASE | re.DOTALL | re.MULTILINE)
            plan_directives.extend(re.findall(r"PLAN_UPDATE:\s*(FINISH_PLAN)\s*(\{\})\s*$", response.content, re.IGNORECASE | re.DOTALL | re.MULTILINE))
            if plan_directives:
                print(f"Found {len(plan_directives)} PLAN_UPDATE directive(s).")
            for command, args_json_str in plan_directives:
                command = command.upper(); args_json_str = args_json_str if args_json_str else "{}"
                print(f"Processing directive: {command} with args JSON: {args_json_str[:100]}...")
                try:
                    args = json.loads(args_json_str)  # parse as JSON
                    if not isinstance(args, dict):
                        raise ValueError("Args not dict.")
                    # --- Apply the planning directive ---
                    if command == "ADD_TASKS":
                        if not updated_plan:
                            raise ValueError("No plan.")
                        tasks = args.get("tasks", [])
                        if isinstance(tasks, list):
                            # Force newly added tasks to start as 'pending'
                            for task_data in tasks:
                                task_data['status'] = 'pending'
                            updated_plan = PlanningStateHandler.add_tasks(updated_plan, tasks); plan_updated = True
                        else:
                            raise ValueError("Invalid 'tasks'.")
                    elif command == "UPDATE_TASK":
                        if not updated_plan:
                            raise ValueError("No plan.")
                        by_id = args.get("by_id")
                        if not by_id or not isinstance(by_id, str):
                            raise ValueError("Requires string 'by_id'.")
                        by_id = by_id.strip()
                        task_exists = PlanningStateHandler.get_task(updated_plan, by_id)
                        if not task_exists:
                            raise ValueError(f"Task ID '{by_id}' not found!")
                        # Only apply 'in_progress' (non-terminal) status changes here, plus
                        # notes/evaluation. 'evaluation' records the LLM's own assessment.
                        new_status = args.get("status"); notes_text = args.get("notes"); eval_text = args.get("evaluation")
                        update_kwargs = {}
                        # Deliberately NOT setting "completed", "failed", or "pending_review" here.
                        if new_status and new_status == "in_progress":
                            update_kwargs['new_status'] = "in_progress"
                            task_id_to_delegate = by_id  # remembered; applied just before handoff
                        # notes and evaluation can always be updated when the LLM provides them
                        if notes_text is not None: update_kwargs['new_notes'] = notes_text
                        if eval_text is not None: update_kwargs['new_evaluation'] = eval_text
                        if update_kwargs:  # only call when there is actually something to update
                            print(f"Updating task {by_id} with: {update_kwargs}")
                            updated_plan = PlanningStateHandler.update_task(updated_plan, by_id=by_id, **update_kwargs); plan_updated = True
                    elif command == "FINISH_PLAN":
                        if not updated_plan:
                            raise ValueError("No plan.")
                        updated_plan = PlanningStateHandler.finish_plan(updated_plan); plan_updated = True
                    else:
                        print(f"Warning: Unknown PLAN_UPDATE command '{command}' ignored by Supervisor.")
                except (json.JSONDecodeError, ValueError, KeyError, TypeError) as e:
                    err_msg = f"Error processing plan directive '{command} {args_json_str}': {type(e).__name__} - {e}"
                    print(err_msg); traceback.print_exc()
                    if not directive_error_msg: directive_error_msg = err_msg  # keep only the first error
                except Exception as e:
                    err_msg = f"Unexpected error processing directive '{command} {args_json_str}': {type(e).__name__} - {e}"
                    print(err_msg); traceback.print_exc()
                    if not directive_error_msg: directive_error_msg = err_msg
            # --- Recompute the plan status ---
            if plan_updated and updated_plan:
                updated_plan = PlanningStateHandler.update_plan_status(updated_plan)
                print(f"Plan status after updates by Supervisor: {updated_plan.get('status')}")
        except Exception as outer_e:
            err_msg = f"Error occurred while searching for PLAN_UPDATE
directives: {outer_e}" print(err_msg); traceback.print_exc() if not directive_error_msg: directive_error_msg = err_msg # --- B. 检查 Tool Calls 并设置 Current Task ID --- handoff_tool_call: Optional[Dict] = None # 显式初始化 if response and response.tool_calls: for tool_call in response.tool_calls: agent_name_match = re.match(r"transfer_to_(\w+)", tool_call["name"]) # **使用 agent_description_map.keys() 来检查** if agent_name_match and agent_name_match.group(1) in agent_description_map.keys(): handoff_tool_call = cast(Dict, tool_call) # 找到第一个有效的就用它 break # 如果决定 Handoff,尝试设置 plan 中的 current_task_id if handoff_tool_call and updated_plan: # **关键**: 尝试从 Tool Call 的 args 中获取 task_id (Prompt 要求 LLM 必须提供) tool_args = handoff_tool_call.get("args", {}) task_id_from_tool = tool_args.get("task_id") if isinstance(tool_args, dict) else None # 如果 Tool args 中没有,再使用之前记录的 task_id_to_delegate (标记为 in_progress 的) effective_task_id = task_id_from_tool or task_id_to_delegate if effective_task_id: print(f"Setting current_task_id in plan to: {effective_task_id}") try: # 验证 ID 存在 if PlanningStateHandler.get_task(updated_plan, effective_task_id): updated_plan = PlanningStateHandler.set_current_task(updated_plan, effective_task_id) # plan_updated 标志可能已经被 Plan Directive 设置,这里不需要重复设置 else: print(f"Warning: Task ID '{effective_task_id}' provided for delegation not found. Cannot set current_task_id.") # 记录错误,阻止 Handoff? 或者让路由回到 Supervisor? directive_error_msg = directive_error_msg or f"Invalid Task ID '{effective_task_id}' for delegation." except Exception as e: err_msg = f"Error setting current_task_id to '{effective_task_id}': {e}" print(f"ERROR: {err_msg}") if not directive_error_msg: directive_error_msg = err_msg # --- 4. 准备最终返回的状态更新字典 --- updates: Dict[str, Any] = {"messages": messages_to_add} if updated_plan is not None: updates["plan"] = updated_plan elif plan is not None: updates["plan"] = plan final_error = llm_error_msg or directive_error_msg if final_error: updates["error"] = final_error elif state.get("error"): updates["error"] = None # 清除旧错误 print(f"--- Exiting Supervisor Node. Plan updated this step: {plan_updated} ---") return updates ================================================ FILE: core/agents/sub_agents/__init__.py ================================================ ================================================ FILE: core/agents/sub_agents/coder_agent.py ================================================ # Refactored coder_agent.py from typing import Any, List, Optional, Union, Callable, Type from langchain_core.language_models import LanguageModelLike from langchain_core.tools import BaseTool from langchain_core.messages import SystemMessage from langgraph.types import Checkpointer from core.agents.base.react_agent import ReactAgent from core.tools.registry import get_tools_by_category, ToolCategory, get_tool_instance # Import get_tool_instance import logging logger = logging.getLogger(__name__) class CoderAgent(ReactAgent): """ Coder Agent (Refactored) - Interacts with a sandboxed Linux environment via code execution tools. """ def __init__( self, name: str = "coder_expert", model: LanguageModelLike = None, tools: Optional[List[Union[BaseTool, Callable]]] = None, checkpointer: Optional[Checkpointer] = None, max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = 100000, # Coding might need more context **kwargs ): # 1. Define Description description = "Writes, executes, tests, and debugs Python code and Linux shell commands within a secure sandboxed environment. 
Can install packages, manage files, and interact with the network." # 2. Get Tools from Registry agent_tools = [] default_tool_name = "e2b_code_interpreter" # Expected tool name try: code_tools = get_tools_by_category(ToolCategory.CODE_INTERPRETER) + get_tools_by_category(ToolCategory.FILE_SYSTEM) agent_tools.extend(code_tools) # Optionally add file system tools if not included in interpreter tool # fs_tools = get_tools_by_category(ToolCategory.FILE_SYSTEM) # agent_tools.extend(fs_tools) print(f"[{name}] Loaded tools from registry: {[t.name for t in agent_tools if hasattr(t,'name')]}") # Verify the main execution tool is present if not any(getattr(t,'name', None) == default_tool_name for t in agent_tools): print(f"CRITICAL Warning: CoderAgent '{name}' is missing the primary '{default_tool_name}' tool!") # Attempt to get it specifically if missing? specific_tool = get_tool_instance(default_tool_name) if specific_tool: agent_tools.append(specific_tool) except Exception as e: print(f"Warning: Failed to get tools from registry for {name}: {e}") if tools: # Merge extra tools existing_names = {t.name for t in agent_tools if hasattr(t,'name')} agent_tools.extend([t for t in tools if getattr(t, 'name', None) not in existing_names]) if not agent_tools: print(f"CRITICAL Warning: CoderAgent '{name}' initialized with NO tools!") # 3. Define System Prompt (using the capabilities) tool_name_for_prompt = next((t.name for t in agent_tools if hasattr(t, 'name') and 'code' in t.name.lower()), default_tool_name) # Try to get actual tool name base_prompt = f"""You are an expert Coder Agent interacting with a secure, sandboxed Linux environment provided by the '{tool_name_for_prompt}' tool. Your goal is to fulfill coding, file manipulation, or shell command requests by generating and executing appropriate code or commands within this sandbox. Available Tools: {self._format_tools_for_prompt(agent_tools)} - **{tool_name_for_prompt}**: Executes Python code or shell commands within the sandboxed Linux environment. Returns stdout, stderr, execution errors, and potentially file outputs or structured results (like image data). To run shell commands, generate Python code that uses the 'subprocess' module OR if the tool directly supports it, prefix the command with '!'. Always prefer generating Python code for complex shell operations or when needing output capture. Key Capabilities of the Sandbox Environment (via the tool): - Execute Python 3 code. - Install Python packages using pip (generate code like `import subprocess; subprocess.run(['pip', 'install', 'requests'], check=True)`). - Run standard Linux shell commands (e.g., `ls`, `pwd`, `mkdir`, `curl`, `git`, etc. using Python's subprocess). - Access and manipulate a persistent filesystem within the sandbox (typically starting in `/home/user/` or `/`). Create, read, write, delete files and directories. - Access the internet from within the sandbox for tasks like cloning repos or fetching data. Workflow & Instructions: 1. **Analyze Request**: Understand the goal, constraints, and required inputs/outputs. 2. **Plan Steps**: Outline the necessary code or commands. Consider file paths, dependencies, and error handling. 3. **Generate Code/Command**: Write the Python code or shell command sequence needed. For non-trivial Python, include comments. 4. **Execute using Tool**: Prepare the arguments for the '{tool_name_for_prompt}' tool (usually the code string or command string) and invoke the tool. 5. 
**Analyze Output**: Carefully review the stdout, stderr, errors, and any results returned by the tool. 6. **Debug/Iterate**: If errors occurred or the output is not as expected, analyze the error, revise the code/command, and execute again using the tool. 7. **Final Output**: Once the task is successfully completed, provide the final working code (if relevant), a summary of the execution results (stdout/stderr highlights), confirmation of file operations, and any requested explanation. If the task cannot be completed, explain why. 8. **File Handling**: If generating files (code, data, images), clearly state the full path within the sandbox where the file was saved (e.g., `/home/user/my_script.py`, `/home/user/output.csv`). Do not attempt to display images directly in your response. Focus strictly on tasks achievable within the sandboxed environment using the provided tool. Be precise and careful with file paths and commands. """ # 4. Call super().__init__ super().__init__( name=name, model=model, tools=agent_tools, prompt=base_prompt, description=description, checkpointer=checkpointer, max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, **kwargs ) print(f"CoderAgent '{self.name}' initialized with tools: {[t.name for t in self.tools if hasattr(t,'name')]}") # Inherits _format_tools_for_prompt and other methods from BaseAgent/ReactAgent ================================================ FILE: core/agents/sub_agents/data_analyst_agent.py ================================================ # data_analyst_agent.py (or in main.py) from typing import Any, List, Optional, Union, Callable, Type from langchain_core.language_models import LanguageModelLike from langchain_core.tools import BaseTool from langchain_core.messages import SystemMessage from langgraph.types import Checkpointer # Internal imports - ensure paths are correct from core.agents.base.react_agent import ReactAgent from core.tools.registry import get_tools_by_category, ToolCategory, get_tool_instance # Import necessary functions import logging logger = logging.getLogger(__name__) # Assume ToolCategory.CODE_INTERPRETER exists # Assume ToolCategory.FILE_SYSTEM exists if needed class DataAnalystAgent(ReactAgent): """ Data Analyst Agent (Refactored) - Focuses on analyzing structured data using code execution sandbox. - Generates insights and saves visualizations to files. """ def __init__( self, name: str = "data_analyst_expert", model: LanguageModelLike = None, tools: Optional[List[Union[BaseTool, Callable]]] = None, checkpointer: Optional[Checkpointer] = None, max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = 120000, # Analysis might need decent context debug: bool = False, **kwargs ): # 1. Define Description for Supervisor description = "Analyzes structured data (provided in context or potentially read from sandbox files) using Python (Pandas, NumPy, Matplotlib, Seaborn) within a secure code execution environment. Performs statistical analysis, identifies trends, generates insights, and creates data visualizations (saved as files in the sandbox)." # 2. 
Get Tools from Registry agent_tools = [] default_tool_name = "e2b_code_interpreter" # Tool needed for execution try: # Primarily needs Code Interpreter code_tools = get_tools_by_category(ToolCategory.CODE_INTERPRETER) + get_tools_by_category(ToolCategory.FILE_SYSTEM) # 需要代码和文件工具 agent_tools.extend(code_tools) # Optionally, add File System tools if needed to read data files # fs_tools = get_tools_by_category(ToolCategory.FILE_SYSTEM) # agent_tools.extend(fs_tools) print(f"[{name}] Loaded tools from registry: {[t.name for t in agent_tools if hasattr(t,'name')]}") # Verify the main execution tool is present if not any(getattr(t,'name', None) == default_tool_name for t in agent_tools): print(f"CRITICAL Warning: DataAnalystAgent '{name}' is missing the primary '{default_tool_name}' tool!") specific_tool = get_tool_instance(default_tool_name) if specific_tool: agent_tools.append(specific_tool) except Exception as e: print(f"Warning: Failed to get tools from registry for {name}: {e}") if tools: # Merge extra tools existing_names = {t.name for t in agent_tools if hasattr(t,'name')} agent_tools.extend([t for t in tools if getattr(t, 'name', None) not in existing_names]) if not agent_tools: print(f"CRITICAL Warning: DataAnalystAgent '{name}' initialized with NO execution tools!") # 3. Define System Prompt tool_name_for_prompt = next((t.name for t in agent_tools if hasattr(t, 'name') and 'code' in t.name.lower()), default_tool_name) base_prompt = f"""You are an expert Data Analyst. Your task is to analyze data using Python code within a secure sandbox environment accessed via the '{tool_name_for_prompt}' tool. Libraries like Pandas, NumPy, Matplotlib, and Seaborn are available (install if needed using pip in your code). Available Tools: {self._format_tools_for_prompt(agent_tools)} - **{tool_name_for_prompt}**: Executes Python code in the sandbox. Returns stdout, stderr, errors, and potentially structured results. Key Instructions: 1. **Understand Data & Goal**: Identify the data source (likely provided in previous messages or mentioned as a sandbox file path like '/home/user/data.csv') and the specific analysis question or goal. 2. **Plan Analysis**: Briefly outline the Python code steps (e.g., load data into Pandas DataFrame, clean/transform data, perform calculations, generate plot). 3. **Write Python Code**: Generate the necessary Python code. Use libraries effectively. Import necessary libraries (e.g., `import pandas as pd`, `import matplotlib.pyplot as plt`). 4. **Handle Files (If Needed)**: If reading/writing files within the sandbox, use standard Python file I/O within your code (e.g., `pd.read_csv('/home/user/data.csv')`, `df.to_csv('/home/user/output.csv')`). 5. **Handle Visualizations**: If asked to create plots: * Generate the plot using Matplotlib/Seaborn. * **MUST save the plot to a file** inside the sandbox (e.g., `/home/user/plots/my_plot.png`). Use `plt.savefig('/home/user/plots/my_plot.png')`. Create directories if necessary (`os.makedirs('/home/user/plots', exist_ok=True)`). * Use `plt.show()` or `plt.close()` after saving to clear the plot buffer. * **DO NOT attempt to return image data directly.** Images cannot be displayed in the response. * In your response, **state that the plot was generated and provide the full path** where it was saved in the sandbox (e.g., "I have generated a scatter plot and saved it to /home/user/plots/scatter_plot.png"). 6. **Execute Code**: Use the '{tool_name_for_prompt}' tool to run your complete Python script. 7. 
**Analyze Results**: Interpret the output (stdout, numerical results, errors) from the tool execution. 8. **Present Findings**: Summarize your analysis and findings clearly. Use Markdown tables for structured data if helpful. Mention any plots saved and their paths. If errors occurred, explain them. 9. **Focus**: Concentrate on data analysis using code execution. Do not perform web searches unless specifically instructed and given tools for it. """ # 4. Call super().__init__ super().__init__( name=name, model=model, tools=agent_tools, prompt=base_prompt, description=description, checkpointer=checkpointer, max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, debug=debug, **kwargs ) print(f"DataAnalystAgent '{self.name}' initialized.") # Inherits _format_tools_for_prompt and other methods ================================================ FILE: core/agents/sub_agents/designer_agent.py ================================================ # 文件路径示例: reason_graph/designer_agent.py from typing import Any, List, Optional, Union, Callable, Type from langchain_core.language_models import LanguageModelLike # 确保导入正确类型 from langchain_core.tools import BaseTool from langchain_core.messages import SystemMessage from langgraph.types import Checkpointer # 内部导入 from core.agents.base.react_agent import ReactAgent from core.tools.registry import get_tools_by_category, ToolCategory # 导入 Registry # 假设您的 Flux 工具已注册或在此导入 # from core.tools.flux_image_tool import FluxImageGeneratorTool import logging logger = logging.getLogger(__name__) # 假设的 ToolCategory.IMAGE_GENERATION if not hasattr(ToolCategory, 'IMAGE_GENERATION'): ToolCategory.IMAGE_GENERATION = ToolCategory.OTHER class DesignerAgent(ReactAgent): """ 设计 Agent (重构版) - 能够理解图像上下文,并使用工具生成新的视觉内容。 - 应用设计原则来完成海报、网页等设计任务。 """ def __init__( self, name: str = "designer_expert", model: LanguageModelLike = None, # <--- 必须传入多模态模型 (e.g., gpt-4o) tools: Optional[List[Union[BaseTool, Callable]]] = None, checkpointer: Optional[Checkpointer] = None, max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = 8000, # 调整上下文需求 debug: bool = False, **kwargs ): # 1. 定义 Agent 描述 description = "Understands images provided in context and generates new visual content (images, mockups, diagrams) using specialized image generation tools (like Flux). Can apply design thinking for tasks like poster or web page layout design." # 2. 获取工具 (主要是图像生成工具) agent_tools = [] try: # 从 Registry 获取图像生成工具 img_tools = get_tools_by_category(ToolCategory.IMAGE_GENERATION) agent_tools.extend(img_tools) # 也可以直接实例化 # agent_tools.append(FluxImageGeneratorTool()) # 如果不使用 Registry print(f"[{name}] Loaded tools: {[t.name for t in agent_tools if hasattr(t,'name')]}") except Exception as e: print(f"Warning: Failed to get IMAGE_GENERATION tools for {name}: {e}") if tools: # 合并额外工具 existing_names = {t.name for t in agent_tools if hasattr(t,'name')} agent_tools.extend([t for t in tools if getattr(t, 'name', None) not in existing_names]) if not agent_tools: print(f"CRITICAL Warning: DesignerAgent '{name}' initialized with NO generation tools!") # 3. 定义 System Prompt tool_name_for_prompt = next((t.name for t in agent_tools if hasattr(t, 'name') and 'generat' in t.name.lower()), "image_generator_tool") # 获取工具名 base_prompt = f"""You are an expert Visual Designer and Creative Assistant. Your capabilities include understanding images provided in the conversation history and generating new images using available tools based on detailed text prompts. 
Available Tools: {self._format_tools_for_prompt(agent_tools)} - **{tool_name_for_prompt}**: Use this tool to generate images. Input requires a detailed 'prompt'. Key Instructions & Workflow: 1. **Understand Request**: Analyze the user request, paying attention to both text and any images provided in the message history. Identify the core visual goal (e.g., analyze image, generate image, design layout). 2. **Image Understanding (If Applicable)**: If the request involves analyzing or describing an existing image from the history, provide your analysis directly based on your multimodal understanding. 3. **Design Thinking (For Generation/Design Tasks)**: * **Clarify**: If the request is vague (e.g., "design a logo"), think about necessary elements: target audience, brand feeling, key symbols, color preferences, desired style (minimalist, vintage, futuristic, etc.). You might need to state assumptions if details are missing. * **Conceptualize**: Describe the visual elements, layout, color palette, and overall composition you plan to generate. * **Formulate Prompt for Tool**: Translate your design concept into a **highly detailed and descriptive text prompt** suitable for the `{tool_name_for_prompt}`. Include style, mood, composition, colors, and specific objects. 4. **Use Generation Tool**: Call the `{tool_name_for_prompt}` with the detailed prompt you formulated. 5. **Present Result**: * State that you have generated the image. * Provide the result from the tool (e.g., the image URL or identifier). * Briefly describe the generated image and how it matches the design concept or request. * **Important**: Do NOT attempt to display the image directly in your text response. Only provide the URL or description. 6. **Handle Errors**: If the tool fails, report the error clearly. Focus on visual design and generation tasks. Use your understanding of design principles when conceptualizing visuals for requests like posters or web mockups. """ # 4. 调用父类 __init__ super().__init__( name=name, model=model, # 必须是多模态模型 tools=agent_tools, prompt=base_prompt, description=description, checkpointer=checkpointer, max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, debug=debug, **kwargs ) print(f"DesignerAgent '{self.name}' initialized.") # 继承 _format_tools_for_prompt 和其他 BaseAgent/ReactAgent 方法 ================================================ FILE: core/agents/sub_agents/reporter_agent.py ================================================ # 文件路径: reason_graph/reporter_agent.py import json import time from datetime import datetime from typing import Dict, Any, List, Optional, Union, Type, cast, Sequence # --- LangChain / LangGraph --- from langchain_core.language_models import LanguageModelLike from langchain_core.tools import BaseTool from langchain_core.messages import SystemMessage, HumanMessage, BaseMessage, AIMessage from langchain_core.runnables import RunnableConfig, Runnable from langgraph.graph import StateGraph, END, START # 导入 StateGraph, END, START from langgraph.graph.graph import CompiledGraph from langgraph.types import Checkpointer # --- 内部导入 --- from core.agents.base.base_agent import BaseAgent # 导入最终版 BaseAgent # 导入最终报告的 Prompt 模板 import logging logger = logging.getLogger(__name__) class ReporterAgent(BaseAgent): """ 报告 Agent (最终版) - 继承自 BaseAgent。 - 负责基于完整的消息历史和明确指令生成最终 Markdown 报告。 - 内部包含一个简单的图用于执行报告生成任务。 """ FINAL_REPORT_SYSTEM_PROMPT_TEMPLATE = """You are a professional writer and editor AI assistant. 
Your primary goal is to generate high-quality, well-structured text content based on the specific instructions provided in the latest message and the relevant information available in the preceding conversation history. The current date is {current_date}. **Your Task Execution Workflow:** 1. **Identify Instructions:** Carefully read the **last message** you received, which contains the specific writing task assigned to you by the supervisor. Understand the desired output (e.g., summary, report section, full report), format, tone, and any other requirements. 2. **Gather Context:** Review the preceding messages in the conversation history to find the necessary information, data points, findings, or creative elements needed to complete the assigned task. 3. **Compose Output:** Write the text according to the instructions. * If asked for creative content (like a poem), focus on fulfilling the creative request. * If asked for a summary or section, synthesize the relevant information concisely and accurately. * If asked to compile a **full report**, structure it logically (e.g., Introduction, Body, Conclusion), use Markdown formatting effectively, and incorporate information/citations from the history as instructed. Adhere to any specified length or style guidelines. 4. **Final Response:** Your output should be **only** the requested written text. Do not add extra conversational phrases unless necessary for context. Do not include planning directives or attempt to call tools (unless a specific writing/editing tool was provided and instructed for use). If you cannot fulfill the request due to missing information in the history, state that clearly. """ def __init__( self, name: str = "reporter_expert", model: LanguageModelLike = None, # 应传入适合长文本生成的模型 checkpointer: Optional[Checkpointer] = None, max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = 16000, # 报告生成可能需要处理长上下文 debug: bool = False, prompt_template: str = FINAL_REPORT_SYSTEM_PROMPT_TEMPLATE, # 使用最终报告模板 **kwargs # 接收其他 BaseAgent 参数 ): # 1. 定义 Agent 描述 (给 Supervisor 看) description = "Synthesizes information from the complete conversation history and task results into a final, comprehensive, well-structured, and potentially cited Markdown research report, following specific instructions." # 2. 定义工具列表 (Reporter 通常不需要工具) agent_tools = [] # 3. 存储基础 Prompt 模板 (将在节点逻辑中使用) # 注意:我们将模板本身(或其引用)存储起来,而不是格式化后的 prompt self.report_prompt_template = prompt_template # 4. 调用父类 __init__ super().__init__( name=name, model=model, # 传入用于报告生成的 LLM tools=agent_tools, prompt=None, # BaseAgent 的 prompt 字段不直接用于此 Agent 的核心逻辑 description=description, checkpointer=checkpointer, max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, # **kwargs 传递 debug 等 **kwargs ) print(f"ReporterAgent '{self.name}' initialized.") async def _generate_report_node_logic(self, state: Dict[str, Any], config: RunnableConfig) -> Dict[str, Any]: """报告生成节点的核心逻辑""" # 注意:这里的 state 已经是经过 BaseAgent._preprocess_state 处理后的状态 print(f"--- Entering Node: {self.name}._generate_report_node_logic ---") messages: List[BaseMessage] = state.get("messages", []) # 理论上,所有需要的信息都应该在 messages 历史中, # 特别是 Supervisor 委派时的最后一条指令消息。 if not messages: error_msg = "Error: No messages found in state for report generation." 
            print(error_msg)
            return {"messages": [AIMessage(content=f"# Report Generation Failed\n\n{error_msg}", name=self.name)]}

        # --- Format the system prompt (includes the current date) ---
        try:
            current_date_str = datetime.now().strftime("%a, %b %d, %Y")
            system_prompt = self.report_prompt_template.format(current_date=current_date_str)
        except Exception as e:
            print(f"Error formatting report system prompt: {e}")
            system_prompt = "You are a report writing assistant. Synthesize the provided messages into a final report."  # fallback

        # --- Prepare the LLM input ---
        # The input is the system prompt plus the full, preprocessed (truncated) message
        # history; BaseAgent._preprocess_state has already handled truncation.
        llm_input_messages = [SystemMessage(content=system_prompt)] + messages

        # --- Call the LLM to generate the report ---
        final_report_markdown = ""
        llm_error = None
        try:
            print(f"--- Calling LLM for Final Report Generation ({self.name}) ---")
            # Uses self.model (the LLM instance supplied at init time)
            response = await self.model.ainvoke(llm_input_messages, config=config)
            final_report_markdown = response.content
            print(f"--- Report Generation LLM Call Successful ({self.name}). Length: {len(final_report_markdown)} chars ---")
        except Exception as e:
            print(f"!!! Error during Report Generation LLM call ({self.name}): {e}")
            llm_error = f"Report generation failed due to LLM error: {e}"
            final_report_markdown = f"# Report Generation Failed\n\nError: {str(e)}"
            # A fuller traceback could be printed here:
            # import traceback
            # traceback.print_exc()

        # --- Return the state update containing the report (or the error) ---
        # The reporter's final output is the report itself. It is appended to the message
        # history rather than replacing it, so the caller (Supervisor or main) can see
        # both the full history and the final report.
        return {
            "messages": [AIMessage(content=final_report_markdown, name=self.name)],
            "error": state.get("error") or llm_error  # keep or record the error
        }

    def build(self) -> Optional[StateGraph]:
        """Build the Reporter Agent's simple workflow: Start -> GenerateReport -> End."""
        if self._workflow:
            return self._workflow
        print(f"Building internal graph for ReporterAgent '{self.name}'")
        # The reporter would normally use BasicAgentState, since it never touches the Plan.
        # To stay compatible with a Supervisor that may pass PlanningAgentState, a generic
        # dict state is used here (only `messages` matters to this agent); alternatively a
        # dedicated ReporterState could be defined.
        workflow = StateGraph(Dict[str, Any])
        # Add the report-generation node, making sure it can access self.model.
        # functools.partial does not work directly on async instance methods, so wrap it:
        async def node_wrapper(state, config):
            return await self._generate_report_node_logic(state, config)
        workflow.add_node("generate_report", node_wrapper)  # type: ignore
        workflow.add_edge(START, "generate_report")
        workflow.add_edge("generate_report", END)
        self._workflow = workflow
        return workflow

    # The compile method is inherited from BaseAgent: it calls build() above to get the
    # StateGraph definition, compiles it, and creates the final _executable_agent with the
    # preprocessing step (_preprocess_state) attached.
    # invoke, ainvoke, get_agent (get_executable_agent), and reset are inherited from BaseAgent.

================================================
FILE: core/agents/sub_agents/research_agent.py
================================================
# Example path: reason_graph/research_agent.py
from typing import Any, List, Optional, Union, Callable, Type, cast

from langchain_core.language_models import LanguageModelLike
from langchain_core.tools import BaseTool
from langchain_core.messages import SystemMessage
from langgraph.types import Checkpointer

# Internal imports -- make sure the paths are correct
from core.agents.base.react_agent import ReactAgent
# Tool-registry imports: only get_tools_by_category and ToolCategory are needed
# (importing get_tool or get_registered_tools is no longer necessary)
from core.tools.registry import get_tools_by_category, ToolCategory

import logging
logger = logging.getLogger(__name__)

# Assume ToolCategory has SEARCH and WEB_Browse members; fall back to OTHER if not
if not hasattr(ToolCategory, 'SEARCH'): ToolCategory.SEARCH = ToolCategory.OTHER
if not hasattr(ToolCategory, 'WEB_Browse'): ToolCategory.WEB_Browse = ToolCategory.OTHER
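# Usage sketch (illustrative, not part of the original module) for the ResearchAgent
# defined below. The model choice and the extra Tavily tool are assumptions for this
# example; in this repo the search tools are normally pre-registered in
# core.tools.registry and picked up via get_tools_by_category(ToolCategory.SEARCH).
#
#   from langchain_openai import ChatOpenAI
#   from langchain_community.tools.tavily_search import TavilySearchResults
#
#   agent = ResearchAgent(
#       model=ChatOpenAI(model="gpt-4o"),
#       tools=[TavilySearchResults(max_results=5)],  # merged with registry tools by __init__
#   )
#   graph = agent.get_agent()  # compiled LangGraph, as consumed by create_supervisor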
================================================
FILE: core/agents/sub_agents/research_agent.py
================================================
# Example file path: reason_graph/research_agent.py
from typing import Any, List, Optional, Union, Callable, Type, cast

from langchain_core.language_models import LanguageModelLike
from langchain_core.tools import BaseTool
from langchain_core.messages import SystemMessage
from langgraph.types import Checkpointer

# Internal imports -- make sure the paths are correct
from core.agents.base.react_agent import ReactAgent
# Registry imports -- only get_tools_by_category and ToolCategory are needed
from core.tools.registry import get_tools_by_category, ToolCategory
# *** get_tool / get_registered_tools imports are no longer needed ***

import logging
logger = logging.getLogger(__name__)

# Assume ToolCategory provides SEARCH and WEB_Browse; fall back to OTHER if missing
if not hasattr(ToolCategory, 'SEARCH'):
    ToolCategory.SEARCH = ToolCategory.OTHER
if not hasattr(ToolCategory, 'WEB_Browse'):
    ToolCategory.WEB_Browse = ToolCategory.OTHER


class ResearchAgent(ReactAgent):
    """
    Research agent (refactored):
    - inherits from the new ReactAgent
    - focuses on defining its own tools and prompt
    - custom state management and helper methods removed
    """
    def __init__(
        self,
        name: str = "research_expert",
        model: LanguageModelLike = None,
        tools: Optional[List[Union[BaseTool, Callable]]] = None,
        checkpointer: Optional[Checkpointer] = None,
        max_context_messages: Optional[int] = None,
        max_context_tokens: Optional[int] = 8000,
        debug: bool = False,
        **kwargs
    ):
        # 1. Agent description (unchanged)
        description = "Expert at finding, extracting, and synthesizing the latest information, data, and background knowledge on specific topics using search engines (like Tavily, Google Search) and web Browse tools (like Firecrawl, Arxiv). Capable of providing source links and content summaries."

        # 2. --- Fetch and merge tools from the registry ---
        agent_tools: List[Union[BaseTool, Callable]] = []
        search_tools_loaded: List[Union[BaseTool, Callable]] = []  # kept for the check below
        browse_tools_loaded: List[Union[BaseTool, Callable]] = []
        try:
            search_tools_loaded = get_tools_by_category(ToolCategory.SEARCH)
            agent_tools.extend(search_tools_loaded)
            try:
                browse_tools_loaded = get_tools_by_category(ToolCategory.WEB_Browse)
                agent_tools.extend(browse_tools_loaded)
            except Exception as e:
                if debug:
                    print(f"[{name}] Info: Failed to get WEB_Browse tools: {e}")
            print(f"[{name}] Loaded tools from registry: {[t.name for t in agent_tools if hasattr(t, 'name')]}")
            # --- Simplified core-tool check: just verify the SEARCH list is non-empty ---
            if not search_tools_loaded:
                print(f"CRITICAL Warning: ResearchAgent '{name}' initialized without any SEARCH tools from registry!")
        except Exception as e:
            print(f"Warning: Failed to get tools from registry for {name}: {e}")

        # Merge externally supplied `tools` (logic unchanged)
        if tools:
            existing_tool_names = {t.name for t in agent_tools if hasattr(t, 'name')}
            added_external_count = 0
            for tool in tools:
                tool_name = getattr(tool, 'name', None)
                if tool_name and tool_name not in existing_tool_names:
                    agent_tools.append(tool)
                    existing_tool_names.add(tool_name)
                    added_external_count += 1
                elif not tool_name:
                    agent_tools.append(tool)
                    added_external_count += 1
            if added_external_count > 0:
                print(f"[{name}] Merged {added_external_count} external tool(s).")

        # --- Simplified final tool check ---
        if not agent_tools:
            print(f"CRITICAL Warning: ResearchAgent '{name}' initialized with NO tools configured!")
        # (The previous complex any(...) check is no longer needed.)

        # 3. Agent system prompt (logic unchanged)
        base_prompt = f"""You are a professional Research Analyst expert...

Available Tools:
{self._format_tools_for_prompt(agent_tools)}

Instructions:
- Analyze the request in the message history.
- If the request requires searching for current information, facts, data, or background knowledge, you MUST use one of your search tools (like 'tavily_search_results').
- When using tools, formulate concise and effective search queries based on the request.
- Synthesize the information found from the tools into a clear and informative answer.
- If you use information from a tool, cite the source implicitly in your response (e.g., "According to [Source Title], ...").
- If the initial search is insufficient, analyze the results and decide if further searches with refined queries or different tools are needed.
- If you cannot find the information after thorough searching, or if the tools return errors, clearly state the limitations encountered. Do not invent information.
"""

        # 4. Call the parent __init__ (logic unchanged)
        super().__init__(
            name=name,
            model=model,
            tools=agent_tools,
            prompt=base_prompt,
            description=description,
            checkpointer=checkpointer,
            max_context_messages=max_context_messages,
            max_context_tokens=max_context_tokens,
            debug=debug,
            **kwargs
        )
        print(f"ResearchAgent '{self.name}' initialized with final tools: {[t.name for t in self.tools if hasattr(t, 'name')]}")
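# --- Hypothetical usage sketch (not part of the original file). Assumes the tool
# registry has been populated (importing core.tools triggers preregister_core_tools)
# and that `model` is any LangChain chat model; argument names are assumptions. ---
async def _example_research_agent_usage(model) -> None:
    """Sketch: registry tools are merged automatically; extra tools may be passed via `tools=`."""
    agent = ResearchAgent(model=model, debug=True)
    agent.compile()  # inherited from BaseAgent
    result = await agent.ainvoke(
        {"messages": [("user", "Find recent news about LangGraph releases.")]}
    )
    print(result["messages"][-1].content)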
================================================
FILE: core/llm/llm_manager.py
================================================
# reason_graph/llm_manager.py
import os
from enum import Enum, auto
from typing import Any, Dict, List, Optional, Type, Union, Callable, Tuple

from langchain_core.language_models import BaseChatModel, LanguageModelLike
from langchain_openai import ChatOpenAI
# (ChatGroq import removed)
from dotenv import load_dotenv

# Load environment variables
load_dotenv()


class ModelType(Enum):
    """Model provider types."""
    OPENAI = auto()
    XAI = auto()
    DEEPSEEK = auto()
    CUSTOM = auto()  # kept for other OpenAI-compatible APIs


class ModelCapability(Enum):
    """Model capabilities."""
    GENERAL = auto()
    PLANNING = auto()
    REASONING = auto()
    CREATIVE = auto()
    RESEARCH = auto()
    CODE = auto()
    LONG_CONTEXT = auto()


class LLMManager:
    """
    Model manager (merged version V2):
    - automatically registers models from the config at initialization,
    - supports capability-based model lookup,
    - instantiates models lazily,
    - loads API keys / base URLs from environment variables.
    """
    def __init__(self):
        """Initialize the manager, load configuration, and auto-register models."""
        self._models_config: Dict[str, Dict[str, Any]] = {}
        self._models_instance: Dict[str, BaseChatModel] = {}
        self._default_model_id: Optional[str] = None
        self._capability_models: Dict[ModelCapability, str] = {}

        # Load API keys and base URLs (unchanged)
        self._loaded_api_keys = {
            ModelType.OPENAI: os.getenv("OPENAI_API_KEY"),
            ModelType.XAI: os.getenv("XAI_API_KEY"),
            ModelType.DEEPSEEK: os.getenv("DEEPSEEK_API_KEY"),
            ModelType.CUSTOM: os.getenv("LLM_API_KEY"),
        }
        self._loaded_base_urls = {
            ModelType.OPENAI: os.getenv("OPENAI_BASE_URL"),
            ModelType.XAI: os.getenv("XAI_BASE_URL"),
            ModelType.DEEPSEEK: os.getenv("DEEPSEEK_BASE_URL", "https://api.deepseek.com/v1"),
            ModelType.CUSTOM: os.getenv("LLM_BASE_URL"),
        }
        print("LLMManager initialized.")
        print("Loaded API Keys for:", [k.name for k, v in self._loaded_api_keys.items() if v])
        print("Loaded Base URLs for:", {k.name: v for k, v in self._loaded_base_urls.items() if v})

        # --- Auto-register models ---
        try:
            from .model_config import SUPPORTED_MODELS_CONFIG  # import from the config file
            print("Registering models from config...")
            for model_id, config in SUPPORTED_MODELS_CONFIG.items():
                # Check that the required key/URL exists; otherwise skip registration with a warning
                model_type = config.get("model_type")
                api_key = config.get("config_override", {}).get("api_key") or self._loaded_api_keys.get(model_type)
                base_url = config.get("config_override", {}).get("base_url") or self._loaded_base_urls.get(model_type)
                # OpenAI may rely solely on the OPENAI_API_KEY environment variable
                if model_type == ModelType.OPENAI and not api_key:
                    api_key = os.getenv("OPENAI_API_KEY")  # re-check the OpenAI-specific key
                # Enforce key/URL requirements per type
                key_required = model_type not in [ModelType.CUSTOM]  # CUSTOM may be anonymous
                url_required = model_type in [ModelType.XAI, ModelType.CUSTOM]  # DeepSeek has a default URL
                if key_required and not api_key:
                    print(f" Skipping registration for '{model_id}': Required API key for type '{model_type.name}' not found.")
                    continue
                if url_required and not base_url:
                    print(f" Skipping registration for '{model_id}': Required Base URL for type '{model_type.name}' not found.")
                    continue
                # Call the internal registration method
                self._register_model(
                    model_id=model_id,
                    model_type=config["model_type"],
                    model_name=config["model_name"],
                    model_class=config.get("model_class"),  # may be None
                    capabilities=config.get("capabilities", [ModelCapability.GENERAL]),
                    set_as_default=config.get("is_default", False),
                    config_override=config.get("config_override"),
                    **config.get("kwargs", {})
                )
            print("Model registration complete.")
            # If no config entry was marked is_default=True, fall back to the first registered model
            if not self._default_model_id and self._models_config:
                fallback_default = list(self._models_config.keys())[0]
                print(f"Warning: No default model marked in config. Falling back to first registered: '{fallback_default}'")
                self._default_model_id = fallback_default
        except ImportError:
            print("Warning: Could not import model_config.py. No models registered automatically.")
        except Exception as e:
            print(f"Error during automatic model registration: {e}")

        print(f"Default model set to: {self._default_model_id}")
        print(f"Capability mapping: {self.list_capabilities()}")
        print("-" * 20)

    # register_model is now an internal method
    def _register_model(
        self,
        model_id: str,
        model_type: ModelType,
        model_name: str,
        model_class: Optional[Type[BaseChatModel]] = None,
        capabilities: List[ModelCapability] = [ModelCapability.GENERAL],
        set_as_default: bool = False,
        config_override: Optional[Dict[str, Any]] = None,
        **kwargs
    ) -> None:
        """(Internal) Registers a model configuration."""
        if model_id in self._models_config:
            # Decide on behavior: overwrite or ignore? Let's overwrite with warning.
            print(f" Overwriting registration for existing model_id: '{model_id}'")
            # pass  # if ignore is preferred
        if model_class is None:
            model_class = ChatOpenAI
        self._models_config[model_id] = {
            "type": model_type,
            "name": model_name,
            "class": model_class,
            "capabilities": list(set(capabilities)),
            "config_override": config_override or {},
            "kwargs": kwargs,
        }
        print(f" Registered model config: '{model_id}' (Type: {model_type.name}, Class: {model_class.__name__})")
        if set_as_default:
            self._default_model_id = model_id
            print(f" Set '{model_id}' as default.")
        for capability in capabilities:
            if capability not in self._capability_models:
                self._capability_models[capability] = model_id
                print(f" Mapped capability '{capability.name}' to '{model_id}'.")

    def set_default_model(self, model_id: str) -> None:
        """Set the default model."""
        if model_id not in self._models_config:
            raise ValueError(f"Model ID '{model_id}' not registered.")
        self._default_model_id = model_id

    def set_capability_model(self, capability: ModelCapability, model_id: str) -> None:
        """Set the preferred model for a specific capability."""
        if model_id not in self._models_config:
            raise ValueError(f"Model ID '{model_id}' not registered.")
        model_info = self._models_config[model_id]
        if capability not in model_info.get("capabilities", []):
            print(f"Warning: Model '{model_id}' not registered with capability '{capability.name}'.")
        self._capability_models[capability] = model_id
    # _get_instance (core instantiation logic)
    def _get_instance(self, model_id: str) -> BaseChatModel:
        """(Internal) Gets or creates a model instance."""
        if model_id in self._models_instance:
            return self._models_instance[model_id]
        if model_id not in self._models_config:
            raise ValueError(f"Model ID '{model_id}' not registered or registration skipped due to missing config.")

        config = self._models_config[model_id]
        model_type = config["type"]
        model_name = config["name"]
        model_class = config["class"]
        config_override = config["config_override"]
        kwargs = config["kwargs"]

        # Determine key/URL (config_override first, then env)
        api_key = config_override.get("api_key", self._loaded_api_keys.get(model_type))
        base_url = config_override.get("base_url", self._loaded_base_urls.get(model_type))
        # OpenAI-specific key handling
        if model_type == ModelType.OPENAI and not api_key:
            api_key = os.getenv("OPENAI_API_KEY")

        # Check required configuration
        key_required = model_type not in [ModelType.CUSTOM]
        url_required = model_type in [ModelType.XAI, ModelType.DEEPSEEK, ModelType.CUSTOM]
        if key_required and not api_key:
            raise ValueError(f"API key required but not found for '{model_id}' (Type: {model_type.name}). Set in .env or config_override.")
        if url_required and not base_url:
            raise ValueError(f"Base URL required but not found for '{model_id}' (Type: {model_type.name}). Set in .env or config_override.")

        print(f"Instantiating model: ID='{model_id}', Type='{model_type.name}', Name='{model_name}'")

        # Prepare constructor arguments
        init_kwargs = kwargs.copy()
        if model_class == ChatOpenAI:
            init_kwargs['model'] = model_name
            if api_key:
                init_kwargs['openai_api_key'] = api_key
            if base_url:
                init_kwargs['openai_api_base'] = base_url
        # elif model_class == ChatGroq: ...  # removed
        else:
            # Try generic parameters; many compatible classes accept `model` too
            init_kwargs['model'] = model_name
            init_kwargs['model_name'] = model_name
            if api_key:
                init_kwargs['api_key'] = api_key
            if base_url:
                init_kwargs['base_url'] = base_url

        # Strip internal configuration keys
        for k in ["config_override", "capabilities", "type", "class", "name", "instance"]:
            init_kwargs.pop(k, None)

        # Instantiate
        try:
            instance = model_class(**init_kwargs)
            self._models_instance[model_id] = instance
            return instance
        except Exception as e:
            print(f"!!! Failed to instantiate model '{model_id}'")
            raise e

    # get_model and get_model_for_capability (unchanged; both delegate to _get_instance)
    def get_model(self, model_id: Optional[str] = None) -> BaseChatModel:
        """Get a model instance (by ID, or the default)."""
        target_id = model_id
        if target_id is None:
            if self._default_model_id is None:
                raise ValueError("No default model set.")
            target_id = self._default_model_id
        if target_id not in self._models_config:
            raise ValueError(f"Model ID '{target_id}' not registered.")
        return self._get_instance(target_id)

    def get_model_for_capability(self, capability: ModelCapability) -> BaseChatModel:
        """Get a model instance that provides a specific capability."""
        if capability not in self._capability_models:
            print(f"No preferred model for '{capability.name}'. Falling back to default.")
            if self._default_model_id is None:
                raise ValueError(f"No model for '{capability.name}' and no default set.")
            model_id = self._default_model_id
        else:
            model_id = self._capability_models[capability]
            print(f"Using model '{model_id}' for capability '{capability.name}'.")
        return self.get_model(model_id)

    # list_models and list_capabilities (unchanged)
    def list_models(self) -> Dict[str, Dict[str, Any]]:
        """List all registered models and their configurations."""
        result = {}
        for model_id, model_info in self._models_config.items():
            result[model_id] = {
                "type": model_info["type"].name,
                "name": model_info["name"],
                "class": model_info["class"].__name__,
                "capabilities": [c.name for c in model_info.get("capabilities", [])],
                "is_default": model_id == self._default_model_id,
                "kwargs": model_info.get("kwargs"),
                "config_override": model_info.get("config_override"),
            }
        return result

    def list_capabilities(self) -> Dict[str, str]:
        return {capability.name: model_id for capability, model_id in self._capability_models.items()}
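# --- Hypothetical usage sketch (not part of the original file). Assumes the entries
# in model_config.py registered successfully, i.e. the relevant API keys are set. ---
if __name__ == "__main__":
    manager = LLMManager()
    default_model = manager.get_model()  # resolves to the default model id
    coder = manager.get_model_for_capability(ModelCapability.CODE)
    print("Registered:", list(manager.list_models().keys()))
    print("Capability map:", manager.list_capabilities())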
================================================
FILE: core/llm/model_config.py
================================================
# reason_graph/model_config.py
from langchain_openai import ChatOpenAI
# from langchain_groq import ChatGroq  # no longer needed
# (If non-OpenAI-compatible providers are supported in the future, import them here.)
from .llm_manager import ModelType, ModelCapability  # enums from the sibling llm_manager

# Supported models and their configurations.
# Each key is the internal model_id.
SUPPORTED_MODELS_CONFIG = {
    "openai_gpt4o": {
        "model_type": ModelType.OPENAI,
        "model_name": "gpt-4o",  # name used for the API call
        "model_class": ChatOpenAI,
        "capabilities": [
            ModelCapability.GENERAL, ModelCapability.PLANNING, ModelCapability.REASONING,
            ModelCapability.CREATIVE, ModelCapability.LONG_CONTEXT, ModelCapability.CODE,
            ModelCapability.RESEARCH  # GPT-4o can handle some research too
        ],
        "is_default": False,  # not the default
        "config_override": {},  # may override env vars, e.g. {'api_key': '...'}
        "kwargs": {"temperature": 0.1}  # extra constructor arguments
    },
    "openai_gpt4o_mini": {
        "model_type": ModelType.OPENAI,
        "model_name": "gpt-4o-mini",
        "model_class": ChatOpenAI,
        "capabilities": [ModelCapability.GENERAL, ModelCapability.REASONING, ModelCapability.CREATIVE],
        "is_default": True,  # <--- the default model
        "config_override": {},
        "kwargs": {"temperature": 0.0}
    },
    "xai_grok": {  # id chosen as xai_grok
        "model_type": ModelType.XAI,
        "model_name": "grok-2-latest",  # or whatever model name the xAI API actually accepts
        "model_class": ChatOpenAI,  # assumes an OpenAI-compatible connection
        "capabilities": [ModelCapability.GENERAL, ModelCapability.REASONING, ModelCapability.LONG_CONTEXT, ModelCapability.CREATIVE],
        "is_default": False,
        "config_override": {},  # key/URL loaded from env (XAI_API_KEY, XAI_BASE_URL)
        "kwargs": {"temperature": 0.2}
    },
    "deepseek_v3": {  # id chosen as deepseek_v3
        "model_type": ModelType.DEEPSEEK,
        "model_name": "deepseek/deepseek-v3-0324",  # DeepSeek chat model API name
        "model_class": ChatOpenAI,  # OpenAI-compatible connection
        "capabilities": [ModelCapability.GENERAL, ModelCapability.REASONING, ModelCapability.CODE, ModelCapability.LONG_CONTEXT],
        "is_default": False,
        "config_override": {},  # key/URL loaded from env (DEEPSEEK_API_KEY, DEEPSEEK_BASE_URL)
        "kwargs": {"temperature": 0.0}
    },
    # --- Additional model configurations can be added here ---
    # "groq_llama3_70b": {
    #     "model_type": ModelType.GROQ,
    #     "model_name": "llama3-70b-8192",
    #     "model_class": ChatGroq,  # requires importing ChatGroq
    #     "capabilities": [...],
    #     "is_default": False,
    #     "config_override": {},
    #     "kwargs": {"temperature": 0.1}
    # },
}
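# --- Hypothetical example entry (not part of the original config) that could be added
# inside SUPPORTED_MODELS_CONFIG: overriding the env-based credentials for one model
# via `config_override`. All names and URLs here are illustrative. ---
# "my_private_gateway": {
#     "model_type": ModelType.CUSTOM,
#     "model_name": "gpt-4o-mini",
#     "model_class": ChatOpenAI,
#     "capabilities": [ModelCapability.GENERAL],
#     "is_default": False,
#     "config_override": {"api_key": "sk-...", "base_url": "https://my-gateway.example.com/v1"},
#     "kwargs": {"temperature": 0.0},
# },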
================================================
FILE: core/mcp/README.md
================================================
# Mentis MCP Client & Configuration Guide

This directory (`core/mcp/`) contains a Python client implementation for interacting with MCP (Model Context Protocol) servers.

## Background

MCP aims to give AI models (such as LLM agents) a standard protocol for interacting with external tools and services. The goal of this client is to provide a flexible, configurable way to connect to MCP servers and integrate the tools they expose into LangChain agents.

## The Client (`MCPClient`)

The core implementation is the `MCPClient` class (in `client.py`), with the following characteristics:

* **Configuration-driven:** Connection/launch information for one or more servers is managed through a JSON file at `core/mcp/config.json`, compatible with the "Cursor-style" configuration format.
* **Flexible connections:**
    * **Launching local servers (stdio):** If the configuration provides `command` and `args`, the client executes that command to start the server process and communicates over **STDIO**. This is useful for standard MCP servers launched via `uvx` or `python -m`.
    * **Connecting to remote servers (sse):** If the configuration provides a `url`, the client connects over **SSE** to an already-running MCP server at that URL.
* **Async architecture:** Built on `asyncio`, suitable for asynchronous applications.
* **Robust resource management:** Connections and sessions are managed with `contextlib.AsyncExitStack` for more reliable shutdown.
* **LangChain integration support:** Provides the groundwork for loading MCP tools as LangChain `BaseTool` objects (with known adapter issues, see below).
## How to Use

### 1. Configure servers (`core/mcp/config.json`)

Create a `config.json` file in this directory defining the MCP servers you want to connect to. The file is a JSON object whose keys are logical server names and whose values are the configuration details for each server.

**Example `config.json` (external standard servers only):**

```json
{
  "fetch_via_uvx": {
    "id": "fetch-uvx-stdio",
    "type": "mcp-server",
    "description": "Fetch Server launched by uvx via stdio",
    "connection": {
      "transport": "stdio",
      "command": "uvx",
      "args": ["mcp-server-fetch"],
      "timeout": 45
    }
  },
  "everything": {
    "id": "everything-stdio",
    "type": "mcp-server",
    "description": "Everything Server launched by npx via stdio",
    "connection": {
      "transport": "stdio",
      "command": "npx",
      "args": ["-y", "@modelcontextprotocol/server-everything"],
      "env": {
        // If the Everything Server needs API keys, add them here,
        // or make sure the environment variables of the client script are inherited.
        // "OPENAI_API_KEY": "YOUR_KEY",
        // "TAVILY_API_KEY": "YOUR_KEY"
      },
      "timeout": 60
    }
  },
  "external_sse_example": {
    "id": "external-sse",
    "type": "mcp-server",
    "description": "Connect to a pre-running SSE server (Example)",
    "connection": {
      "transport": "sse",
      "url": "http://localhost:9001/sse" // assumes a server is running here
    }
  }
}
```

**Important:**

* When launching a server via `command`, make sure the command (`uvx`, `npx`, `python`, ...) is available in your environment.
* If a server needs API keys, provide them via the `env` field or system environment variables.
* `transport: "stdio"` tells the client to connect over stdio; `transport: "sse"` tells it to connect over SSE.

### 2. Client code example

Load the configuration with `config_loader.py` and use `MCPClient` in an `async with` block.

```python
import asyncio
import os
from core.mcp.client import MCPClient
from core.mcp.config_loader import load_config

# LangChain imports (if an agent is needed)
from langchain_openai import ChatOpenAI
from langgraph.prebuilt import create_react_agent
from langchain_core.tools import BaseTool, Tool

# Pydantic schema for the tool (used to create the Tool manually)
from pydantic.v1 import BaseModel, Field  # or v2

# --- Fetch schema example ---
class FetchInputSchema(BaseModel):
    url: str = Field(..., description="URL to fetch")
    # ... other fields ...

async def main():
    # --- Load the configuration ---
    config_path = os.path.join(os.path.dirname(__file__), "config.json")  # assumes config.json sits alongside
    try:
        all_configs = load_config(config_path)
        # Pick the configuration to use
        server_key = "fetch_via_uvx"  # or "everything", "e2b_stdio", etc.
        mcp_config = all_configs.get(server_key)
        if not mcp_config:
            print(f"Config '{server_key}' not found.")
            return
    except Exception as e:
        print(f"Failed to load config: {e}")
        return

    # --- Use MCPClient ---
    async with MCPClient(mcp_config) as client:
        print(f"Connected to MCP Server '{server_key}'. Session active: {client.session is not None}")
        if not client.session:
            return

        # --- Get and use tools ---
        # Option 1: the standard way (with known issues)
        # print("\nAttempting standard tool loading via load_mcp_tools...")
        # loaded_tools = client.get_tools()  # internally calls load_mcp_tools
        # print(f"load_mcp_tools returned {len(loaded_tools)} tools.")
        # # !! Note: for some server implementations (like the earlier MentisMCPServer),
        # # !! the args_schema of tools returned by load_mcp_tools may be wrong, which
        # # !! makes agent calls fail. For standard servers like the Fetch Server the
        # # !! loaded schema may be correct -- judge from the printed schema.

        # Option 2: [currently recommended] create the Tool object manually
        # (bypasses the load_mcp_tools issue)
        print("\nManually creating Tool object with correct schema...")
        tool_name = "fetch"  # assuming we test the Fetch Server
        tool_description = "Fetches URL content."  # can be fetched from the server or written by hand
        correct_schema = FetchInputSchema  # use the correct Pydantic model

        # Define the invocation logic
        async def call_mcp_tool_wrapper(**kwargs) -> str:
            # (internally uses client.session.call_tool to send a correct request)
            # see examples/14_mcp_fetch_test.py for the full implementation
            if not client or not client.session:
                return "ERROR: Session lost."
            try:
                req_params = {"name": tool_name, "arguments": kwargs}
                from mcp.types import CallToolRequest  # import needed
                request = CallToolRequest(method='tools/call', params=req_params)
                result = await client.session.call_tool(request)
                if hasattr(result, 'result'):
                    return str(result.result)
                elif hasattr(result, 'error'):
                    return f"Tool Error: {result.error.message}"
                else:
                    return "Unknown response"
            except Exception as e:
                return f"Error: {e}"

        # Create the LangChain Tool
        manual_tool = Tool.from_function(
            name=tool_name,
            description=tool_description,
            args_schema=correct_schema,
            coroutine=call_mcp_tool_wrapper
        )
        tools_for_agent = [manual_tool]
        print(f"Manual tool '{manual_tool.name}' created.")

        # --- Use an agent ---
        try:
            # model = llm_manager.get_model("openai_gpt4o_mini")  # get an LLM
            # agent = create_react_agent(model, tools_for_agent)
            # response = await agent.ainvoke(...)
            # print("Agent Response:", response)
            print("\nAgent execution part skipped in README example.")
            print("Refer to examples/14_mcp_fetch_test.py for full Agent integration.")
        except Exception as e:
            print(f"Agent execution error: {e}")

# if __name__ == "__main__":
#     asyncio.run(main())
```

## About the Self-Built MCP Server (MentisMCPServer)

Earlier in development we built a `MentisMCPServer` class in `core/mcp/server.py` to dynamically wrap the LangChain `BaseTool`s from our internal tool registry (`core/tools/registry.py`) as MCP tools.

**Main challenge encountered:**

When using the `FastMCP` library's `@mcp.tool` decorator to register these wrappers dynamically, the server failed to broadcast the tools' **input schemas** correctly. The client's `load_mcp_tools` therefore received wrong schema information, and LangChain agents failed with argument errors when calling the tools.

Refactoring the server's registration logic (registering top-level wrapper functions directly on the `FastMCP` instance in `run_server.py`) **did resolve** the schema-broadcasting problem, so `load_mcp_tools` obtained correct schemas; however, later tests showed the agent (`create_react_agent`) could still hit internal errors (`TypeError`) when calling these tools.

**Conclusion and recommendations:**

Because of the deep library-interaction and debugging obstacles encountered when combining LangChain tools, dynamic wrapping, `FastMCP`, and LangChain agents, we **currently do not recommend** exposing `MentisMCPServer` as a stable, reliable service.

**Recommended ways to provide or consume an MCP server:**

1. **Use community standard servers:** Use prebuilt, community- or officially-provided MCP servers such as `mcp-server-fetch` or `@modelcontextprotocol/server-everything`, configured via `command` (e.g. `uvx`, `npx`, `python -m`) or `url` in `config.json`.
2. **Adopt the simple server pattern:** If you need to implement your own MCP server to expose specific functionality, follow the simple examples in the `modelcontextprotocol/servers` repository (such as `math_server` or `time_server`) and **register tool functions directly** (decorate top-level `async def` functions with `@mcp_instance.tool`), avoiding complex dynamic wrapping layers; see the sketch below.
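A minimal sketch of that direct-registration pattern, mirroring `core/mcp/test/minimal_fastmcp_test.py` in this repository (the `add` tool and server name here are illustrative):

```python
from mcp.server.fastmcp import FastMCP

mcp_instance = FastMCP(name="SimpleMathServer")

@mcp_instance.tool(name="add", description="Add two integers and return the sum.")
async def add(a: int, b: int) -> int:
    """Top-level async tool function registered directly -- no dynamic wrapper layer."""
    return a + b

if __name__ == "__main__":
    # stdio works well for servers launched as a subprocess (see config.json above)
    mcp_instance.run(transport="stdio")
```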
================================================
FILE: core/mcp/__init__.py
================================================
# core/mcp/__init__.py
"""
MCP (Model Context Protocol) functionality module.
"""


================================================
FILE: core/mcp/client.py
================================================
import os
import asyncio
from pathlib import Path
from typing import List, Dict, Any, Optional, Union, Type, Literal, TypedDict, cast
from types import TracebackType
import re
import sys
import json
import traceback
from contextlib import asynccontextmanager, AsyncExitStack

# --- MCP Imports ---
from mcp import ClientSession, StdioServerParameters
from mcp.client.stdio import stdio_client
from mcp.client.sse import sse_client

# --- Adapter Import ---
try:
    from langchain_mcp_adapters.tools import load_mcp_tools
    LOAD_MCP_TOOLS_AVAILABLE = True
except ImportError:
    print("Warning: langchain-mcp-adapters not found. load_mcp_tools will be unavailable.")
    async def load_mcp_tools(session: ClientSession) -> list:
        return []
    LOAD_MCP_TOOLS_AVAILABLE = False

# --- LangChain / Pydantic Imports ---
from langchain_core.tools import BaseTool
try:
    from pydantic.v1 import BaseModel as BaseModelV1
except ImportError:
    from pydantic import BaseModel as BaseModelV1  # fallback

# --- Config Loader Import ---
try:
    from .config_loader import MCPConfig, StdioConfig, SSEConfig
except ImportError:
    print("WARNING: Could not import config models from .config_loader.")
    MCPConfig = Any; StdioConfig = Any; SSEConfig = Any  # placeholders

print("--- DEBUG: Loading FINAL client.py (Config-Driven + AsyncExitStack) ---")


class MCPClient:
    """Config-driven MCP client using AsyncExitStack."""

    def __init__(self, config: MCPConfig):
        self.config = config
        self.session: Optional[ClientSession] = None
        self.tools: List[BaseTool] = []
        self._stack: AsyncExitStack = AsyncExitStack()
        self._server_process: Optional[asyncio.subprocess.Process] = None

    async def __aenter__(self) -> "MCPClient":
        print(f"DEBUG: MCPClient entering context for config ID: {getattr(self.config, 'id', 'N/A')}")
        try:
            connection_config = self.config.connection
            transport_ctx = None
            reader = None
            writer = None

            if isinstance(connection_config, SSEConfig) and connection_config.url:
                # --- Direct SSE ---
                print(f"DEBUG: Connecting via SSE to {connection_config.url}")
                transport_ctx = sse_client(
                    connection_config.url,
                    getattr(connection_config, 'headers', None),
                    getattr(connection_config, 'timeout', 5.0),
                    getattr(connection_config, 'sse_read_timeout', 300.0)
                )
                reader, writer = await self._stack.enter_async_context(transport_ctx)
                print("DEBUG: SSE transport context entered.")
            elif isinstance(connection_config, StdioConfig) and connection_config.command:
                # --- Launch via Command + STDIO ---
                print(f"DEBUG: Launching command via STDIO: {connection_config.command} {' '.join(connection_config.args)}")
                merged_env = os.environ.copy()
                if connection_config.env:
                    merged_env.update(connection_config.env)
                server_params = StdioServerParameters(
                    command=connection_config.command,
                    args=connection_config.args,
                    env=merged_env,
                    cwd=connection_config.cwd,
                    encoding=connection_config.encoding,
                    encoding_error_handler=connection_config.encoding_error_handler,
                    startup_timeout=connection_config.timeout
                )
                transport_ctx = stdio_client(server_params)
                reader, writer = await self._stack.enter_async_context(transport_ctx)
                print("DEBUG: STDIO transport context entered.")
            else:
                # Fallback/error: the config may be wrong or the transport missing.
                # Check for a command before assuming an SSE launch.
                if hasattr(connection_config, 'command') and connection_config.command:
                    # This is the complex "launch then connect SSE" case from the guide.
                    # Keeping it simple for now: if transport isn't 'stdio', it must be 'sse' with a URL.
                    raise NotImplementedError("Launching command for SSE connection (URL capture) not implemented in this client version. Use direct SSE URL or STDIO command.")
                else:
                    raise ValueError("Invalid configuration: must have 'url' for SSE or 'command' for STDIO.")

            # --- Establish ClientSession ---
            session_kwargs = getattr(connection_config, 'session_kwargs', None) or {}
            session_ctx = ClientSession(reader, writer, **session_kwargs)
            self.session = await self._stack.enter_async_context(session_ctx)
            print("DEBUG: ClientSession context entered.")

            # --- Initialize and Load Tools (with schema check) ---
            print("Initializing MCP session...")
            await asyncio.wait_for(self.session.initialize(), timeout=30.0)
            print("MCP session initialized.")

            if LOAD_MCP_TOOLS_AVAILABLE:
                print("Loading MCP tools (via langchain-mcp-adapters)...")
                loaded_tools_from_mcp = await load_mcp_tools(self.session)
                print(f"Successfully loaded {len(loaded_tools_from_mcp)} tool descriptions.")
                print("--- Loaded Tools & Args Schema (Diagnostic) ---")
                self.tools = []
                all_schemas_ok = True  # aggregate result of the per-tool checks below
                for i, tool in enumerate(loaded_tools_from_mcp):
                    schema = getattr(tool, 'args_schema', 'N/A')
                    tool_name = getattr(tool, 'name', f'Tool_{i+1}')
                    print(f"{i+1}. Tool Name: {tool_name}")
                    schema_detail = "N/A"
                    is_correct = None  # undetermined
                    if schema != 'N/A':
                        # Schema printing and basic check
                        schema_dict = None
                        if isinstance(schema, type) and issubclass(schema, BaseModelV1):
                            try:
                                schema_dict = schema.schema()
                                schema_detail = f"(PydanticV1): {json.dumps(schema_dict, indent=2)}"
                            except Exception as e_schema:
                                schema_detail = f"(PydanticV1): Error - {e_schema}"
                        elif hasattr(schema, 'model_json_schema'):
                            try:
                                schema_dict = schema.model_json_schema()
                                schema_detail = f"(PydanticV2): {json.dumps(schema_dict, indent=2)}"
                            except Exception as e_schema:
                                schema_detail = f"(PydanticV2): Error - {e_schema}"
                        else:
                            schema_detail = f"(Unknown Type): {schema}"
                        # Basic check: does it look like the faulty kwargs-only schema?
                        if isinstance(schema_dict, dict):
                            props = schema_dict.get('properties', {})
                            if list(props.keys()) == ['kwargs'] and props['kwargs'].get('type') == 'string':
                                is_correct = False
                                schema_detail += " <-- LOOKS WRONG (kwargs only!)"
                            elif props:
                                is_correct = True  # has properties other than just kwargs
                                schema_detail += " <-- Looks structured correctly"
                            else:
                                is_correct = True  # no properties; might be a simple input
                                schema_detail += " <-- No properties defined"
                    else:
                        is_correct = False  # no schema is usually wrong
                    if is_correct is False:
                        all_schemas_ok = False
                    print(f" Args Schema: {schema_detail}")
                    print("-" * 15)
                    self.tools.append(tool)
                print("Schema Check Result: " + (
                    "All schemas look structured correctly."
                    if all_schemas_ok
                    else "One or more schemas look incorrect (kwargs only or missing)!"
                ))
                print("-------------------------------------------")
            else:
                print("Warning: load_mcp_tools unavailable.")
                self.tools = []

            print(f"MCPClient ready. Loaded {len(self.tools)} tools via adapter.")
            return self
        except Exception as enter_err:
            print(f"ERROR: Failed during MCPClient __aenter__: {type(enter_err).__name__}: {enter_err}")
            await self.close()
            raise
    async def __aexit__(self, exc_type: Optional[Type[BaseException]], exc_val: Optional[BaseException], exc_tb: Optional[TracebackType]):
        print("DEBUG: MCPClient exiting context...")
        await self.close()
        print("DEBUG: MCPClient context exited.")

    async def close(self):
        """Closes connections and resets state using AsyncExitStack."""
        print("Closing MCP Client...")
        if hasattr(self, '_stack') and self._stack:
            print(" Closing managed async contexts (via AsyncExitStack)...")
            try:
                await self._stack.aclose()
                print(" AsyncExitStack closed.")
            except Exception as e:
                print(f"WARNING: Error closing AsyncExitStack: {type(e).__name__}: {e}")
            finally:
                self._stack = None
        else:
            print(" No active AsyncExitStack.")
        self.session = None
        self.tools = []
        self._transport_ctx = None
        self._server_process = None
        print("MCP Client state reset.")

    def get_tools(self) -> List[BaseTool]:
        """Returns the list of tools loaded by load_mcp_tools."""
        return self.tools


================================================
FILE: core/mcp/config_loader.py
================================================
# core/mcp/config_loader.py (load_config return type updated)
import json
import os
from pathlib import Path
from typing import Dict, Any, Optional, List, Literal, Union, Type

try:
    from pydantic.v1 import BaseModel, Field, ValidationError, validator
    PYDANTIC_V = 1
except ImportError:
    try:
        from pydantic import BaseModel, Field, ValidationError, validator  # type: ignore
        PYDANTIC_V = 2
    except ImportError:
        raise ImportError("Pydantic (v1 or v2) required.")
from typing_extensions import TypedDict

EncodingErrorHandler = Literal["strict", "ignore", "replace"]


class StdioConfig(BaseModel):
    transport: Literal["stdio"] = "stdio"
    command: str = Field(...)
    args: List[str] = Field(default_factory=list)
    env: Optional[Dict[str, str]] = None
    cwd: Optional[Union[str, Path]] = None
    encoding: str = Field(default="utf-8")
    encoding_error_handler: EncodingErrorHandler = Field(default="strict")
    timeout: int = Field(default=30, gt=0)
    session_kwargs: Optional[Dict[str, Any]] = None

    if PYDANTIC_V == 1:
        class Config:
            extra = 'forbid'
    else:
        model_config = {'extra': 'forbid'}


class SSEConfig(BaseModel):
    transport: Literal["sse"] = "sse"
    url: str = Field(...)
    headers: Optional[Dict[str, Any]] = None
    timeout: float = Field(default=5.0, gt=0)
    sse_read_timeout: float = Field(default=300.0, gt=0)
    session_kwargs: Optional[Dict[str, Any]] = None

    if PYDANTIC_V == 1:
        class Config:
            extra = 'forbid'
    else:
        model_config = {'extra': 'forbid'}


class MCPConfig(BaseModel):
    """Represents the structure for a single server configuration."""
    id: Optional[str] = Field(default=None)
    type: Literal["mcp-server"] = Field(default="mcp-server")
    description: Optional[str] = Field(default=None)
    connection: Union[StdioConfig, SSEConfig] = Field(..., discriminator='transport')

    if PYDANTIC_V == 1:
        class Config:
            extra = 'forbid'
    else:
        model_config = {'extra': 'forbid'}


# --- load_config (updated) ---
def load_config(config_path: Union[str, Path]) -> Dict[str, MCPConfig]:
    """
    Loads the central MCP configuration JSON file and validates each server entry.

    Args:
        config_path: Path to the central config.json file.

    Returns:
        A dictionary where keys are server names and values are validated MCPConfig objects.
    """
    config_p = Path(config_path).resolve()
    if not config_p.is_file():
        raise FileNotFoundError(f"Configuration file not found at: {config_p}")
    print(f"DEBUG: Loading central MCP configuration from: {config_p}")
    validated_configs: Dict[str, MCPConfig] = {}
    try:
        with open(config_p, 'r', encoding='utf-8') as f:
            raw_config_dict = json.load(f)
        if not isinstance(raw_config_dict, dict):
            raise TypeError("Root configuration must be a JSON object (dictionary).")
        # Validate every server configuration in the dictionary
        for server_name, config_data in raw_config_dict.items():
            print(f"DEBUG: Validating config for server: '{server_name}'")
            if not isinstance(config_data, dict):
                print(f"WARNING: Entry for '{server_name}' is not a dictionary. Skipping.")
                continue
            try:
                # Make sure connection and transport are present
                if 'connection' not in config_data:
                    raise ValueError("Missing 'connection'")
                if 'transport' not in config_data.get('connection', {}):
                    raise ValueError("Missing 'transport' in connection")
                if PYDANTIC_V == 2:
                    validated_config = MCPConfig.model_validate(config_data)
                else:  # Pydantic V1
                    validated_config = MCPConfig.parse_obj(config_data)
                validated_configs[server_name] = validated_config
                print(f"DEBUG: Config for '{server_name}' validated successfully.")
            except (ValidationError, ValueError) as e_val:
                print(f"ERROR: Validation failed for server '{server_name}' config:\n{e_val}\nSkipping this server.")
                # We could keep loading the remaining configs, or raise here to fail the whole load.
        if not validated_configs:
            print("WARNING: No valid server configurations were loaded.")
        print(f"DEBUG: Central configuration loaded. Found {len(validated_configs)} valid server configs.")
        return validated_configs
    except json.JSONDecodeError as e:
        print(f"ERROR: Failed to decode JSON from {config_p}: {e}")
        raise
    except Exception as e:
        print(f"ERROR: An unexpected error occurred loading config {config_p}: {e}")
        raise
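# --- Hypothetical usage sketch (not part of the original file); assumes the
# mcp_server_config.json shipped in this directory. ---
if __name__ == "__main__":
    configs = load_config(Path(__file__).parent / "mcp_server_config.json")
    for server_name, cfg in configs.items():
        print(f"{server_name}: transport={cfg.connection.transport}")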
""" config_p = Path(config_path).resolve() if not config_p.is_file(): raise FileNotFoundError(f"Configuration file not found at: {config_p}") print(f"DEBUG: Loading central MCP configuration from: {config_p}") validated_configs: Dict[str, MCPConfig] = {} try: with open(config_p, 'r', encoding='utf-8') as f: raw_config_dict = json.load(f) if not isinstance(raw_config_dict, dict): raise TypeError("Root configuration must be a JSON object (dictionary).") # 遍历字典中的每个服务器配置并验证 for server_name, config_data in raw_config_dict.items(): print(f"DEBUG: Validating config for server: '{server_name}'") if not isinstance(config_data, dict): print(f"WARNING: Entry for '{server_name}' is not a dictionary. Skipping.") continue try: # 确保 connection 和 transport 存在 if 'connection' not in config_data: raise ValueError("Missing 'connection'") if 'transport' not in config_data.get('connection', {}): raise ValueError("Missing 'transport' in connection") if PYDANTIC_V == 2: validated_config = MCPConfig.model_validate(config_data) else: # Pydantic V1 validated_config = MCPConfig.parse_obj(config_data) validated_configs[server_name] = validated_config print(f"DEBUG: Config for '{server_name}' validated successfully.") except (ValidationError, ValueError) as e_val: print(f"ERROR: Validation failed for server '{server_name}' config:\n{e_val}\nSkipping this server.") #可以选择继续加载其他配置,或者在这里 raise 让整个加载失败 if not validated_configs: print("WARNING: No valid server configurations were loaded.") print(f"DEBUG: Central configuration loaded. Found {len(validated_configs)} valid server configs.") return validated_configs except json.JSONDecodeError as e: print(f"ERROR: Failed to decode JSON from {config_p}: {e}"); raise except Exception as e: print(f"ERROR: An unexpected error occurred loading config {config_p}: {e}"); raise ================================================ FILE: core/mcp/mcp_server_config.json ================================================ { "fetch_via_uvx": { "id": "fetch-uvx-stdio", "type": "mcp-server", "description": "Fetch Server launched by uvx via stdio", "connection": { "transport": "stdio", "command": "uvx", "args": [ "mcp-server-fetch" ], "env": null, "cwd": null, "encoding": "utf-8", "encoding_error_handler": "strict", "timeout": 45 } }, "everything": { "id": "everything-stdio", "type": "mcp-server", "description": "Everything Server", "connection": { "transport": "stdio", "command": "npx", "args": [ "-y", "@modelcontextprotocol/server-everything" ], "env": null, "cwd": null, "encoding": "utf-8", "encoding_error_handler": "strict", "timeout": 45 } } } ================================================ FILE: core/mcp/run_server.py ================================================ # core/mcp/run_server.py (FINAL - Direct FastMCP Registration) import os import sys import argparse import traceback import logging from typing import List, Dict, Any, Optional, Type # --- Standard Setup --- logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s') logger = logging.getLogger("mcp_server_direct") current_dir = os.path.dirname(os.path.abspath(__file__)); project_root = os.path.dirname(os.path.dirname(os.path.dirname(current_dir))); sys.path.insert(0, project_root) # --- Imports --- from mcp.server.fastmcp import FastMCP # Import FastMCP directly # Assume registry is populated correctly by preregister_core_tools from core.tools.registry import get_registered_tools, get_tool_instance try: from core.tools import preregister_core_tools; PREREGISTER_AVAILABLE = True except 
# --- Tool Wrapper Creation Logic (as a standalone function) ---
def create_tool_wrapper(tool_instance: BaseTool):
    """
    Creates the async wrapper function for a given tool instance.
    This function will be decorated LATER by the mcp_instance.
    """
    tool_name = getattr(tool_instance, 'name', 'unknown_tool')
    print(f" DEBUG: Defining wrapper function for tool: '{tool_name}'")

    # Define the actual wrapper coroutine
    async def dynamic_tool_wrapper(tool_to_run=tool_instance, **kwargs):  # bind instance
        _tool_name = tool_to_run.name
        log_file = "/tmp/mcp_wrapper.log"
        timestamp = time.strftime("%Y-%m-%d %H:%M:%S")
        log_prefix = f"--- {timestamp} WRAPPER for '{_tool_name}' ---"
        log_lines = [f"{log_prefix} START", f"Received kwargs: {kwargs}"]
        try:  # main execution block
            result = None
            if hasattr(tool_to_run, '_arun'):
                log_lines.append("Calling await tool_to_run._arun(**kwargs)")
                result = await tool_to_run._arun(**kwargs)
                log_lines.append("Await _arun completed.")
            elif hasattr(tool_to_run, '_run'):
                log_lines.append("Calling tool_to_run._run(**kwargs) via run_in_executor")
                loop = asyncio.get_running_loop()
                sync_func_with_args = functools.partial(tool_to_run._run, **kwargs)
                result = await loop.run_in_executor(None, sync_func_with_args)
                log_lines.append("Executor _run completed.")
            else:
                log_lines.append("ERROR: Tool no _arun/_run!")
                raise NotImplementedError(f"Tool {_tool_name} no method.")
            log_lines.append(f"Raw result type: {type(result)}")
            log_lines.append(f"Raw value snippet: {str(result)[:500]}...")
            final_result = result
            try:
                json.dumps(result)
                log_lines.append("Result JSON serializable.")
            except TypeError:
                log_lines.append(f"WARN: Non-JSON type {type(result)}.->str.")
                final_result = str(result)
            log_lines.append(f"Returning final (type {type(final_result)}).")
            log_lines.append(f"{log_prefix} END (Success)")
            return {"result": final_result}
        except Exception as e:  # catch execution errors
            log_lines.append(f"!!! EXCEPTION in tool exec for '{_tool_name}': {e} !!!")
            tb_lines = traceback.format_exc().splitlines()
            log_lines.append("--- Traceback ---")
            log_lines.extend(tb_lines)
            log_lines.append("-----------------")
            log_lines.append(f"{log_prefix} END (Exception)")
            return f"ERROR_EXECUTING_TOOL_{_tool_name}: {str(e)}"  # return error string
        finally:  # ensure logging
            try:
                for line in log_lines:
                    print(line, flush=True, file=sys.stderr)
                with open(log_file, "a") as f:
                    f.write("\n".join(log_lines) + "\n\n")
            except Exception as log_e:
                print(f"!!! Logging Error for tool {_tool_name}: {log_e} !!!", flush=True, file=sys.stderr)

    # Return the created wrapper function AND the original tool's metadata
    return dynamic_tool_wrapper, tool_name, getattr(tool_instance, 'description', f"Tool {tool_name}")
# --- Main Execution Logic ---
def main():
    parser = argparse.ArgumentParser(description='Start Mentis MCP Server (Direct Registration)')
    parser.add_argument('--transport', type=str, choices=['stdio', 'sse'], default='stdio')
    parser.add_argument('--host', type=str, default='0.0.0.0')
    parser.add_argument('--port', type=int, default=8000)
    parser.add_argument('--name', type=str, default='MentisMCP')
    parser.add_argument('--tools', nargs='+')
    parser.add_argument('--debug', action='store_true')
    args = parser.parse_args()
    if args.debug:
        logger.setLevel(logging.DEBUG)
        print("DEBUG Logging Enabled")

    try:
        # --- 1. Preregister tools into the central registry ---
        if PREREGISTER_AVAILABLE:
            print("DEBUG: Calling preregister_core_tools...")
            preregister_core_tools()  # this populates the registry
            print("DEBUG: preregister_core_tools finished.")
        else:
            print("DEBUG: Skipping preregister_core_tools (unavailable).")

        # --- 2. Create FastMCP instance ---
        print(f"DEBUG: Creating FastMCP instance: name='{args.name}'")
        fastmcp_kwargs = {}
        if args.transport == 'sse':
            if args.host:
                fastmcp_kwargs['host'] = args.host
            if args.port:
                fastmcp_kwargs['port'] = args.port
        mcp_instance = FastMCP(args.name, **fastmcp_kwargs)  # create instance directly
        print("DEBUG: FastMCP instance created.")

        # --- 3. Load tools from registry and register wrappers with FastMCP ---
        registered_count = 0
        target_tools = args.tools  # list of names, or None for all
        # Get all tools first if needed
        all_tools_dict = get_registered_tools(as_dict=True)
        tools_to_register = {}
        if target_tools:  # filter if specific tools were requested
            print(f"DEBUG: Filtering for specific tools: {target_tools}")
            for name in target_tools:
                if name in all_tools_dict:
                    tools_to_register[name] = all_tools_dict[name]
                else:
                    print(f"ERROR: Requested tool '{name}' not found in registry.")
        else:  # register all tools found in the registry
            print("DEBUG: Registering all tools found in registry...")
            tools_to_register = all_tools_dict

        # Iterate and register the selected tools
        print(f"DEBUG: Attempting to register {len(tools_to_register)} tools with FastMCP...")
        for tool_name, tool_info in tools_to_register.items():
            tool_instance = tool_info.get("tool")
            if isinstance(tool_instance, BaseTool):
                try:
                    # Create the wrapper function and get metadata
                    wrapper_func, name, description = create_tool_wrapper(tool_instance)
                    # Register the wrapper directly using the mcp_instance decorator method
                    mcp_instance.tool(name=name, description=description)(wrapper_func)
                    print(f"DEBUG: Successfully registered '{name}' with FastMCP.")
                    registered_count += 1
                except Exception as e_register:
                    print(f"ERROR: Failed to register wrapper for tool '{tool_name}': {e_register}")
                    traceback.print_exc()
            else:
                print(f"WARNING: Item '{tool_name}' not a BaseTool, skipping.")
        print(f"DEBUG: Tool registration complete. {registered_count} tools registered with FastMCP.")
        if registered_count == 0:
            print("WARNING: No tools were registered!")
        # --- 4. Run the FastMCP server ---
        print(f"Starting MCP Server '{args.name}' (Transport: {args.transport})...")
        mcp_instance.run(transport=args.transport)
    except KeyboardInterrupt:
        print("Server shutting down...")
        sys.exit(0)
    except Exception as e:
        print(f"Error starting server: {e}")
        traceback.print_exc()
        sys.exit(1)

if __name__ == "__main__":
    main()


================================================
FILE: core/mcp/server.py
================================================
import os
import sys
import traceback
import asyncio
import time
import json
import functools
from typing import Dict, Any, Optional, List

# mcp & fastmcp
from mcp.server.fastmcp import FastMCP
from mcp.types import CallToolResult, TextContent, ErrorData  # <-- key imports

# Fix the path so our own tools and BaseTool can be imported
sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(__file__))))
from core.tools.registry import get_registered_tools, get_tool_instance
from langchain_core.tools import BaseTool

print("--- DEBUG: Loading REFACTORED server.py (Fix InvalidSignature) ---")


class MentisMCPServer:
    def __init__(self, name: str = "MentisMCP", host: Optional[str] = None, port: Optional[int] = None):
        print(f"DEBUG: Initializing MentisMCPServer(name='{name}', host={host}, port={port})")
        fastmcp_kwargs = {}
        if host is not None:
            fastmcp_kwargs['host'] = host
        if port is not None:
            fastmcp_kwargs['port'] = port
        try:
            print(f"DEBUG: Calling FastMCP(name='{name}', **{fastmcp_kwargs})")
            self.mcp = FastMCP(name, **fastmcp_kwargs)
            print("DEBUG: FastMCP initialized successfully.")
        except Exception as e_fastmcp:
            print("ERROR: Failed to initialize FastMCP!")
            print(traceback.format_exc())
            raise
        # Track the successfully registered tool wrappers
        self.registered_tools_wrappers = {}

    def register_all_tools(self):
        """Register every BaseTool found in the registry."""
        tools_dict = get_registered_tools(as_dict=True)
        print(f"DEBUG: Registering all tools ({len(tools_dict)} found)...")
        registered_count = 0
        for tool_name, tool_info in tools_dict.items():
            tool_instance = tool_info.get("tool")
            if isinstance(tool_instance, BaseTool):
                if self._register_tool_with_simplified_wrapper(tool_instance):
                    registered_count += 1
            else:
                print(f"WARNING: Item '{tool_name}' not BaseTool, skipping.")
        print(f"DEBUG: Finished registering all tools. Registered: {registered_count}")

    def register_single_tool(self, tool_name: str):
        """Register a single tool by name."""
        print(f"DEBUG: Attempting to register single tool: {tool_name}")
        try:
            tool_instance = get_tool_instance(tool_name)
            if not tool_instance:
                print(f"ERROR: Tool '{tool_name}' not found in registry.")
                return
            if isinstance(tool_instance, BaseTool):
                if self._register_tool_with_simplified_wrapper(tool_instance):
                    print(f"DEBUG: Successfully registered single tool: {tool_instance.name}")
                else:
                    print(f"ERROR: Failed wrapper registration for: {tool_instance.name}")
            else:
                print(f"WARNING: Tool '{tool_name}' not BaseTool, skipping.")
        except Exception as e:
            print(f"ERROR during register_single_tool for '{tool_name}': {e}")
            print(traceback.format_exc())

    def _register_tool_with_simplified_wrapper(self, tool: BaseTool) -> bool:
        """
        Create and register a simplified wrapper for a tool (fix InvalidSignature),
        making sure the returned data conforms to CallToolResult so the client can parse it.
        """
        try:
            tool_name = getattr(tool, 'name', None)
            tool_description = getattr(tool, 'description', None)
            if not tool_name or not isinstance(tool_name, str):
                print(f"ERROR: Invalid tool name: {tool_name}. Skip.")
                return False
Skip.") return False if not tool_description or not isinstance(tool_description, str): print(f"WARNING: Empty/invalid description for '{tool_name}'.") tool_description = f"Tool {tool_name}" print(f"DEBUG: Defining wrapper for tool: '{tool_name}'") @self.mcp.tool(name=tool_name, description=tool_description) async def simplified_tool_wrapper(tool_for_wrapper=tool, **kwargs): """ 同步或异步地调用 tool_for_wrapper,并将结果包装到 CallToolResult 中返回给客户端,以匹配 .content 或 .error. """ _tool_name = tool_for_wrapper.name log_file = "/tmp/mcp_wrapper.log" timestamp = time.strftime("%Y-%m-%d %H:%M:%S") log_prefix = f"--- {timestamp} WRAPPER for '{_tool_name}' ---" log_lines = [f"{log_prefix} START", f"Received kwargs: {kwargs}"] try: # 根据工具方法签名决定调用 _arun (异步) 或 _run (同步) result = None if hasattr(tool_for_wrapper, '_arun'): log_lines.append("Calling await tool_for_wrapper._arun(**kwargs)") result = await tool_for_wrapper._arun(**kwargs) log_lines.append("Await _arun completed.") elif hasattr(tool_for_wrapper, '_run'): log_lines.append("Calling tool_for_wrapper._run(**kwargs) via run_in_executor") loop = asyncio.get_running_loop() sync_func_with_args = functools.partial(tool_for_wrapper._run, **kwargs) result = await loop.run_in_executor(None, sync_func_with_args) log_lines.append("Executor _run completed.") else: log_lines.append(f"ERROR: Tool '{_tool_name}' has no _arun/_run!") raise NotImplementedError(f"Tool '{_tool_name}' cannot be invoked directly.") # 记录结果类型和内容片段 log_lines.append(f"Raw result type: {type(result)}") log_lines.append(f"Raw value snippet: {str(result)[:500]}...") # 关键:将结果包装成 CallToolResult,让客户端能识别 .content call_result = CallToolResult( content=[TextContent(text=str(result))] ) log_lines.append("Returning standard CallToolResult with .content.") log_lines.append(f"{log_prefix} END (Success)") return call_result except Exception as e: # 出现异常则使用 .error 返回 log_lines.append(f"!!! EXCEPTION in tool exec for '{_tool_name}': {e} !!!") tb_lines = traceback.format_exc().splitlines() log_lines.append("--- Traceback ---") log_lines.extend(tb_lines) log_lines.append("-----------------") log_lines.append(f"{log_prefix} END (Exception)") err_msg = f"ERROR_EXECUTING_TOOL_{_tool_name}: {str(e)}" return CallToolResult(error=ErrorData(message=err_msg)) finally: # 日志记录 try: for line in log_lines: print(line, flush=True, file=sys.stderr) with open(log_file, "a") as f: f.write("\n".join(log_lines) + "\n\n") except Exception as log_e: print(f"!!! 
            # Rename the wrapper to avoid duplicate function names
            simplified_tool_wrapper.__name__ = f"{tool_name}_simplified_wrapper"
            self.registered_tools_wrappers[tool_name] = simplified_tool_wrapper
            print(f"DEBUG: Registered simplified wrapper for tool: '{tool_name}'")
            return True
        except Exception as registration_error:
            failed_tool_name = getattr(tool, 'name', 'unknown')
            print(f"ERROR: Failed to create/register wrapper for tool '{failed_tool_name}': {registration_error}")
            print(traceback.format_exc())
            return False

    def run(self, transport: str = "stdio"):
        """Run the MCP server (host/port removed from this signature)."""
        print(f"DEBUG: MentisMCPServer.run(transport='{transport}') called.")
        print(f"Starting MCP server, transport: {transport}")
        if transport == "sse":
            # SSE mode
            host = 'N/A'
            port = 'N/A'
            if hasattr(self.mcp, 'settings'):
                host = getattr(self.mcp.settings, 'host', 'N/A')
                port = getattr(self.mcp.settings, 'port', 'N/A')
            print(f"Configured SSE server listening on: http://{host}:{port} ('N/A' means not configured or lookup failed)")
            try:
                import importlib
                try:
                    fastmcp_module = importlib.import_module('mcp.server.fastmcp')
                    print(f"FastMCP version: {getattr(fastmcp_module, '__version__', 'unknown')}")
                except:
                    pass
                import uvicorn
                import fastapi
                print(f"FastAPI: {fastapi.__version__}, Uvicorn: {uvicorn.__version__}")
                print(f"DEBUG: Calling self.mcp.run(transport='{transport}') for SSE")
                self.mcp.run(transport=transport)
            except Exception as e:
                print(f"SSE server failed to start: {e}")
                print(traceback.format_exc())
                raise
        else:
            # Default stdio mode
            print("Starting stdio-mode server...")
            try:
                print(f"DEBUG: Calling self.mcp.run(transport='{transport}') for STDIO")
                self.mcp.run(transport=transport)
            except Exception as e:
                print(f"stdio server failed to start: {e}")
                print(traceback.format_exc())
                raise


================================================
FILE: core/mcp/test/README.md
================================================
# MCP Test Framework Notes

## Overview

MCP (Model Context Protocol) is a protocol framework that lets different systems communicate through a standardized interface. This test framework provides a way to exercise the functionality and performance of MCP servers.

## Test File Layout

The framework consists of the following files:

### 1. minimal_fastmcp_test.py

A minimal FastMCP server implementation used to test basic functionality:

- creates a FastMCP instance
- registers a simple tool function (the ping tool)
- runs the server over the STDIO transport

The file can be run standalone or launched as a subprocess by other test scripts.

### 2. test_minimal_client.py

This script uses the MCP client library to test minimal_fastmcp_test.py:

- imports the required MCP client libraries (ClientSession, stdio_client, etc.)
- connects to minimal_fastmcp_test.py and tests the ping tool
- demonstrates how to call tools through the client API

## Test Method

### Client library test (test_minimal_client.py)

This approach talks to the MCP server through the MCP client library, showing how the client is used in a real application. The flow is:

1. create a ClientSession object
2. connect to the MCP server
3. call tools and process the results

## Running the Tests

### Run the client library test

```bash
python core/mcp/test/test_minimal_client.py
```

## Extending the Tests

### Adding a new tool

To add a new tool to minimal_fastmcp_test.py:

1. define a new async tool function
2. register it with the FastMCP instance's decorator

Example:

```python
async def new_tool(param1: str, param2: int = 0) -> str:
    """A new tool description."""
    # tool implementation
    return f"Result: {param1}, {param2}"

mcp_server.tool(name="new_tool", description="New tool description.")(new_tool)
```
### Creating new test scripts

Use the existing test scripts as templates for new scripts covering other features or scenarios.

## Troubleshooting

### Server not responding

- make sure the server process is running
- check that the transport (stdio or sse) is correct
- check the client connection parameters

### Tool call fails

- make sure the tool name is correct
- check that the arguments match the tool's requirements
- check the server logs for more information

## Summary

The MCP test framework demonstrates how to test MCP server functionality with the MCP client library. These tests validate the server's basic behavior and performance, supporting development and debugging.


================================================
FILE: core/mcp/test/__init__.py
================================================
# MCP test module
# Contains test scripts for MCP (Model Context Protocol) functionality


================================================
FILE: core/mcp/test/minimal_fastmcp_test.py
================================================
import asyncio
from mcp.server.fastmcp import FastMCP
import logging

# Basic logging, to surface any extra information from inside FastMCP
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger("minimal_test")

print("--- Minimal FastMCP Server Test ---")

# 1. Create the FastMCP instance
# (assuming FastMCP needs no host/port in __init__ for stdio)
mcp_server = FastMCP(name="MinimalServer")
print("FastMCP instance created.")

# 2. Define a simple async tool function
async def ping_tool(query: str = "default ping") -> str:
    """A very basic tool that just returns pong."""
    print(f"\n--- PING TOOL CALLED! ---")  # log from inside the tool
    print(f"Received query: {query}")
    result = f"pong: {query}"
    print(f"Returning: {result}")
    print(f"--- PING TOOL END ---")
    return result

# 3. Register it directly with the FastMCP instance's decorator
try:
    mcp_server.tool(name="ping", description="Returns pong plus the query.")(ping_tool)
    # The line above is equivalent to:
    # @mcp_server.tool(name="ping", description="Returns pong plus the query.")
    # async def ping_tool(...) ...
    print("Tool 'ping' registered directly with FastMCP.")
except Exception as e_reg:
    print(f"Error registering tool directly: {e_reg}")
    import traceback
    traceback.print_exc()
    exit(1)
# 4. Run the server (over STDIO)
try:
    print("Starting minimal server with STDIO transport...")
    # Assuming run() needs only the transport argument for stdio
    mcp_server.run(transport="stdio")
    print("Server finished.")  # should not be reached unless the server stops
except Exception as e_run:
    print(f"Error running minimal server: {e_run}")
    import traceback
    traceback.print_exc()
    exit(1)


================================================
FILE: core/mcp/test/test_minimal_client.py
================================================
# test_minimal_client_fixed.py - client script for testing minimal_fastmcp_test.py (fixed version)
import os
import sys
import asyncio
import json
import traceback
from typing import Optional, Dict, Any

# Add the project root to the path
sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))

# Import the required MCP client libraries
try:
    from mcp import ClientSession
    from mcp.client.stdio import stdio_client, StdioServerParameters
    from mcp.types import CallToolRequest
    DEPS_OK = True
except ImportError as e:
    print(f"Error: missing required dependency: {e}")
    print("Make sure the mcp library is installed: pip install mcp")
    DEPS_OK = False

async def main():
    """Connect to minimal_fastmcp_test.py and test the ping tool."""
    print("=== MCP Minimal Client Test (fixed) ===\n")
    if not DEPS_OK:
        print("Missing required dependencies; cannot continue.")
        return

    # Path to minimal_fastmcp_test.py
    script_path = os.path.join(os.path.dirname(__file__), "minimal_fastmcp_test.py")
    cmd = [sys.executable, script_path]
    print(f"Preparing to connect to server: {script_path}")
    try:
        # Create the StdioServerParameters object
        server_params = StdioServerParameters(
            command=sys.executable,
            args=[script_path],
            # other parameters such as env, cwd can be added as needed
        )
        print("Server parameter configuration created.")

        # Create the STDIO client connection
        print("\nCreating STDIO client connection...")
        async with stdio_client(server_params) as (reader, writer):
            print("STDIO connection established. Creating ClientSession...")
            async with ClientSession(reader, writer) as session:
                print("ClientSession created. Initializing session...")
                await session.initialize()
                print("Session initialized.")

                # List the tools supported by the server
                print("\nFetching the server's tool list...")
                tools_result = await session.list_tools()
                print(f"Server tools: {tools_result}")

                # Call the ping tool
                print("\nCalling the ping tool...")
                ping_request = CallToolRequest(
                    method="tools/call",
                    params={
                        "name": "ping",
                        "arguments": {"query": "Hello, MCP!"}
                    }
                )
                try:
                    print(f"Sending request: {ping_request}")
                    result = await session.call_tool("ping", {"query": "Hello, MCP!"})
                    print(f"\nResponse received: {result}")
                    if hasattr(result, 'result'):
                        print(f"Result: {result.result}")
                    elif hasattr(result, 'error'):
                        print(f"Error: {result.error}")
                    else:
                        print(f"Unknown response format: {result}")
                except Exception as e:
                    print(f"Error calling tool: {e}")
                    print(traceback.format_exc())
    except Exception as e:
        print(f"Error running test: {e}")
        print(traceback.format_exc())

if __name__ == "__main__":
    asyncio.run(main())
"""预注册核心工具,确保系统启动时这些工具已经可用""" print("开始预注册核心工具...") # 注册搜索类工具 try: # Tavily搜索工具 tavily_search = TavilySearchResults() register_tool(tavily_search, ToolCategory.SEARCH) print(f"已预注册工具: {tavily_search.name} (类别: {ToolCategory.SEARCH.value})") except Exception as e: print(f"预注册Tavily搜索工具失败: {e}") # 注册网页浏览类工具 try: # Arxiv查询工具 arxiv_tool = ArxivQueryRun() register_tool(arxiv_tool, ToolCategory.WEB_BROWSING) print(f"已预注册工具: {arxiv_tool.name} (类别: {ToolCategory.WEB_BROWSING.value})") except Exception as e: print(f"预注册Arxiv查询工具失败: {e}") try: # RequestoolKit请求工具 # 创建TextRequestsWrapper实例作为请求包装器 requests_wrapper = TextRequestsWrapper(headers={}) # 初始化RequestsToolkit,提供必要的参数 requests_toolkit = RequestsToolkit( requests_wrapper=requests_wrapper, allow_dangerous_requests=True # 允许危险请求,使工具可用 ) for req_tool in requests_toolkit.get_tools(): register_tool(req_tool, ToolCategory.WEB_BROWSING) print(f"已预注册工具: {req_tool.name} (类别: {ToolCategory.WEB_BROWSING.value})") except Exception as e: print(f"预注册 RequestoolKit请求工具失败: {e}") # 注册文件系统工具 try: # 获取当前目录作为文件系统工具的根目录 current_dir = os.getcwd() # 创建文件系统工具集 filesystem_toolkit = FileManagementToolkit( root_dir=current_dir, selected_tools=["write_file", "read_file", "list_directory"] ) # 获取文件系统工具并注册 for fs_tool in filesystem_toolkit.get_tools(): register_tool(fs_tool, ToolCategory.FILE_SYSTEM) print(f"已预注册工具: {fs_tool.name} (类别: {ToolCategory.FILE_SYSTEM.value})") except Exception as e: print(f"预注册文件系统工具失败: {e}") # 注册代码解释器工具 # try: # # Python REPL工具 # python_repl = ExecPython() # register_tool(python_repl, ToolCategory.CODE_INTERPRETER) # print(f"已预注册工具: {python_repl.name} (类别: {ToolCategory.CODE_INTERPRETER.value})") # except Exception as e: # print(f"预注册Python REPL工具失败: {e}") # # 注册代码解释器工具 # try: # # Python REPL工具 # javascript_repl = ExecJavaScript() # register_tool(javascript_repl, ToolCategory.CODE_INTERPRETER) # print(f"已预注册工具: {javascript_repl.name} (类别: {ToolCategory.CODE_INTERPRETER.value})") # except Exception as e: # print(f"预注册Python REPL工具失败: {e}") # 注册自定义工具 - FireCrawl工具 try: firecrawl_tool = FireCrawlTool() register_tool(firecrawl_tool, ToolCategory.WEB_BROWSING) print(f"已预注册工具: {firecrawl_tool.name} (类别: {ToolCategory.WEB_BROWSING.value})") except Exception as e: print(f"预注册FireCrawl工具失败: {e}") # 注册E2B代码解释器工具 try: e2b_tool = E2BCodeInterpreterTool() register_tool(e2b_tool, ToolCategory.CODE_INTERPRETER) print(f"已预注册工具: {e2b_tool.name} (类别: {ToolCategory.CODE_INTERPRETER.value})") except Exception as e: print(f"预注册E2B代码解释器工具失败: {e}") from .replicate_flux_tool import ReplicateFluxImageTool, category try: flux_tool = ReplicateFluxImageTool() if flux_tool._is_available: register_tool(flux_tool, category) except Exception as e: print(f"Failed to register ReplicateFluxImageTool: {e}") print("核心工具预注册完成") # 执行预注册 preregister_core_tools() # 注册 LangChain 工具 - 使用load_tools加载的工具列表 try: langchain_tools = load_tools(["serpapi"]) for tool in langchain_tools: register_tool(tool, ToolCategory.SEARCH) print(f"已注册LangChain工具: {tool.name} (类别: {ToolCategory.SEARCH.value})") except Exception as e: print(f"加载LangChain工具失败: {e}") # 工具类别映射 - 用于自动分类直接导入的工具 tool_category_mapping = { # 搜索类工具 "TavilySearchResults": ToolCategory.SEARCH, "GoogleSearchResults": ToolCategory.SEARCH, "GoogleSerperResults": ToolCategory.SEARCH, "WikipediaQueryRun": ToolCategory.SEARCH, "FireCrawl": ToolCategory.SEARCH, # 网页浏览类工具 "WebBrowser": ToolCategory.WEB_BROWSING, "ArxivQueryRun": ToolCategory.WEB_BROWSING, "RequestsGet": ToolCategory.WEB_BROWSING, "RequestsPost": ToolCategory.WEB_BROWSING, # 
================================================
FILE: core/tools/e2b_tool.py
================================================
# core/tools/e2b_tool.py
import os
import json
import asyncio
import traceback
from typing import Dict, Any, Optional, Type, List  # make sure List is imported
from pydantic import BaseModel, Field, PrivateAttr
from langchain_core.tools import BaseTool

# --- E2B Imports ---
try:
    from e2b_code_interpreter import Sandbox
    from e2b_code_interpreter.exceptions import TimeoutException
    try:
        # SandboxException must also be bound on the success path, otherwise
        # the `except (SandboxException, ...)` clauses below raise NameError.
        from e2b_code_interpreter.exceptions import SandboxException
    except ImportError:
        SandboxException = Exception  # type: ignore
    E2B_AVAILABLE = True
except ImportError:
    Sandbox = None  # type: ignore
    SandboxException = Exception  # type: ignore # Fallback to base Exception
    TimeoutException = TimeoutError  # type: ignore # Fallback to base TimeoutError
    E2B_AVAILABLE = False
    print("Warning: 'e2b-code-interpreter' package not installed (pip install e2b-code-interpreter). E2BCodeInterpreterTool will not work.")

# --- Tool Category ---
try:
    from .registry import ToolCategory, register_tool
    if not hasattr(ToolCategory, 'CODE_INTERPRETER'):
        ToolCategory.CODE_INTERPRETER = ToolCategory.OTHER
    category = ToolCategory.CODE_INTERPRETER
except ImportError:
    category = None
    print("Tool registry not found.")

# --- Input Schema (unchanged) ---
class E2BCodeInterpreterToolInput(BaseModel):
    code: str = Field(description="The Python code to execute")

# --- Tool Class (optimized version) ---
class E2BCodeInterpreterTool(BaseTool):
    """
    Tool that executes Python code in a secure sandbox via the E2B SDK
    (with corrected exception handling). Returns a string summary of the
    execution result.
    """
    name: str = "e2b_code_interpreter"
    description: str = (
        # The description emphasizes that this is a Python execution environment
        "Executes Python code in a sandboxed environment. "
        "Input MUST be a JSON object with a 'code' key containing the Python code string. "
        "Libraries like matplotlib, pandas, numpy, sympy are available. Install others using pip (e.g., `import subprocess; subprocess.run(['pip', 'install', 'requests'])`). "
        "Use 'print()' to output results. For plots, save them to a file (e.g., '/home/user/plot.png') and state the path; do not return raw image data. "
        "Returns a string summarizing execution status, stdout, stderr, and any errors."
    )
    args_schema: Type[BaseModel] = E2BCodeInterpreterToolInput

    _sandbox: Optional[Any] = PrivateAttr(default=None)
    _is_available: bool = PrivateAttr(default=False)
    _init_error: Optional[str] = PrivateAttr(default=None)
    # self.ExceptionClass is no longer needed

    def __init__(self, **kwargs):
        super().__init__(**kwargs)
        self._initialize_sandbox()

    def _initialize_sandbox(self):
        """Initialize the sandbox environment."""
        if not E2B_AVAILABLE:
            self._init_error = "Package 'e2b-code-interpreter' not installed."
            print(f"ERROR: {self._init_error}")
            return
        if "E2B_API_KEY" not in os.environ:
            self._init_error = "Environment variable E2B_API_KEY not set."
            print(f"ERROR: {self._init_error}")
            return
        try:
            print("Initializing E2B Sandbox...")
            # Instantiate the Sandbox
            self._sandbox = Sandbox()  # uses the imported Sandbox class
            print("E2B Sandbox initialized successfully!")
            self._is_available = True
            self._init_error = None
        except (SandboxException, TimeoutException) as e:  # <--- catch the specific E2B exceptions
            self._init_error = f"Failed to initialize E2B Sandbox (E2B Error): {e}"
            print(f"ERROR: {self._init_error}")
            self._is_available = False
        except Exception as e:  # catch any other unexpected error
            self._init_error = f"An unexpected error occurred during E2B Sandbox initialization: {e}"
            print(f"ERROR: {self._init_error}")
            self._is_available = False

    def _run(self, code: str, **kwargs) -> str:
        """Execute Python code synchronously and return a summary string."""
        if not self._is_available or self._sandbox is None:
            # Return an error message that includes the setup guide
            error_message = "E2B Sandbox is not available"
            if self._init_error:
                error_message += f": {self._init_error}"
            setup_guide = "\n\nSetup: pip install e2b-code-interpreter; export E2B_API_KEY='...'"
            return f"Execution Failed: {error_message}{setup_guide}"

        output_summary = ""
        try:
            print(f"--- E2B: Executing code synchronously ---\n{code}\n--------------------------------------")
            # Execute via the run_code method
            execution = self._sandbox.run_code(code)

            # Build the result string (same logic as before)
            if execution.error:
                output_summary += f"Execution Failed!\nError Name: {execution.error.name}\nError Value: {execution.error.value}\n"
                if execution.error.traceback:
                    traceback_lines = execution.error.traceback.splitlines()
                    output_summary += f"Traceback (last few lines):\n...\n" + "\n".join(traceback_lines[-5:])
            else:
                output_summary += "Execution Successful.\n"
            if execution.logs.stdout:
                output_summary += f"\nSTDOUT:\n{execution.logs.stdout}"
            if execution.logs.stderr:
                output_summary += f"\nSTDERR:\n{execution.logs.stderr}"
            if execution.results:
                output_summary += "\n\nNote: Execution produced structured results (e.g., plots saved as files)."
            if not output_summary.strip() or output_summary.strip() == "Execution Successful.":
                output_summary = "Code executed successfully with no textual output."
            print(f"--- E2B: Execution finished ---\nResult Summary:\n{output_summary[:500]}...\n-----------------------------")
            return output_summary.strip()
        except (SandboxException, TimeoutException) as e:  # <--- catch the specific E2B exceptions
            error_str = f"Execution Failed (E2B Error)!\nError Name: {getattr(e, 'name', type(e).__name__)}\nDetails: {e}"
            # TimeoutException may not carry a traceback attribute; SandboxException usually does
            tb = getattr(e, 'traceback', traceback.format_exc())
            if tb:
                tb_lines = tb.splitlines()
                error_str += f"\nTraceback (last few lines):\n...\n" + "\n".join(tb_lines[-5:])
            print(f"ERROR during E2B execution: {error_str}")
            return error_str
        except Exception as e:  # any other error
            error_str = f"Execution Failed (Unexpected Error)!\nError Type: {type(e).__name__}\nError Details: {str(e)}\nTraceback:\n{traceback.format_exc()}"
            print(f"ERROR during E2B execution: {error_str}")
            return error_str

    async def _arun(self, code: str, **kwargs) -> str:
        """Execute Python code asynchronously and return a summary string."""
        if not self._is_available or self._sandbox is None:
            error_message = f"E2B Sandbox is not available: {self._init_error}"
            return f"Execution Failed: {error_message}"
        try:
            loop = asyncio.get_running_loop()
            import functools
            # The callable passed to run_in_executor must be invocable without
            # arguments, so bind `code` (and any extra kwargs) with
            # functools.partial (a lambda would also work).
            sync_run_with_args = functools.partial(self._run, code=code, **kwargs)
            print(f"--- E2B: Executing code asynchronously via executor ---\n{code}\n--------------------------------------")
            result_summary = await loop.run_in_executor(None, sync_run_with_args)
            print(f"--- E2B: Async execution finished ---")
            return result_summary
        except Exception as e:
            # Exceptions from run_in_executor or _run are caught here
            error_str = f"Execution Failed (Async Wrapper Error)!\nError Type: {type(e).__name__}\nError Details: {str(e)}"
            tb = traceback.format_exc()
            error_str += f"\nTraceback:\n{tb}"
            print(f"ERROR during E2B async execution: {error_str}")
            return error_str

    def close(self):
        """Shut down the sandbox and release its resources."""
        # Note: the attribute is the private `_sandbox`; the earlier
        # `hasattr(self, "sandbox")` guard was always False.
        if self._is_available and self._sandbox is not None:
            try:
                print("Attempting to close E2B Sandbox...")
                self._sandbox.kill()
                print("E2B Sandbox closed successfully.")
                self._is_available = False
                self._sandbox = None
            except (SandboxException, TimeoutException) as e:  # catch the specific exceptions
                print(f"Error closing E2B Sandbox (E2B Error): {e}")
            except Exception as e:
                print(f"An unexpected error occurred while closing E2B Sandbox: {e}")

    model_config = {
        "arbitrary_types_allowed": True
    }

    # __del__ runs at object destruction and is not guaranteed to execute;
    # do not rely on it to release resources.
    # def __del__(self): self.close()
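A minimal usage sketch for the tool above, assuming E2B_API_KEY is set and e2b-code-interpreter is installed:

# Minimal sketch: run a snippet in the sandbox and close it afterwards.
from core.tools.e2b_tool import E2BCodeInterpreterTool

tool = E2BCodeInterpreterTool()
try:
    # BaseTool.invoke validates the input against args_schema
    summary = tool.invoke({"code": "print(21 * 2)"})
    print(summary)  # on success, contains "STDOUT:" with "42"
finally:
    tool.close()  # kill the sandbox explicitly; __del__ is not relied upon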
" "Libraries like matplotlib, pandas, numpy, sympy are available. Install others using pip (e.g., `import subprocess; subprocess.run(['pip', 'install', 'requests'])`). " "Use 'print()' to output results. For plots, save them to a file (e.g., '/home/user/plot.png') and state the path; do not return raw image data. " "Returns a string summarizing execution status, stdout, stderr, and any errors." ) args_schema: Type[BaseModel] = E2BCodeInterpreterToolInput _sandbox: Optional[Any] = PrivateAttr(default=None) _is_available: bool = PrivateAttr(default=False) _init_error: Optional[str] = PrivateAttr(default=None) # 不再需要 self.ExceptionClass def __init__(self, **kwargs): super().__init__(**kwargs) self._initialize_sandbox() def _initialize_sandbox(self): """初始化沙箱环境""" if not E2B_AVAILABLE: self._init_error = "Package 'e2b' not installed." print(f"ERROR: {self._init_error}") return if "E2B_API_KEY" not in os.environ: self._init_error = "Environment variable E2B_API_KEY not set." print(f"ERROR: {self._init_error}") return try: print("Initializing E2B Sandbox...") # 实例化 Sandbox self._sandbox = Sandbox() # 使用导入的 Sandbox 类 print("E2B Sandbox initialized successfully!") self._is_available = True self._init_error = None except (SandboxException, TimeoutException) as e: # <--- 捕获特定的 E2B 异常 self._init_error = f"Failed to initialize E2B Sandbox (E2B Error): {e}" print(f"ERROR: {self._init_error}") self._is_available = False except Exception as e: # 捕获其他意外错误 self._init_error = f"An unexpected error occurred during E2B Sandbox initialization: {e}" print(f"ERROR: {self._init_error}") self._is_available = False def _run(self, code: str, **kwargs) -> str: """同步执行 Python 代码并返回结果摘要字符串""" if not self._is_available or self._sandbox is None: # ... (返回包含设置指南的错误信息,不变) ... error_message = "E2B Sandbox is not available" if self._init_error: error_message += f": {self._init_error}" setup_guide = "\n\nSetup: pip install e2b; export E2B_API_KEY='...'" return f"Execution Failed: {error_message}{setup_guide}" output_summary = "" try: print(f"--- E2B: Executing code synchronously ---\n{code}\n--------------------------------------") # 使用 run_python 方法 execution = self._sandbox.run_code(code) # 构建结果字符串 (逻辑保持不变) if execution.error: output_summary += f"Execution Failed!\nError Name: {execution.error.name}\nError Value: {execution.error.value}\n" if execution.error.traceback: traceback_lines = execution.error.traceback.splitlines() output_summary += f"Traceback (last few lines):\n...\n" + "\n".join(traceback_lines[-5:]) else: output_summary += "Execution Successful.\n" if execution.logs.stdout: output_summary += f"\nSTDOUT:\n{execution.logs.stdout}" if execution.logs.stderr: output_summary += f"\nSTDERR:\n{execution.logs.stderr}" if execution.results: output_summary += "\n\nNote: Execution produced structured results (e.g., plots saved as files)." if not output_summary.strip() or output_summary.strip() == "Execution Successful.": output_summary = "Code executed successfully with no textual output." 
print(f"--- E2B: Execution finished ---\nResult Summary:\n{output_summary[:500]}...\n-----------------------------") return output_summary.strip() except (SandboxException, TimeoutException) as e: # <--- 捕获特定的 E2B 异常 error_str = f"Execution Failed (E2B Error)!\nError Name: {getattr(e, 'name', type(e).__name__)}\nDetails: {e}" # TimeoutException 可能没有 traceback 属性,SandboxException 通常有 tb = getattr(e, 'traceback', traceback.format_exc()) if tb: tb_lines = tb.splitlines() error_str += f"\nTraceback (last few lines):\n...\n" + "\n".join(tb_lines[-5:]) print(f"ERROR during E2B execution: {error_str}") return error_str except Exception as e: # 其他错误 error_str = f"Execution Failed (Unexpected Error)!\nError Type: {type(e).__name__}\nError Details: {str(e)}\nTraceback:\n{traceback.format_exc()}" print(f"ERROR during E2B execution: {error_str}") return error_str async def _arun(self, code: str, **kwargs) -> str: """异步执行 Python 代码并返回结果摘要字符串""" if not self._is_available or self._sandbox is None: # ... (返回错误信息) ... error_message = f"E2B Sandbox is not available: {self._init_error}" return f"Execution Failed: {error_message}" try: loop = asyncio.get_running_loop() import functools # 注意:传递给 run_in_executor 的函数应该是可调用的 # 这里 _run 是实例方法,所以直接传递 self._run 即可 # 但为了确保 code 参数被正确传递,可以用 lambda 或 partial sync_run_with_args = functools.partial(self._run, code=code, **kwargs) print(f"--- E2B: Executing code asynchronously via executor ---\n{code}\n--------------------------------------") result_summary = await loop.run_in_executor( None, sync_run_with_args ) print(f"--- E2B: Async execution finished ---") return result_summary except Exception as e: # run_in_executor 或 _run 的异常会在这里捕获 error_str = f"Execution Failed (Async Wrapper Error)!\nError Type: {type(e).__name__}\nError Details: {str(e)}" # 尝试获取 Traceback tb = traceback.format_exc() error_str += f"\nTraceback:\n{tb}" print(f"ERROR during E2B async execution: {error_str}") return error_str def close(self): """关闭沙箱,释放资源。""" if hasattr(self, "sandbox") and self._is_available and self._sandbox is not None: try: print("Attempting to close E2B Sandbox...") self._sandbox.kill() print("E2B Sandbox closed successfully.") self._is_available = False self._sandbox = None except (SandboxException, TimeoutException) as e: # 捕获特定异常 print(f"Error closing E2B Sandbox (E2B Error): {e}") except Exception as e: print(f"An unexpected error occurred while closing E2B Sandbox: {e}") model_config = { "arbitrary_types_allowed": True } # __del__ 方法用于对象销毁,通常不保证执行,不建议依赖它来关闭资源 # def __del__(self): self.close() ================================================ FILE: core/tools/firecrawl_tool.py ================================================ # 文件路径: core/tools/firecrawl_tool.py (或您存放工具的文件) import os import json # 虽然不直接返回 JSON,但可能用于处理 metadata from typing import Dict, List, Literal, Optional, Tuple, Type, Union, Any # 确保导入 from pydantic import BaseModel, Field, PrivateAttr # 导入 PrivateAttr from langchain_core.callbacks import ( AsyncCallbackManagerForToolRun, CallbackManagerForToolRun, ) from langchain_core.tools import BaseTool from dotenv import load_dotenv load_dotenv() # 自动加载 .env 文件 # 尝试导入 FireCrawlLoader,如果失败则标记 try: from langchain_community.document_loaders import FireCrawlLoader FIRECRAWL_LOADER_AVAILABLE = True except ImportError: FireCrawlLoader = None # type: ignore FIRECRAWL_LOADER_AVAILABLE = False print("Warning: langchain_community or firecrawl-py not installed? 
FireCrawlLoader unavailable.") print("Run: pip install -U langchain-community firecrawl-py") # 定义输入 Schema (保持不变) class FireCrawlInput(BaseModel): """Input for the FireCrawl tool.""" url: str = Field(description="URL to crawl or scrape") mode: str = Field( default="scrape", # <-- 将默认模式改为 'scrape' 可能更常用 description="Mode: 'scrape' (single page), 'crawl' (multiple pages). Default: 'scrape'", ) # 可以添加 params 字段如果希望 LLM 控制更多参数 # params: Optional[Dict[str, Any]] = Field(default=None, description="Optional dictionary of additional FireCrawl parameters (e.g., {'pageOptions': {'onlyMainContent': True}})") class FireCrawlTool(BaseTool): """ Tool that uses FireCrawl API to crawl or scrape web content and return a summary. Setup: pip install -U langchain-community firecrawl-py export FIRECRAWL_API_KEY="your-api-key" Instantiate: tool = FireCrawlTool() # Reads API key from env # Or explicitly: tool = FireCrawlTool(api_key="...") Invoke: tool.invoke({"url": "https://example.com", "mode": "scrape"}) """ name: str = "firecrawl_web_content" # 建议用更描述性的名字 description: str = ( "Fetches and extracts the main textual content from a given URL. " "Use 'scrape' mode (default) for a single page, or 'crawl' mode to follow links (use sparingly). " "Input should be a URL. Returns a textual summary of the content." ) args_schema: Type[BaseModel] = FireCrawlInput # --- 配置属性 --- # API Key 可以通过 __init__ 传入,或者留空让 loader 从环境变量读取 _api_key: Optional[str] = PrivateAttr(default=None) # 使用 PrivateAttr 避免 Pydantic 验证 _api_url: Optional[str] = PrivateAttr(default=None) # 可以在 __init__ 中设置默认 mode 和 params,或者在 _run/_arun 中处理 default_mode: str = "scrape" # 工具级别的默认模式 default_params: Dict[str, Any] = Field(default_factory=dict) # 工具级别的默认参数 # 添加 __init__ 以便可以传入 api_key (可选) def __init__(self, api_key: Optional[str] = None, api_url: Optional[str] = None, mode: str = "scrape", params: Optional[Dict[str, Any]] = None, **kwargs): super().__init__(**kwargs) # Pydantic V2 中,非 model 字段需要用 PrivateAttr 或在 model_config 中设置 self._api_key = api_key self._api_url = api_url self.default_mode = mode self.default_params = params or {} # 检查 Loader 是否可用 if not FIRECRAWL_LOADER_AVAILABLE: print("ERROR: FireCrawlLoader is unavailable. Please install required packages.") def _run( self, url: str, mode: Optional[str] = None, run_manager: Optional[CallbackManagerForToolRun] = None, ) -> str: # <--- 返回值必须是字符串 """使用工具同步获取网页内容。""" if not FIRECRAWL_LOADER_AVAILABLE: return "Error: FireCrawlLoader is not available. Required packages might be missing." # 确定使用的 API Key (优先实例属性,其次环境变量) key = self._api_key or os.getenv('FIRECRAWL_API_KEY') if not key: return "Error: FIRECRAWL_API_KEY not found in environment variables or instantiation." # 打印 Debug 信息 (可选) print(f"DEBUG [FireCrawlTool]: Running for URL='{url}', Mode='{mode or self.default_mode}'") # print(f"DEBUG [FireCrawlTool]: Effective API Key = {'*' * (len(key) - 4) + key[-4:] if key else 'None'}") try: current_mode = mode or self.default_mode loader = FireCrawlLoader( url=url, api_key=key, # 传递最终确定的 key api_url=self._api_url, # 传递实例属性或 None mode=current_mode, params=self.default_params, # 传递实例默认参数 ) print(f"--- Calling FireCrawl API (Sync) for: '{url}' ---") docs = loader.load() print(f"--- FireCrawl API call successful for: '{url}', received {len(docs)} document(s) ---") # --- 格式化结果为字符串 --- if not docs: return f"FireCrawl successful but returned no content from {url} (Mode: {current_mode}). The page might be empty or restricted." 
summary_parts = [f"Content summary from {url} (Mode: {current_mode}):"] content_limit = 4000 # 限制返回给 LLM 的总字符数 (可调整) current_length = len(summary_parts[0]) doc_count = 0 for doc in docs: # 可以考虑只返回第一个文档的内容,如果文档很多 # if doc_count >= 1 and current_mode == 'scrape': break source_info = f"\n\n--- Source: {doc.metadata.get('sourceURL', url)} ---" page_content = doc.page_content or "" available_length = content_limit - current_length - len(source_info) - 20 # 预留空间 if available_length <= 0 and doc_count > 0: # 如果已经有内容且空间不足 summary_parts.append("\n\n... (further content truncated)") break content = source_info + "\n" + page_content if len(content) > available_length: content = content[:available_length] + "... (truncated)" summary_parts.append(content) current_length += len(content) doc_count += 1 if current_length >= content_limit: break # 达到总长度限制 return "\n".join(summary_parts).strip() # --- 格式化结束 --- except Exception as e: error_msg = f"Error during FireCrawl for {url} (Mode: {mode or self.default_mode}): {repr(e)}" print(f"ERROR: {error_msg}") return error_msg # 返回错误信息字符串 async def _arun( self, url: str, mode: Optional[str] = None, run_manager: Optional[AsyncCallbackManagerForToolRun] = None, ) -> str: # <--- 返回值必须是字符串 """使用工具异步获取网页内容。""" if not FIRECRAWL_LOADER_AVAILABLE: return "Error: FireCrawlLoader is not available." key = self.api_key or os.getenv('FIRECRAWL_API_KEY') if not key: return "Error: FIRECRAWL_API_KEY not found." print(f"DEBUG [FireCrawlTool]: Running async for URL='{url}', Mode='{mode or self.default_mode}'") try: current_mode = mode or self.default_mode loader = FireCrawlLoader( url=url, api_key=key, api_url=self.api_url, mode=current_mode, params=self.default_params, ) print(f"--- Calling FireCrawl API (Async) for: '{url}' ---") # 使用 aload 进行异步加载 docs = await loader.aload() print(f"--- FireCrawl API call successful for: '{url}', received {len(docs)} document(s) ---") # --- 格式化结果为字符串 (与 _run 逻辑相同) --- if not docs: return f"FireCrawl successful but returned no content from {url} (Mode: {current_mode})." summary_parts = [f"Content summary from {url} (Mode: {current_mode}):"] content_limit = 4000; current_length = len(summary_parts[0]); doc_count = 0 for doc in docs: # if doc_count >= 1 and current_mode == 'scrape': break source_info = f"\n\n--- Source: {doc.metadata.get('sourceURL', url)} ---" page_content = doc.page_content or "" available_length = content_limit - current_length - len(source_info) - 20 if available_length <= 0 and doc_count > 0: summary_parts.append("\n\n... (further content truncated)"); break content = source_info + "\n" + page_content if len(content) > available_length: content = content[:available_length] + "... 
(truncated)" summary_parts.append(content); current_length += len(content); doc_count += 1 if current_length >= content_limit: break return "\n".join(summary_parts).strip() # --- 格式化结束 --- except Exception as e: error_msg = f"Error during Async FireCrawl for {url} (Mode: {mode or self.default_mode}): {repr(e)}" print(f"ERROR: {error_msg}") return error_msg # Pydantic V2: 允许额外的私有属性 model_config = { "arbitrary_types_allowed": True } ================================================ FILE: core/tools/registry.py ================================================ from enum import Enum from typing import List, Dict, Union, Optional from langchain.tools import Tool # 定义工具分类枚举 class ToolCategory(Enum): SEARCH = "Search" CODE_INTERPRETER = "Code Interpreter" WEB_BROWSING = "Web Browsing" DATABASE = "Database" FILE_SYSTEM = "FileSystem" IMAGE_GENERATION = "Image Generation" OTHER = "Other" # 全局工具注册表 _registered_tools = {} def register_tool(tool: Tool, category: ToolCategory) -> None: """注册一个工具到全局字典中,带有分类信息 如果工具名已存在,将覆盖现有的工具注册信息 """ if tool.name in _registered_tools: print(f"警告: 工具名 {tool.name} 已存在,将覆盖现有注册信息") _registered_tools[tool.name] = { "tool": tool, "category": category } def get_registered_tools(as_dict: bool = False) -> Union[List[Tool], Dict[str, Dict]]: """返回所有已注册的工具 Args: as_dict: 如果为True,返回原始字典格式;如果为False,返回工具列表 Returns: 如果as_dict为True,返回原始字典格式;否则返回工具列表 """ if as_dict: return _registered_tools return [info["tool"] for info in _registered_tools.values()] def get_tools_list() -> List[Tool]: """返回所有已注册的工具列表,直接可用于Agent初始化 Returns: 所有已注册工具的列表 """ return [info["tool"] for info in _registered_tools.values()] def get_tools_dict() -> Dict[str, Tool]: """返回工具名称到工具实例的映射字典 Returns: 工具名称到工具实例的映射字典 """ return {name: info["tool"] for name, info in _registered_tools.items()} def get_tool(name: str) -> Optional[Dict]: """根据名称获取工具及其分类 Args: name: 工具名称 Returns: 包含工具和分类的字典,如果工具不存在则返回None """ tool_info = _registered_tools.get(name) if tool_info: return { "tool": tool_info["tool"], "category": tool_info["category"].value } return None def get_tool_instance(name: str) -> Optional[Tool]: """根据名称直接获取工具实例 Args: name: 工具名称 Returns: 工具实例,如果工具不存在则返回None """ tool_info = _registered_tools.get(name) return tool_info["tool"] if tool_info else None def get_tools_by_category(category: ToolCategory, return_instances: bool = True) -> List[Union[str, Tool]]: """返回指定分类的工具列表 Args: category: 工具分类 return_instances: 如果为True,返回工具实例列表;如果为False,返回工具名称列表 Returns: 工具实例列表或工具名称列表 """ if return_instances: return [info["tool"] for name, info in _registered_tools.items() if info["category"] == category] return [name for name, info in _registered_tools.items() if info["category"] == category] ================================================ FILE: core/tools/replicate_flux_tool.py ================================================ # 文件路径: core/tools/replicate_flux_tool.py (或类似) import os import asyncio import json from typing import Dict, Any, Optional, Type, List, Literal from pydantic import BaseModel, Field, PrivateAttr from langchain_core.tools import BaseTool from langchain_core.callbacks import ( AsyncCallbackManagerForToolRun, CallbackManagerForToolRun, ) # --- Replicate Client --- try: import replicate REPLICATE_AVAILABLE = True except ImportError: replicate = None # type: ignore REPLICATE_AVAILABLE = False print("Warning: 'replicate' package not installed (pip install replicate). 
ReplicateFluxImageTool will not work.") # --- Tool Category (可选, 用于 Registry) --- try: from .registry import ToolCategory, register_tool if not hasattr(ToolCategory, 'IMAGE_GENERATION'): ToolCategory.IMAGE_GENERATION = ToolCategory.OTHER category = ToolCategory.IMAGE_GENERATION except ImportError: category = None print("Tool registry not found. Cannot auto-register ReplicateFluxImageTool.") # --- Input Schema based on flux-dev --- class ReplicateFluxToolInput(BaseModel): """Input schema for the Replicate Flux Image Generator Tool.""" prompt: str = Field(description="Required. Detailed text description of the image to be generated.") aspect_ratio: Literal["1:1", "16:9", "21:9", "3:2", "2:3", "4:5", "5:4", "3:4", "4:3", "9:16", "9:21"] = Field( default="1:1", description="Aspect ratio for the generated image." ) num_outputs: int = Field( default=1, description="Number of images to generate (1-4).", ge=1, le=4 ) guidance: float = Field( default=3.0, description="Guidance scale (0-10).", ge=0, le=10 ) num_inference_steps: int = Field( default=28, description="Number of denoising steps (1-50). Lower is faster, lower quality.", ge=1, le=50 ) seed: Optional[int] = Field(default=None, description="Random seed for reproducible generation.") # Add other relevant fields from the schema if needed, e.g., megapixels, output_format # megapixels: Literal["1", "0.25"] = Field(default="1", description="Approximate megapixels for output.") # output_format: Literal["webp", "jpg", "png"] = Field(default="webp", description="Output image format.") # --- Tool Class (修正返回值处理) --- class ReplicateFluxImageTool(BaseTool): """Generates images using 'black-forest-labs/flux-dev' on Replicate.""" name: str = "replicate_flux_image_generator" description: str = ( "Generates high-quality images based on a detailed text prompt using the Flux model on Replicate. " "Specify 'prompt' and optionally other parameters like 'aspect_ratio'. " "Returns a string containing the URL(s) of the generated image(s)." 
================================================
FILE: core/utils/agent_utils.py
================================================
import os
from typing import Dict, Any, Optional, Literal
from langchain_core.messages import AIMessage, ToolMessage
import inspect

def log_agent_actions(state: Dict[str, Any]) -> None:
    """Log the agent's reasoning and actions.

    Prints the agent's reasoning, tool calls, and tool results to the console,
    which makes the agent's behavior easier to observe and debug.

    Args:
        state: A state dict containing the message history.
    """
    print("\n" + "=" * 50)
    print("Current state:")

    # Print the latest message
    if state.get("messages") and len(state["messages"]) > 0:
        latest_message = state["messages"][-1]
        if isinstance(latest_message, AIMessage):
            print(f"\nAI reasoning:")
            print(latest_message.content)
            # If there are tool calls, print their details
            if latest_message.tool_calls:
                print(f"\nTool calls:")
                for tool_call in latest_message.tool_calls:
                    print(f"- Tool: {tool_call['name']}")
                    print(f"- Args: {tool_call['args']}")
        elif isinstance(latest_message, ToolMessage):
            print(f"\nTool result:")
            print(f"- Tool: {latest_message.name}")
            # Print only the first 500 characters of the result to keep output short
            content = latest_message.content
            if len(content) > 500:
                content = content[:500] + "... (rest omitted)"
            print(f"- Result: {content}")
    print("=" * 50)

def save_agent_graph(
    agent,
    caller_file_path: Optional[str] = None,
    output_format: Literal["png", "svg", "mermaid"] = "png",
    custom_filename: Optional[str] = None,
    output_dir: Optional[str] = None
) -> str:
    """Render the agent's graph and save it to a directory.

    By default the output file name matches the caller's file name
    (without extension).

    Args:
        agent: The agent object; it must have a get_graph method.
        caller_file_path: The caller's file path; if None, it is taken from the call stack.
        output_format: "png", "svg", or "mermaid".
        custom_filename: Custom file name (without extension); used if provided.
        output_dir: Custom output directory; used if provided.

    Returns:
        str: The path of the saved graph.
    """
    # If no caller file path was provided, take it from the call stack
    if caller_file_path is None:
        # Grab the caller's stack frame
        frame = inspect.currentframe().f_back
        caller_file_path = frame.f_code.co_filename

    try:
        # Get the graph object
        graph = agent.get_graph()
    except AttributeError:
        raise ValueError("The provided agent object has no get_graph method")
    except Exception as e:
        raise RuntimeError(f"Error getting the graph: {str(e)}")

    # Determine the file name
    if custom_filename:
        file_name_without_ext = custom_filename
    else:
        # Current file name (without path and extension)
        current_file = os.path.basename(caller_file_path)
        file_name_without_ext = os.path.splitext(current_file)[0]

    # Determine the output directory
    if output_dir:
        graph_dir = output_dir
    else:
        # If the caller lives under the examples directory, use examples/graphs;
        # otherwise create a graphs subdirectory next to the caller
        if 'examples' in caller_file_path:
            base_dir = os.path.dirname(os.path.dirname(caller_file_path))
            graph_dir = os.path.join(base_dir, "examples", "graphs")
        else:
            graph_dir = os.path.join(os.path.dirname(caller_file_path), "graphs")

    # Make sure the graphs directory exists
    os.makedirs(graph_dir, exist_ok=True)

    # Generate the file for the requested output format
    try:
        if output_format == "png":
            image_data = graph.draw_mermaid_png()
            graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png")
            with open(graph_path, "wb") as f:
                f.write(image_data)
        elif output_format == "svg":
            image_data = graph.draw_mermaid_svg()
            graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.svg")
            with open(graph_path, "wb") as f:
                f.write(image_data)
        elif output_format == "mermaid":
            mermaid_code = graph.get_mermaid()
            graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.mmd")
            with open(graph_path, "w") as f:
                f.write(mermaid_code)
        else:
            raise ValueError(f"Unsupported output format: {output_format}")
    except Exception as e:
        raise RuntimeError(f"Error saving the graph: {str(e)}")

    print(f"Graph saved as {graph_path}")
    return graph_path

def visualize_agent(agent, **kwargs):
    """Convenience wrapper around save_agent_graph for quick visualization.

    Args:
        agent: The agent object.
        **kwargs: Additional arguments forwarded to save_agent_graph.

    Returns:
        str: The path of the saved graph.
    """
    # Grab the caller's stack frame
    frame = inspect.currentframe().f_back
    caller_file_path = frame.f_code.co_filename
    return save_agent_graph(agent, caller_file_path=caller_file_path, **kwargs)
(更多内容省略)" print(f"- 结果: {content}") print("=" * 50) def save_agent_graph( agent, caller_file_path: Optional[str] = None, output_format: Literal["png", "svg", "mermaid"] = "png", custom_filename: Optional[str] = None, output_dir: Optional[str] = None ) -> str: """保存Agent的图表到指定目录 这个函数用于生成Agent的图表并保存到指定目录, 默认情况下文件名与调用者的文件名保持一致(不含扩展名)。 Args: agent: Agent对象,必须有get_graph方法 caller_file_path: 调用者的文件路径,如果为None则使用调用栈获取 output_format: 输出格式,可选"png"、"svg"或"mermaid" custom_filename: 自定义文件名(不含扩展名),如果提供则使用此名称 output_dir: 自定义输出目录,如果提供则使用此目录 Returns: str: 保存的图表路径 """ # 如果没有提供调用者文件路径,则从调用栈获取 if caller_file_path is None: # 获取调用者的栈帧 frame = inspect.currentframe().f_back caller_file_path = frame.f_code.co_filename try: # 获取图对象 graph = agent.get_graph() except AttributeError: raise ValueError("提供的agent对象没有get_graph方法") except Exception as e: raise RuntimeError(f"获取图表时出错: {str(e)}") # 确定文件名 if custom_filename: file_name_without_ext = custom_filename else: # 获取当前文件名(不含路径和扩展名) current_file = os.path.basename(caller_file_path) file_name_without_ext = os.path.splitext(current_file)[0] # 确定输出目录 if output_dir: graph_dir = output_dir else: # 如果调用者在examples目录下,则使用examples/graphs # 否则在调用者所在目录创建graphs子目录 if 'examples' in caller_file_path: base_dir = os.path.dirname(os.path.dirname(caller_file_path)) graph_dir = os.path.join(base_dir, "examples", "graphs") else: graph_dir = os.path.join(os.path.dirname(caller_file_path), "graphs") # 确保graphs目录存在 os.makedirs(graph_dir, exist_ok=True) # 根据输出格式生成相应文件 try: if output_format == "png": image_data = graph.draw_mermaid_png() graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") with open(graph_path, "wb") as f: f.write(image_data) elif output_format == "svg": image_data = graph.draw_mermaid_svg() graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.svg") with open(graph_path, "wb") as f: f.write(image_data) elif output_format == "mermaid": mermaid_code = graph.get_mermaid() graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.mmd") with open(graph_path, "w") as f: f.write(mermaid_code) else: raise ValueError(f"不支持的输出格式: {output_format}") except Exception as e: raise RuntimeError(f"保存图表时出错: {str(e)}") print(f"图表已保存为 {graph_path}") return graph_path def visualize_agent(agent, **kwargs): """可视化Agent的快捷方法 这是save_agent_graph的简便包装,用于快速可视化Agent Args: agent: Agent对象 **kwargs: 传递给save_agent_graph的其他参数 Returns: str: 保存的图表路径 """ # 获取调用者的栈帧 frame = inspect.currentframe().f_back caller_file_path = frame.f_code.co_filename return save_agent_graph(agent, caller_file_path=caller_file_path, **kwargs) ================================================ FILE: core/utils/timezone.py ================================================ from datetime import datetime import os from typing import Optional from zoneinfo import ZoneInfo def get_timezone() -> str: """Get timezone from environment variable or use default. Returns: str: Timezone string (e.g. 'Asia/Shanghai') """ return os.getenv('TZ', 'UTC') def get_formatted_date(timezone: Optional[str] = None) -> str: """Get formatted date string with timezone awareness. Args: timezone: Optional timezone string. If not provided, uses TZ from env or UTC. Returns: str: Formatted date string (e.g. 'Today's Date: Mon, Jan 01, 2024') """ tz = ZoneInfo(timezone or get_timezone()) now = datetime.now(tz) return f"Today's Date: {now.strftime('%a, %b %d, %Y')}" def get_current_time(timezone: Optional[str] = None) -> datetime: """Get current time with timezone awareness. Args: timezone: Optional timezone string. 
================================================
FILE: examples/01_supervisor_test.py
================================================
from langgraph.prebuilt import create_react_agent
from core.agents.supervisor import create_supervisor
from langchain_openai import ChatOpenAI
from langgraph.func import entrypoint, task
from langgraph.graph import add_messages
from dotenv import load_dotenv
from core.utils.agent_utils import visualize_agent

load_dotenv()  # Automatically load the .env file

# 1. Initialize the LLM
model = ChatOpenAI(model="gpt-4o-mini")

##############################################################################
# Agent 1: Joke Generator (Functional API)
##############################################################################
@task
def generate_joke(messages):
    """Generate a short joke (no tool calls)."""
    system_message = {
        "role": "system",
        "content": "You are a witty comedian. Write a short joke."
    }
    # Call model.invoke directly, prepending the system_message to the user messages
    msg = model.invoke([system_message] + messages)
    return msg

@entrypoint()
def joke_agent(state):
    # Call the functional task defined above
    joke = generate_joke(state['messages']).result()
    # Append the result to the message list
    messages = add_messages(state["messages"], [joke])
    return {"messages": messages}

joke_agent.name = "joke_agent"

##############################################################################
# Agent 2: Research Expert (Graph API)
##############################################################################
def web_search(query: str) -> str:
    """Search the web for information. (Mocked data here)"""
    return (
        "Here are the headcounts for each of the FAANG companies in 2024:\n"
        "1. **Facebook (Meta)**: 67,317 employees.\n"
        "2. **Apple**: 164,000 employees.\n"
        "3. **Amazon**: 1,551,000 employees.\n"
        "4. **Netflix**: 14,000 employees.\n"
        "5. **Google (Alphabet)**: 181,269 employees."
    )

research_agent = create_react_agent(
    model=model,
    tools=[web_search],
    name="research_expert",
    # The prompt tells it that it is a research agent that may call web_search
    prompt=(
        "You are a world-class researcher. You have access to a 'web_search(query: str)' tool. "
        "Do not do any complicated math, just provide factual info from the web_search if needed."
    ),
)

##############################################################################
# Supervisor Workflow
##############################################################################
# Let the supervisor call joke_agent and research_expert over multiple turns
# within one conversation. The prompt tells it: if the user asks for "a joke
# first, then some research", call joke_agent first and then research_expert,
# so both agents run in sequence for a single user request.
# This is the simplest example and only demonstrates the basic usage of
# create_supervisor; the workflow is not wrapped as an Agent and has no
# planning capability.
workflow = create_supervisor(
    [research_agent, joke_agent],
    model=model,
    prompt=(
        "You are the overall supervisor. You manage two specialized agents:\n"
        "1) joke_agent: for telling jokes.\n"
        "2) research_expert: for factual or data-related questions.\n\n"
        "If the user wants a joke AND some research data in the same query, "
        "you MUST call joke_agent first, get the joke, then call research_expert for the data. "
        "After both calls, provide a final combined response. "
        "Do not call more than one agent in a single LLM message; do it step by step."
), ) # 编译得到一个可调用的"App" agent = workflow.compile() # 保存为一个可视化的图 # visualize_agent(agent) ############################################################################## # 测试:单个用户请求想要 "先讲笑话,再查Apple的2024年人数" 并合并结果 ############################################################################## result = agent.invoke({ "messages": [ { "role": "user", "content": ( "Hi! I'd like to start with a short joke to lighten the mood, " "then please check Apple's headcount in 2024. Summarize both." ) } ] }) ############################################################################## # 打印最终对话消息 ############################################################################## for m in result["messages"]: m.pretty_print() ================================================ FILE: examples/02_supervisor_agent_test.py ================================================ from langgraph.prebuilt import create_react_agent from core.agents.base.react_agent import ReactAgent from core.agents.react_supervisor_agent import SupervisorAgent from langchain_openai import ChatOpenAI from langgraph.func import entrypoint, task from langgraph.graph import add_messages from dotenv import load_dotenv load_dotenv() # 自动加载 .env 文件 # 1. 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # Agent 1: Joke Generator (Functional API) ############################################################################## @task def generate_joke(messages): """Generate a short joke (no tool calls).""" system_message = { "role": "system", "content": "You are a witty comedian. Write a short joke." } # 直接调用 model.invoke,拼接 system_message + 用户消息 msg = model.invoke([system_message] + messages) return msg @entrypoint() def joke_agent(state): # 调用上面的函数型任务 joke = generate_joke(state['messages']).result() # 将产物插入消息列表 messages = add_messages(state["messages"], [joke]) return {"messages": messages} joke_agent.name = "joke_agent" ############################################################################## # Agent 2: Research Expert (Graph API) ############################################################################## def web_search(query: str) -> str: """Search the web for information. (Mocked data here)""" return ( "Here are the headcounts for each of the FAANG companies in 2024:\n" "1. **Facebook (Meta)**: 67,317 employees.\n" "2. **Apple**: 164,000 employees.\n" "3. **Amazon**: 1,551,000 employees.\n" "4. **Netflix**: 14,000 employees.\n" "5. **Google (Alphabet)**: 181,269 employees." ) # research_agent = create_react_agent( # model=model, # tools=[web_search], # name="research_expert", # # Prompt 告诉它是一个研究型 Agent,可调用 web_search # prompt=( # "You are a world-class researcher. You have access to a 'web_search(query: str)' tool. " # "Do not do any complicated math, just provide factual info from the web_search if needed." # ), # ) research_agent = ReactAgent( model=model, tools=[web_search], name="research_expert", # Prompt 告诉它是一个研究型 Agent,可调用 web_search prompt=( "You are a world-class researcher. You have access to a 'web_search(query: str)' tool. " "Do not do any complicated math, just provide factual info from the web_search if needed." ), ) ############################################################################## # 使用 SupervisorAgent 类替代直接调用 create_supervisor 函数 ############################################################################## # 创建 SupervisorAgent 实例 supervisor = SupervisorAgent( agents=[research_agent], model=model, # prompt=( # "You are the overall supervisor. 
You manage two specialized agents:\n" # "1) joke_agent: for telling jokes.\n" # "2) research_expert: for factual or data-related questions.\n\n" # "If the user wants a joke AND some research data in the same query, " # "you MUST call joke_agent first, get the joke, then call research_expert for the data. " # "After both calls, provide a final combined response. " # "Do not call more than one agent in a single LLM message; do it step by step." # ), ) ############################################################################## # 测试:单个用户请求想要 "先讲笑话,再查Apple的2024年人数" 并合并结果 ############################################################################## result = supervisor.invoke({ "messages": [ { "role": "user", "content": ( "Hi! I'd like to start with a short joke to lighten the mood, " "then please check Apple's headcount in 2024. Summarize both." ) } ] }) ############################################################################## # 打印最终对话消息 ############################################################################## for m in result["messages"]: m.pretty_print() ================================================ FILE: examples/03_tavily_tools_test.py ================================================ import os from langgraph.prebuilt import create_react_agent from core.agents.react_supervisor_agent import SupervisorAgent from langchain_openai import ChatOpenAI from langgraph.func import entrypoint, task from langgraph.graph import add_messages from langchain_community.tools import TavilySearchResults from dotenv import load_dotenv load_dotenv() # 自动加载 .env 文件 # 1. 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # Agent 1: Joke Generator (Functional API) ############################################################################## @task def generate_joke(messages): """Generate a short joke (no tool calls).""" system_message = { "role": "system", "content": "You are a witty comedian. Write a short joke." } # 直接调用 model.invoke,拼接 system_message + 用户消息 msg = model.invoke([system_message] + messages) return msg @entrypoint() def joke_agent(state): # 调用上面的函数型任务 joke = generate_joke(state['messages']).result() # 将产物插入消息列表 messages = add_messages(state["messages"], [joke]) return {"messages": messages} joke_agent.name = "joke_agent" ############################################################################## # Agent 2: Research Expert with Tavily Search (Graph API) ############################################################################## # 创建Tavily搜索工具 tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=False, include_images=False, search_depth="advanced" ) research_agent = create_react_agent( model=model, tools=[tavily_search], name="research_expert", # Prompt 告诉它是一个研究型 Agent,可调用 tavily_search prompt=( "You are a world-class researcher. You have access to the 'tavily_search_results_json' tool " "which can search the web for real-time information. " "When asked a question, use this tool to find accurate and up-to-date information. " "Summarize the search results in a clear and concise manner. " "Always cite your sources by including the URLs from the search results." 
), ) ############################################################################## # 使用 SupervisorAgent 类来协调多个智能体 ############################################################################## # 创建 SupervisorAgent 实例 supervisor = SupervisorAgent( agents=[research_agent, joke_agent], model=model, prompt=( "You are the overall supervisor. You manage two specialized agents:\n" "1) joke_agent: for telling jokes.\n" "2) research_expert: for factual or data-related questions using real-time web search.\n\n" "If the user wants a joke, call joke_agent.\n" "If the user wants factual information or research data, call research_expert.\n" "If the user wants a joke AND some research data in the same query, " "you MUST call joke_agent first, get the joke, then call research_expert for the data. " "After both calls, provide a final combined response. " "Do not call more than one agent in a single LLM message; do it step by step." ), ) # 编译得到一个可调用的"App" app = supervisor.compile() # # 获取当前文件名(不含路径和扩展名) # current_file = os.path.basename(__file__) # file_name_without_ext = os.path.splitext(current_file)[0] # graph_dir = os.path.join(os.path.dirname(__file__), "graphs") # # 确保 graphs 目录存在 # os.makedirs(graph_dir, exist_ok=True) # # 生成与文件名一致的图片名,并保存到 examples/graphs 目录 # image_data = app.get_graph().draw_mermaid_png() # graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") # # 保存图片(如果已存在则覆盖) # with open(graph_path, "wb") as f: # f.write(image_data) # print(f"Image saved as {graph_path}") # 使用示例 if __name__ == "__main__": # 示例1:只询问笑话 result1 = app.invoke({"messages": [{"role": "user", "content": "讲个笑话"}]}) print("\n示例1 - 只询问笑话:") for message in result1["messages"]: message.pretty_print() # 示例2:只询问研究数据 result2 = app.invoke({"messages": [{"role": "user", "content": "谁是现任美国总统?"}]}) print("\n示例2 - 只询问研究数据:") for message in result2["messages"]: message.pretty_print() # 示例3:同时询问笑话和研究数据 result3 = app.invoke({"messages": [{"role": "user", "content": "讲个关于人工智能的笑话,然后告诉我什么是大型语言模型"}]}) print("\n示例3 - 同时询问笑话和研究数据:") for message in result3["messages"]: message.pretty_print() ================================================ FILE: examples/04_react_agent_test.py ================================================ import os import json from langgraph.prebuilt import create_react_agent from langchain_openai import ChatOpenAI from langchain_community.tools import TavilySearchResults from typing import Dict, Any from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from dotenv import load_dotenv from core.utils.agent_utils import log_agent_actions, save_agent_graph load_dotenv() # 自动加载 .env 文件 # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # 创建Tavily搜索工具 - 配置为深度搜索模式 ############################################################################## tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=True, # 包含原始内容,便于分析 include_images=False, search_depth="advanced" # 使用高级搜索深度 ) ############################################################################## # 创建REACT Agent - 使用更详细的提示词引导多步思考 ############################################################################## react_agent = create_react_agent( model=model, tools=[tavily_search], name="tesla_research_expert", # 提示词强调分解问题、多步思考和综合信息 prompt=( "你是一位专业的研究分析师,擅长分析复杂问题并提供深入见解。\n" "你有一个强大的工具'tavily_search_results_json'可以搜索网络获取实时信息。\n\n" "当面对复杂问题时,请遵循以下REACT方法论:\n" "1. 分解问题:将复杂问题分解为更小的子问题\n" "2. 制定计划:确定需要搜索哪些信息,以及搜索的顺序\n" "3. 
执行搜索:使用tavily_search_results_json工具执行搜索\n" "4. 分析结果:分析搜索结果,确定是否需要进一步搜索\n" "5. 综合信息:将所有搜索结果综合成一个连贯的回答\n\n" "重要提示:\n" "- 不要一次性搜索过于宽泛的问题\n" "- 对于复杂问题,进行多次有针对性的搜索\n" "- 每次搜索后评估结果,决定下一步行动\n" "- 在最终回答中引用来源,包括搜索结果中的URL\n" "- 清晰地展示你的思考过程,包括问题分解和计划制定\n" ), ) # 保存Agent图表 # save_agent_graph(react_agent) ############################################################################## # 测试:查询"特斯拉2025年的发展预期" ############################################################################## if __name__ == "__main__": # 复杂查询测试 print("\n开始测试REACT Agent处理复杂查询的能力...\n") print("查询: 特斯拉2025年的发展预期") # 定义输入 inputs = { "messages": [ {"role": "user", "content": "分析特斯拉2025年的发展预期,包括新车型计划、销量目标、技术创新和市场扩张战略。"} ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in react_agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用原有的log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print("\n最终回答:") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: message.pretty_print() ================================================ FILE: examples/05_react_agent_user_input.py ================================================ import asyncio import os from typing import Dict, Any from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from core.agents.base.react_agent import ReactAgent from langchain_community.tools import TavilySearchResults from dotenv import load_dotenv load_dotenv() # 自动加载 .env 文件 # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # 创建一个记录Agent思考过程的函数 ############################################################################## def log_agent_actions(state: Dict[str, Any]) -> None: """记录Agent的思考过程和行动""" print("\n" + "=" * 50) print("当前状态:") # 打印最新消息 if state.get("messages") and len(state["messages"]) > 0: latest_message = state["messages"][-1] if isinstance(latest_message, AIMessage): print(f"\nAI思考过程:") print(latest_message.content) # 如果有工具调用,打印工具调用信息 if latest_message.tool_calls: print(f"\n工具调用:") for tool_call in latest_message.tool_calls: print(f"- 工具: {tool_call['name']}") print(f"- 参数: {tool_call['args']}") elif isinstance(latest_message, ToolMessage): print(f"\n工具返回结果:") print(f"- 工具: {latest_message.name}") # 只打印结果的前200个字符,避免输出过长 content = latest_message.content if len(content) > 200: content = content[:200] + "... (更多内容省略)" print(f"- 结果: {content}") print("=" * 50) ############################################################################## # 创建Tavily搜索工具 - 配置为深度搜索模式 ############################################################################## tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=True, # 包含原始内容,便于分析 include_images=False, search_depth="advanced" # 使用高级搜索深度 ) ############################################################################## # 创建ReactAgent实例 ############################################################################## def create_react_agent_instance(): """创建并返回ReactAgent实例""" react_agent = ReactAgent( model=model, tools=[tavily_search], name="research_assistant", # 提示词强调分解问题、多步思考和综合信息 prompt=( "你是一位专业的研究分析师,擅长分析复杂问题并提供深入见解。\n" "你有一个强大的工具'tavily_search_results_json'可以搜索网络获取实时信息。\n\n" "当面对复杂问题时,请遵循以下REACT方法论:\n" "1. 
分解问题:将复杂问题分解为更小的子问题\n" "2. 制定计划:确定需要搜索哪些信息,以及搜索的顺序\n" "3. 执行搜索:使用tavily_search_results_json工具执行搜索\n" "4. 分析结果:分析搜索结果,确定是否需要进一步搜索\n" "5. 综合信息:将所有搜索结果综合成一个连贯的回答\n\n" "重要提示:\n" "- 不要一次性搜索过于宽泛的问题\n" "- 对于复杂问题,进行多次有针对性的搜索\n" "- 每次搜索后评估结果,决定下一步行动\n" "- 在最终回答中引用来源,包括搜索结果中的URL\n" "- 清晰地展示你的思考过程,包括问题分解和计划制定\n" ), ) # 获取图对象并保存 agent = react_agent.compile() return agent ############################################################################## # 主函数 - 处理用户输入 ############################################################################## async def main(): # 创建ReactAgent实例 react_agent = create_react_agent_instance() while True: # 获取用户输入 user_input = await asyncio.to_thread(input, "\n请输入您想了解的问题 (输入'退出'结束): ") # 检查是否退出 if user_input.lower() in ['退出', 'exit', 'quit']: print("\n感谢使用,再见!") break # 准备初始状态 initial_state = { "messages": [HumanMessage(content=user_input)] } try: print("\n=== 🔍 开始研究 ===\n") # 使用stream方法逐步获取中间状态 final_state = None for partial_state in react_agent.stream(initial_state, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print("\n最终回答:") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print("\n" + "=" * 80) print(message.content) print("=" * 80 + "\n") except Exception as e: print(f"\n处理查询时出错: {e}") ############################################################################## # 程序入口 ############################################################################## if __name__ == "__main__": print("\n欢迎使用ReactAgent研究助手!") print("这个助手可以帮助您研究各种问题,使用Tavily搜索工具获取最新信息。") print("您可以输入任何问题,助手将使用REACT方法论进行分析和回答。") # 运行主函数 asyncio.run(main()) ================================================ FILE: examples/06_web_extraction_tools_test.py ================================================ import os import sys from langgraph.prebuilt import create_react_agent from langchain_openai import ChatOpenAI import json from typing import Dict, Any from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from dotenv import load_dotenv from langchain_community.tools import JinaSearch from core.tools.firecrawl_tool import FireCrawlTool load_dotenv() # 自动加载 .env 文件 # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # 创建一个记录Agent思考过程的函数 ############################################################################## def log_agent_actions(state: Dict[str, Any]) -> None: """记录Agent的思考过程和行动""" print("\n" + "=" * 50) print("当前状态:") # 打印最新消息 if state.get("messages") and len(state["messages"]) > 0: latest_message = state["messages"][-1] if isinstance(latest_message, AIMessage): print(f"\nAI思考过程:") print(latest_message.content) # 如果有工具调用,打印工具调用信息 if latest_message.tool_calls: print(f"\n工具调用:") for tool_call in latest_message.tool_calls: print(f"- 工具: {tool_call['name']}") print(f"- 参数: {tool_call['args']}") elif isinstance(latest_message, ToolMessage): print(f"\n工具返回结果:") print(f"- 工具: {latest_message.name}") # 只打印结果的前200个字符,避免输出过长 content = latest_message.content if len(content) > 300: content = content[:300] + "... 
(更多内容省略)" print(f"- 结果: {content}") print("=" * 50) ############################################################################## # 创建Web提取工具 - FireCrawl用于网站结构,Jina用于内容提取 ############################################################################## # 创建FireCrawl工具 - 用于网站结构分析 firecrawl_tool = FireCrawlTool( mode="crawl", # 使用爬取模式 params={"max_pages": 10} # 限制爬取页面数量 ) # 创建Jina Reader工具 - 用于内容提取 jina_reader_tool = JinaSearch() ############################################################################## # 创建REACT Agent - 使用更详细的提示词引导多步思考 ############################################################################## react_agent = create_react_agent( model=model, tools=[firecrawl_tool, jina_reader_tool], name="web_extraction_expert", # 提示词强调分解问题、多步思考和综合信息 prompt=( "你是一位专业的网页内容分析专家,擅长提取和分析网站结构与内容。\n" "你有两个强大的工具:\n" "1. 'firecrawl_tool': 用于爬取网站结构和下级页面\n" "2. 'jina_reader_tool': 用于从特定URL提取结构化内容,获取干净可读的内容\n\n" "当面对网站分析任务时,请遵循以下方法论:\n" "1. 分析任务: 明确需要从网站获取什么信息\n" "2. 网站结构分析: 使用firecrawl_tool爬取网站结构,了解可用页面\n" "3. 内容提取: 根据网站结构,使用jina_reader_tool从关键页面提取内容\n" "4. 信息整合: 将提取的内容整合成有条理的分析结果\n\n" "重要提示:\n" "- 先使用firecrawl_tool了解网站结构,再使用jina_reader_tool提取具体内容\n" "- 对于大型网站,先分析网站结构,再有针对性地选择重要页面进行内容提取\n" "- 每次工具使用后评估结果,决定下一步行动\n" "- 在最终回答中提供结构化的分析,包括网站组织方式和关键内容摘要\n" "- 清晰地展示你的思考过程,包括为什么选择特定页面进行分析\n" ), ) ############################################################################## # 测试:分析LangGraph文档网站 ############################################################################## if __name__ == "__main__": # 测试网站分析 print("\n开始测试Web提取Agent分析网站的能力...\n") print("分析目标: LangGraph文档网站") # 定义输入 inputs = { "messages": [ {"role": "user", "content": "爬取LangGraph文档网站的每个章节的内容(https://langchain-ai.github.io/langgraph/how-tos/) "} ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in react_agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用原有的log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print("\n最终分析结果:") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: message.pretty_print() ================================================ FILE: examples/07_web_extraction_with_filesystem.py ================================================ import os import sys import json import asyncio from datetime import datetime from typing import Dict, Any, List from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from langchain_community.agent_toolkits import FileManagementToolkit from langgraph.prebuilt import create_react_agent from langgraph.checkpoint.memory import MemorySaver from dotenv import load_dotenv from langchain_community.tools import TavilySearchResults from core.agents.react_supervisor_agent import SupervisorAgent load_dotenv() # 自动加载 .env 文件 # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # 创建一个记录Agent思考过程的函数 ############################################################################## def log_agent_actions(state: Dict[str, Any]) -> None: """记录Agent的思考过程和行动""" print("\n" + "=" * 50) print("当前状态:") # 打印最新消息 if state.get("messages") and len(state["messages"]) > 0: latest_message = state["messages"][-1] if isinstance(latest_message, AIMessage): print(f"\nAI思考过程:") # 限制内容长度,避免过长输出 content = 
latest_message.content if len(content) > 500: content = content[:250] + "\n... (内容过长,已截断) ...\n" + content[-250:] print(content) # 如果有工具调用,打印工具调用信息 if latest_message.tool_calls: print(f"\n工具调用:") for tool_call in latest_message.tool_calls: print(f"- 工具: {tool_call['name']}") # 限制参数输出长度 args = str(tool_call['args']) if len(args) > 100: args = args[:100] + "... (参数过长,已截断)" print(f"- 参数: {args}") elif isinstance(latest_message, ToolMessage): print(f"\n工具返回结果:") print(f"- 工具: {latest_message.name}") # 只打印结果的前200个字符,避免输出过长 content = latest_message.content if len(content) > 200: content = content[:100] + "\n... (更多内容省略) ...\n" + content[-100:] print(f"- 结果: {content}") print("=" * 50) ############################################################################## # 创建Web提取工具 ############################################################################## # 创建Tavily搜索工具 tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=False, include_images=False, search_depth="advanced" ) ############################################################################## # 创建文件系统工具 - 用于保存提取的内容 ############################################################################## # 设置文件系统工具的根目录为examples/output output_dir = os.path.join(os.path.dirname(__file__), "output") os.makedirs(output_dir, exist_ok=True) # 创建文件系统工具集 filesystem_toolkit = FileManagementToolkit( root_dir=output_dir, selected_tools=["write_file", "read_file", "list_directory"] ) # 获取文件系统工具 filesystem_tools = filesystem_toolkit.get_tools() ############################################################################## # 创建Research Agent - 用于网站内容提取 ############################################################################## research_agent = create_react_agent( model=model, tools=[tavily_search], name="research_agent", # 提示词强调分解问题、多步思考和综合信息 prompt=( "You are a world-class researcher. You have access to the 'tavily_search_results_json' tool " "which can search the web for real-time information. " "When asked a question, use this tool to find accurate and up-to-date information. " "Summarize the search results in a clear and concise manner. " "Always cite your sources by including the URLs from the search results." ), debug=False) ############################################################################## # 创建FileSystem Agent - 用于保存提取的内容 ############################################################################## filesystem_agent = create_react_agent( model=model, tools=filesystem_tools, name="filesystem_agent", # 提示词强调文件操作和内容保存 prompt=( "你是一位专业的文件系统管理专家,负责将网页内容保存到本地文件系统。\n" "你有以下工具可以使用:\n" "1. 'write_file': 用于将内容写入文件\n" "2. 'read_file': 用于读取文件内容\n" "3. 'list_directory': 用于列出目录内容\n\n" "当接收到保存内容的请求时,请遵循以下方法论:\n" "1. 分析内容: 确定内容的类型和结构\n" "2. 确定文件名: 根据内容类型和来源创建合适的文件名\n" "3. 保存内容: 使用write_file工具将内容保存到文件中\n" "4. 验证保存: 使用read_file或list_directory工具验证内容已正确保存\n\n" "重要提示:\n" "- 为文件创建有意义的名称,包含日期和内容描述\n" "- 对于结构化数据,优先使用JSON格式保存\n" "- 对于文本内容,使用TXT或MD格式保存\n" "- 确保文件名不包含非法字符\n" "- 在保存前,检查是否已存在同名文件,避免覆盖重要内容\n" ), ) ############################################################################## # 创建Supervisor Agent - 协调Research Agent和FileSystem Agent ############################################################################## # 创建内存存储器用于保存对话状态 memory_saver = MemorySaver() supervisor = SupervisorAgent( agents=[research_agent, filesystem_agent], model=model, prompt=( "你是一个智能助手的总协调者,负责管理两个专业智能体:\n" "1) research_agent: 网页内容分析专家,可以爬取和分析网站内容\n" "2) filesystem_agent: 文件系统管理专家,可以将内容保存到本地文件系统\n\n" "你的工作流程如下:\n" "1. 
分析用户请求,确定是需要网页内容提取还是文件操作,或两者都需要\n" "2. 如果需要网页内容提取,调用research_agent获取网页内容\n" "3. 如果需要将提取的内容保存到文件,调用filesystem_agent进行保存\n" "4. 如果用户同时需要提取内容并保存,先调用research_agent获取内容,再调用filesystem_agent保存内容\n\n" "重要规则:\n" "- 不要在一个消息中同时调用多个智能体,必须一步一步来\n" "- 当调用filesystem_agent保存内容时,必须提供完整的内容和建议的文件名\n" "- 确保在最终回复中告知用户内容已成功提取和/或保存\n" "- 如果用户只想提取内容而不保存,只调用research_agent\n" "- 如果用户只想操作文件而不提取新内容,只调用filesystem_agent\n\n" "上下文管理指南:\n" "- 当处理大型网站或多个页面时,指导research_agent采用分批处理策略\n" "- 对于大型内容提取任务,先让research_agent获取网站结构,再逐步处理各个页面\n" "- 当发现research_agent返回的内容过大时,指导它进行内容摘要或分批处理\n" "- 如果research_agent一次性尝试处理过多页面导致上下文超限,指导它减少并行处理的页面数量\n" "- 对于需要保存的大型内容,考虑将其分割成多个小文件,而不是一个大文件\n" "- 在处理多页面内容时,可以采用先保存再处理的策略,减轻上下文负担\n" ), checkpointer=memory_saver ) # 编译得到一个可调用的"App",添加checkpointer实现记忆功能 app = supervisor.compile() # # 获取当前文件名(不含路径和扩展名) # current_file = os.path.basename(__file__) # file_name_without_ext = os.path.splitext(current_file)[0] # graph_dir = os.path.join(os.path.dirname(__file__), "graphs") # # 确保 graphs 目录存在 # os.makedirs(graph_dir, exist_ok=True) # # 生成与文件名一致的图片名,并保存到 examples/graphs 目录 # image_data = app.get_graph().draw_mermaid_png() # graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") # # 保存图片(如果已存在则覆盖) # with open(graph_path, "wb") as f: # f.write(image_data) # print(f"图表已保存为 {graph_path}") ############################################################################## # 主函数 - 处理用户输入 ############################################################################## async def main(): # 创建一个固定的thread_id用于保持对话上下文 thread_id = "user_session_1" # 创建配置对象,包含thread_id config = {"configurable": {"thread_id": thread_id}} print("\n当前会话ID:", thread_id) print("(所有对话将在同一会话中保持上下文记忆)") while True: # 获取用户输入 user_input = await asyncio.to_thread(input, "\n请输入您想了解的问题 (输入'退出'结束): ") # 检查是否退出 if user_input.lower() in ['退出', 'exit', 'quit']: print("\n感谢使用,再见!") break # 准备初始状态 - 只包含当前用户消息 initial_state = { "messages": [HumanMessage(content=user_input)] } try: print("\n=== 🔍 开始研究 ===\n") # 使用stream方法逐步获取中间状态,传入config以使用相同的thread_id for partial_state in app.stream(initial_state, config, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) except Exception as e: print(f"\n处理查询时出错: {e}") print("可能是由于上下文长度超出限制,请尝试减少查询范围或使用'批处理大小设置为X'命令调整批处理大小(1-5之间)") ############################################################################## # 程序入口 ############################################################################## if __name__ == "__main__": print("\n欢迎使用具有记忆功能的网页爬取助手!") print("本助手可以记住您之前的对话内容,实现连续对话体验。") print("您可以询问之前提到过的内容,助手会根据上下文理解您的问题。") # 运行主函数 asyncio.run(main()) ================================================ FILE: examples/08_react_agent_tool_registry_test.py ================================================ import os import sys import json from typing import Dict, Any, List from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from langchain_community.tools import JinaSearch, WikipediaQueryRun from langchain_community.utilities import WikipediaAPIWrapper from dotenv import load_dotenv from core.agents.base.react_agent import ReactAgent from core.tools import register_direct_tool from core.tools.registry import get_registered_tools, ToolCategory from core.tools.firecrawl_tool import FireCrawlTool load_dotenv() # 自动加载 .env 文件 
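##############################################################################
# Editor's note: sketch of the registry flow exercised below
##############################################################################
# A minimal, illustrative sketch of how this script drives the tool registry.
# It is never called; it relies only on names imported above plus
# get_tools_by_category/ToolCategory (imported locally here), and the exact
# registered tool names shown in the print are whatever the registry assigns.
def _registry_usage_sketch():
    # Register concrete tool instances with the shared registry.
    register_direct_tool(JinaSearch())
    register_direct_tool(FireCrawlTool())
    # Inspect everything registered so far, keyed by tool name.
    for name, info in get_registered_tools(as_dict=True).items():
        print(f"- {name} ({info['category'].value})")
    # Hand an agent only the search-category tools.
    from core.tools.registry import get_tools_by_category, ToolCategory
    return get_tools_by_category(ToolCategory.SEARCH)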
############################################################################## # 工具注册和ReactAgent测试 - 美联储研究任务 ############################################################################## def print_separator(title): """打印分隔符""" print("\n" + "=" * 80) print(f" {title} ".center(80, "=")) print("=" * 80) ############################################################################## # 创建一个记录Agent思考过程的函数 ############################################################################## def log_agent_actions(state: Dict[str, Any]) -> None: """记录Agent的思考过程和行动""" print("\n" + "-" * 50) print("当前状态:") # 打印最新消息 if state.get("messages") and len(state["messages"]) > 0: latest_message = state["messages"][-1] if isinstance(latest_message, AIMessage): print(f"\nAI思考过程:") print(latest_message.content) # 如果有工具调用,打印工具调用信息 if latest_message.tool_calls: print(f"\n工具调用:") for tool_call in latest_message.tool_calls: print(f"- 工具: {tool_call['name']}") print(f"- 参数: {tool_call['args']}") elif isinstance(latest_message, ToolMessage): print(f"\n工具返回结果:") print(f"- 工具: {latest_message.name}") # 只打印结果的前200个字符,避免输出过长 content = latest_message.content if len(content) > 200: content = content[:200] + "... (更多内容省略)" print(f"- 结果: {content}") print("-" * 50) ############################################################################## # 注册工具 ############################################################################## print_separator("注册搜索工具") # 创建JinaSearch工具实例 jina_search = JinaSearch() # 创建Wikipedia工具实例 # wiki_tool = WikipediaQueryRun(api_wrapper=WikipediaAPIWrapper()) firecrawl_tool = FireCrawlTool() # 使用register_direct_tool函数注册工具 register_direct_tool(jina_search) register_direct_tool(firecrawl_tool) # 注册自定义工具 - FireCrawlTool # 获取所有已注册的工具(以字典格式) registered_tools = get_registered_tools(as_dict=True) # 打印所有已注册的工具 print("\n已注册的工具:") for name, info in registered_tools.items(): print(f"- {name} (类别: {info['category'].value})") ############################################################################## # 创建ReactAgent实例 ############################################################################## print_separator("创建ReactAgent实例") # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") # 从注册表中只获取搜索类工具列表 from core.tools.registry import get_tools_by_category, ToolCategory tools_list = get_tools_by_category(ToolCategory.SEARCH) # 创建ReactAgent实例 react_agent = ReactAgent( model=model, tools=tools_list, name="fed_research_agent", # 提示词强调分解问题、多步思考和综合信息 prompt=( "你是一位专业的经济研究分析师,擅长分析复杂的经济问题并提供深入见解。\n" "你有多个强大的工具可以搜索网络获取实时信息:\n" "当面对复杂问题时,请遵循以下方法论:\n" "1. 分解问题:将复杂问题分解为更小的子问题\n" "2. 制定计划:确定需要搜索哪些信息,以及使用哪些工具\n" "3. 执行搜索:使用适当的工具执行搜索\n" "4. 分析结果:分析搜索结果,确定是否需要进一步搜索\n" "5. 
综合信息:将所有搜索结果综合成一个连贯的回答\n\n" "重要提示:\n" "- 每次搜索后评估结果,决定下一步行动\n" "- 在最终回答中引用来源\n" "- 清晰地展示你的思考过程,包括问题分解和计划制定\n" ), ) # agent = react_agent.compile() # 获取图对象 # graph = agent.get_graph() # # 获取当前文件名(不含路径和扩展名) # current_file = os.path.basename(__file__) # file_name_without_ext = os.path.splitext(current_file)[0] # graph_dir = os.path.join(os.path.dirname(__file__), "graphs") # # 确保 graphs 目录存在 # os.makedirs(graph_dir, exist_ok=True) # # 生成与文件名一致的图片名,并保存到 examples/graphs 目录 # image_data = graph.draw_mermaid_png() # graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") # # 保存图片(如果已存在则覆盖) # with open(graph_path, "wb") as f: # f.write(image_data) # print(f"工作流图已保存为 {graph_path}") ############################################################################## # 测试:查询"美联储的详细介绍和它如何影响全球经济" ############################################################################## if __name__ == "__main__": print_separator("开始测试ReactAgent处理美联储研究任务") print("\n查询: 美联储的详细介绍和它如何影响全球经济") # 定义输入 inputs = { "messages": [ HumanMessage(content="请提供2025年美联储(Federal Reserve)的详细介绍,包括其历史、结构、职能,以及它如何通过货币政策影响全球经济。") ] } result = react_agent.run(inputs) ############################################################################## # 打印最终对话消息 ############################################################################## for m in result["messages"]: m.pretty_print() ================================================ FILE: examples/09_e2b_code_interpreter_test.py ================================================ import os import sys import json from typing import Dict, Any, List from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from dotenv import load_dotenv from core.agents.base.react_agent import ReactAgent from core.tools.registry import get_registered_tools, ToolCategory, get_tools_by_category from core.tools.e2b_tool import E2BCodeInterpreterTool load_dotenv() # 自动加载 .env 文件 ############################################################################## # E2B代码解释器工具测试 ############################################################################## def print_separator(title): """打印分隔符""" print("\n" + "=" * 80) print(f" {title} ".center(80, "=")) print("=" * 80) ############################################################################## # 检查E2B代码解释器工具是否已注册 ############################################################################## print_separator("检查E2B代码解释器工具是否已注册") # 获取所有已注册的工具(以字典格式) registered_tools = get_registered_tools(as_dict=True) # 打印所有已注册的工具 print("\n已注册的工具:") for name, info in registered_tools.items(): print(f"- {name} (类别: {info['category'].value})") # 检查E2B代码解释器工具是否已注册 e2b_tool_name = "e2b_code_interpreter" if e2b_tool_name in registered_tools: print(f"\nE2B代码解释器工具已成功注册: {e2b_tool_name}") else: print(f"\n警告: E2B代码解释器工具未注册") # 手动注册E2B代码解释器工具 print("尝试手动注册E2B代码解释器工具...") try: from core.tools.registry import register_tool e2b_tool = E2BCodeInterpreterTool() register_tool(e2b_tool, ToolCategory.CODE_INTERPRETER) print(f"已手动注册工具: {e2b_tool.name}") except Exception as e: print(f"手动注册E2B代码解释器工具失败: {e}") ############################################################################## # 创建ReactAgent实例 ############################################################################## print_separator("创建ReactAgent实例") # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") # 从注册表中只获取代码解释器类工具列表 tools_list = get_tools_by_category(ToolCategory.CODE_INTERPRETER) # 打印获取到的代码解释器工具 print("\n获取到的代码解释器工具:") for tool in tools_list: print(f"- {tool.name}: {tool.description}") # 
创建ReactAgent实例 react_agent = ReactAgent( model=model, tools=tools_list, name="code_interpreter_agent", # 提示词强调使用代码解释器工具进行数据分析和可视化 prompt=( "你是一位专业的数据分析师和编程助手,擅长使用Python进行数据分析和可视化。\n" "你有多个强大的代码执行工具可以使用:\n" "- e2b_code_interpreter: 用于执行Python代码,支持数据分析和可视化\n" "当面对编程和数据分析问题时,请遵循以下方法论:\n" "1. 分析问题:理解用户的需求和问题本质\n" "2. 制定计划:确定解决方案和需要使用的工具\n" "3. 编写代码:使用适当的工具编写和执行代码\n" "4. 分析结果:解释代码执行结果,提供见解\n" "5. 优化方案:如有必要,优化代码或提供改进建议\n\n" "重要提示:\n" "- 优先使用e2b_code_interpreter工具执行Python代码\n" "- 对于数据分析和可视化任务,确保导入必要的库(如pandas, matplotlib, numpy等)\n" "- 对于不存在的库,工具会自动尝试使用pip install进行安装\n" "- 在代码中添加详细注释,解释关键步骤\n" "- 执行代码后,解释结果含义和见解\n" ), ) # 编译Agent agent = react_agent.compile() # # 获取图对象 # graph = agent.get_graph() # # 获取当前文件名(不含路径和扩展名) # current_file = os.path.basename(__file__) # file_name_without_ext = os.path.splitext(current_file)[0] # graph_dir = os.path.join(os.path.dirname(__file__), "graphs") # # 确保 graphs 目录存在 # os.makedirs(graph_dir, exist_ok=True) # # 生成与文件名一致的图片名,并保存到 examples/graphs 目录 # image_data = graph.draw_mermaid_png() # graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") # # 保存图片(如果已存在则覆盖) # with open(graph_path, "wb") as f: # f.write(image_data) # print(f"工作流图已保存为 {graph_path}") ############################################################################## # 测试:使用E2B代码解释器执行简单的数据分析任务 ############################################################################## if __name__ == "__main__": print_separator("开始测试ReactAgent使用E2B代码解释器") print("\n查询: 使用Python生成一个简单的正弦波图形") # 定义输入 inputs = { "messages": [ HumanMessage(content="使用Python生成一个简单的正弦波图形,如果有找不到的模块,需要自动安装") ] } result = agent.invoke(inputs) for m in result["messages"]: m.pretty_print() ================================================ FILE: examples/10_financial_data_analysis.py ================================================ import os import sys import json from typing import Dict, Any, List from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from dotenv import load_dotenv from core.agents.base.react_agent import ReactAgent from core.tools.registry import get_registered_tools, ToolCategory, get_tools_by_category from core.tools.e2b_tool import E2BCodeInterpreterTool load_dotenv() # 自动加载 .env 文件 ############################################################################## # 财务数据分析报表生成示例 ############################################################################## def print_separator(title): """打印分隔符""" print("\n" + "=" * 80) print(f" {title} ".center(80, "=")) print("=" * 80) ############################################################################## # 创建一个记录Agent思考过程的函数 ############################################################################## def log_agent_actions(state: Dict[str, Any]) -> None: """记录Agent的思考过程和行动""" print("\n" + "-" * 50) print("当前状态:") # 打印最新消息 if state.get("messages") and len(state["messages"]) > 0: latest_message = state["messages"][-1] if isinstance(latest_message, AIMessage): print(f"\nAI思考过程:") print(latest_message.content) # 如果有工具调用,打印工具调用信息 if latest_message.tool_calls: print(f"\n工具调用:") for tool_call in latest_message.tool_calls: print(f"- 工具: {tool_call['name']}") print(f"- 参数: {tool_call['args']}") elif isinstance(latest_message, ToolMessage): print(f"\n工具返回结果:") print(f"- 工具: {latest_message.name}") content = latest_message.content print(f"- 结果: {content}") print("-" * 50) ############################################################################## # 检查E2B代码解释器工具是否已注册 
############################################################################## print_separator("检查E2B代码解释器工具是否已注册") # 获取所有已注册的工具(以字典格式) registered_tools = get_registered_tools(as_dict=True) # 打印所有已注册的工具 print("\n已注册的工具:") for name, info in registered_tools.items(): print(f"- {name} (类别: {info['category'].value})") # 检查E2B代码解释器工具是否已注册 e2b_tool_name = "e2b_code_interpreter" if e2b_tool_name in registered_tools: print(f"\nE2B代码解释器工具已成功注册: {e2b_tool_name}") else: print(f"\n警告: E2B代码解释器工具未注册") # 手动注册E2B代码解释器工具 print("尝试手动注册E2B代码解释器工具...") try: from core.tools.registry import register_tool e2b_tool = E2BCodeInterpreterTool() register_tool(e2b_tool, ToolCategory.CODE_INTERPRETER) print(f"已手动注册工具: {e2b_tool.name}") except Exception as e: print(f"手动注册E2B代码解释器工具失败: {e}") ############################################################################## # 创建ReactAgent实例 ############################################################################## print_separator("创建ReactAgent实例") # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") # 从注册表中只获取代码解释器类工具列表 tools_list = get_tools_by_category(ToolCategory.CODE_INTERPRETER) # 打印获取到的代码解释器工具 print("\n获取到的代码解释器工具:") for tool in tools_list: print(f"- {tool.name}: {tool.description}") # 创建ReactAgent实例 react_agent = ReactAgent( model=model, tools=tools_list, name="financial_data_analyst", # 提示词强调使用代码解释器工具进行财务数据分析和可视化 prompt=( "你是一位专业的财务数据分析师,擅长使用Python进行财务数据分析和可视化。\n" "你有强大的代码执行工具可以使用:\n" "- e2b_code_interpreter: 用于执行Python代码,支持数据分析和可视化\n\n" "当面对财务数据分析问题时,请遵循以下方法论:\n" "1. 分析问题:理解用户的需求和问题本质\n" "2. 制定计划:确定解决方案和需要使用的工具\n" "3. 编写代码:使用适当的工具编写和执行代码\n" "4. 分析结果:解释代码执行结果,提供财务见解\n" "5. 优化方案:如有必要,优化代码或提供改进建议\n\n" "重要提示:\n" "- 优先使用e2b_code_interpreter工具执行Python代码\n" "- 对于财务数据分析和可视化任务,确保导入必要的库(如pandas, matplotlib, numpy等)\n" "- 对于不存在的库,工具会自动尝试使用pip install进行安装\n" "- 在代码中添加详细注释,解释关键步骤\n" "- 执行代码后,解释结果含义和财务见解\n" ), ) # # 编译Agent # agent = react_agent.compile() # # 获取图对象 # graph = agent.get_graph() # # 获取当前文件名(不含路径和扩展名) # current_file = os.path.basename(__file__) # file_name_without_ext = os.path.splitext(current_file)[0] # graph_dir = os.path.join(os.path.dirname(__file__), "graphs") # # 确保 graphs 目录存在 # os.makedirs(graph_dir, exist_ok=True) # # 生成与文件名一致的图片名,并保存到 examples/graphs 目录 # image_data = graph.draw_mermaid_png() # graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") # # 保存图片(如果已存在则覆盖) # with open(graph_path, "wb") as f: # f.write(image_data) # print(f"工作流图已保存为 {graph_path}") ############################################################################## # 从沙箱下载文件到本地的函数 ############################################################################## import os def download_file_from_sandbox(sandbox, sandbox_path, local_path): """从 e2b 沙箱中下载文件并保存到本地,自动区分文本和二进制文件""" try: print(f"读取文件: {sandbox_path}") # 判断是否为常见二进制文件类型(可自行扩展) binary_extensions = ( '.png', '.jpg', '.jpeg', '.gif', '.pdf', '.svg', '.xlsx', '.xls', '.zip', '.bin', '.pyc', '.pyd', '.pptx', '.docx', '.mp3', '.mp4', '.avi', '.mov', ) is_binary = sandbox_path.lower().endswith(binary_extensions) # 创建目录 os.makedirs(os.path.dirname(local_path), exist_ok=True) if is_binary: print("📦 识别为二进制文件,使用 sandbox.download_file()") content = sandbox.files.read(sandbox_path) # 返回 bytes with open(local_path, 'wb') as f: f.write(content) else: print("📄 识别为文本文件,使用 sandbox.files.read()") content = sandbox.files.read(sandbox_path) # 返回 str with open(local_path, 'w', encoding='utf-8') as f: f.write(content) print(f"✅ 文件已保存到本地: {local_path}") return True except Exception as e: print(f"❌ 下载失败: {e}") return False def 
download_directory_from_sandbox(sandbox, sandbox_dir_path, local_dir_path): """从沙箱下载整个目录内容到本地 Args: sandbox: 沙箱实例 sandbox_dir_path: 沙箱中的目录路径 local_dir_path: 本地保存目录路径 Returns: bool: 是否成功下载所有文件 """ try: print(f"尝试下载目录: {sandbox_dir_path} -> {local_dir_path}") # 确保本地目录存在 os.makedirs(local_dir_path, exist_ok=True) # 列出沙箱中指定目录下的所有文件 try: files = sandbox.files.list(sandbox_dir_path) # print(f"获取到文件列表: {sandbox_dir_path}, 类型: {type(files)}") # if files and len(files) > 0: # print(f"第一个文件类型: {type(files[0])}, 内容: {files[0]}") # # 检查对象属性 # print(f"文件对象可用属性: {dir(files[0])}") except Exception as e: print(f"列出文件时出错: {sandbox_dir_path}, 错误: {str(e)}") return False if not files: print(f"沙箱中目录 {sandbox_dir_path} 为空或不存在") return False downloaded_count = 0 # 定义需要跳过的系统文件 skip_files = {'.bashrc', '.bash_logout', '.profile'} # 遍历并下载每个文件 for file_info in files: try: # 使用dir()查看对象有哪些属性 print(f"文件信息对象属性: {dir(file_info)}") # 尝试安全获取name和type属性 file_name = getattr(file_info, "name", None) if file_name is None: print(f"警告: 无法获取文件名, 跳过此文件") continue file_type = getattr(file_info, "type", "file") # 默认为文件类型 # 如果 file_type 是枚举, 使用其 value 进行判断 type_value = file_type.value if hasattr(file_type, "value") else file_type # 跳过不需要的系统文件或系统目录(隐藏文件/目录) if file_name in skip_files or (file_name.startswith('.') and type_value == 'dir'): print(f"跳过系统文件或目录: {file_name}") continue print(f"处理文件: {file_name}, 类型: {type_value}") sandbox_file_path = f"{sandbox_dir_path}/{file_name}" local_file_path = os.path.join(local_dir_path, file_name) if type_value == 'dir': # 递归下载子目录 print(f"发现子目录: {sandbox_file_path}") if download_directory_from_sandbox(sandbox, sandbox_file_path, local_file_path): downloaded_count += 1 else: # 下载文件 print(f"下载文件: {sandbox_file_path} -> {local_file_path}") if download_file_from_sandbox(sandbox, sandbox_file_path, local_file_path): downloaded_count += 1 except Exception as e: print(f"处理文件时出错: {str(e)}") import traceback print(f"详细错误跟踪: {traceback.format_exc()}") continue if downloaded_count > 0: print(f"从 {sandbox_dir_path} 下载了 {downloaded_count} 个文件/目录到 {local_dir_path}") return True return False except Exception as e: print(f"从沙箱下载目录时出错: {str(e)}") import traceback print(f"详细错误跟踪: {traceback.format_exc()}") return False ############################################################################## # 测试:使用E2B代码解释器生成财务数据分析报表 ############################################################################## if __name__ == "__main__": print_separator("开始测试ReactAgent使用E2B代码解释器进行财务数据分析") print("\n查询: 生成模拟财务数据并进行分析,生成财务报表") # 定义输入 inputs = { "messages": [ HumanMessage(content="请生成一组模拟的公司财务数据(包括收入、支出、利润等),对数据进行分析,将处理过程(代码)和最终生成的结果保存到本地。") ] } result = react_agent.run(inputs) for m in result["messages"]: m.pretty_print() print("\n下载沙盒里的文件") try: # 遍历 react_agent.tools 以查找 E2B 相关工具 sandbox = None for tool in react_agent.tools: if hasattr(tool, "sandbox"): sandbox = tool.sandbox break # 找到后就退出循环 if sandbox: # 设定输出目录 output_dir = os.path.join(os.getcwd(), "examples/output/sandbox_files") os.makedirs(output_dir, exist_ok=True) # 直接下载主要工作目录 print("\n从沙箱下载文件到本地...") download_directory_from_sandbox(sandbox, "/home/user", output_dir) # 下载临时目录中可能的图表和数据文件 # download_directory_from_sandbox(sandbox, "/tmp", output_dir) print(f"\n文件已保存到目录: {output_dir}") sandbox.close() except Exception as e: print(f"从沙箱下载文件时出错: {str(e)}") ================================================ FILE: examples/11_e2b_sandbox_test.py ================================================ import os import sys import json from typing import Dict, Any, List from datetime 
import datetime from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from dotenv import load_dotenv from core.agents.base.react_agent import ReactAgent from core.tools.registry import get_registered_tools, ToolCategory, get_tools_by_category from core.tools.e2b_tool import E2BCodeInterpreterTool load_dotenv() # 自动加载 .env 文件 ############################################################################## # E2B沙盒环境测试程序 ############################################################################## def print_separator(title): """打印分隔符""" print("\n" + "=" * 80) print(f" {title} ".center(80, "=")) print("=" * 80) ############################################################################## # 创建一个记录Agent思考过程的函数 ############################################################################## def log_agent_actions(state: Dict[str, Any]) -> None: """记录Agent的思考过程和行动""" print("\n" + "-" * 50) print("当前状态:") # 打印最新消息 if state.get("messages") and len(state["messages"]) > 0: latest_message = state["messages"][-1] if isinstance(latest_message, AIMessage): print(f"\nAI思考过程:") print(latest_message.content) # 如果有工具调用,打印工具调用信息 if latest_message.tool_calls: print(f"\n工具调用:") for tool_call in latest_message.tool_calls: print(f"- 工具: {tool_call['name']}") print(f"- 参数: {tool_call['args']}") elif isinstance(latest_message, ToolMessage): print(f"\n工具返回结果:") print(f"- 工具: {latest_message.name}") content = latest_message.content if len(content) > 500: content = content[:250] + "\n... (内容过长,已截断) ...\n" + content[-250:] print(f"- 结果: {content}") print("-" * 50) ############################################################################## # 从沙箱下载文件到本地的函数 ############################################################################## def download_file_from_sandbox(sandbox, sandbox_path, local_path): """从 e2b 沙箱中下载文件并保存到本地,自动区分文本和二进制文件""" try: print(f"读取文件: {sandbox_path}") # 判断是否为常见二进制文件类型(可自行扩展) binary_extensions = ( '.png', '.jpg', '.jpeg', '.gif', '.pdf', '.svg', '.xlsx', '.xls', '.zip', '.bin', '.pyc', '.pyd', '.pptx', '.docx', '.mp3', '.mp4', '.avi', '.mov', ) is_binary = sandbox_path.lower().endswith(binary_extensions) # 创建目录 os.makedirs(os.path.dirname(local_path), exist_ok=True) if is_binary: print("📦 识别为二进制文件,使用 sandbox.download_file()") content = sandbox.files.read(sandbox_path) # 返回 bytes with open(local_path, 'wb') as f: f.write(content) else: print("📄 识别为文本文件,使用 sandbox.files.read()") content = sandbox.files.read(sandbox_path) # 返回 str with open(local_path, 'w', encoding='utf-8') as f: f.write(content) print(f"✅ 文件已保存到本地: {local_path}") return True except Exception as e: print(f"❌ 下载失败: {e}") return False def run_ai_generated_code(sandbox, code: str, save_results_dir=None): """在 E2B 沙箱中执行 AI 生成的代码 Args: sandbox: 沙箱实例 code: AI 生成的代码字符串 save_results_dir: 用于保存结果文件的本地目录路径(可选) Returns: dict: 包含执行结果的字典 """ try: print("在沙箱中执行 AI 生成的代码...") # 确保代码是字符串类型 if not isinstance(code, str): code = str(code) # 执行代码 execution = sandbox.run_code(code) print("代码执行完成!") # 准备结果字典 result = { "success": True, "stdout": "", "results": [] } # 提取标准输出 if hasattr(execution, "stdout"): result["stdout"] = execution.stdout # 检查代码是否执行成功 if hasattr(execution, "error") and execution.error: error_name = getattr(execution.error, "name", "Unknown") error_value = getattr(execution.error, "value", "Unknown error") error_traceback = getattr(execution.error, "traceback", "") print("AI 生成的代码执行出错:") print(f"错误类型: {error_name}") print(f"错误信息: {error_value}") if error_traceback: print(f"错误追踪: 
{error_traceback}") result["success"] = False result["error"] = { "name": error_name, "value": error_value, "traceback": error_traceback } return result # 处理执行结果 if hasattr(execution, "results") and execution.results: import base64 result_idx = 0 for res in execution.results: # 默认为文本结果 result_data = {"type": "text", "value": str(res)} # 检查是否有PNG图像 if hasattr(res, "png") and res.png: result_data["type"] = "png" result_data["value"] = res.png # base64编码的字符串 # 如果指定了保存目录,保存图像到本地 if save_results_dir: try: os.makedirs(save_results_dir, exist_ok=True) image_path = os.path.join(save_results_dir, f"result-{result_idx}.png") # 解码并保存图像 with open(image_path, 'wb') as f: f.write(base64.b64decode(res.png)) print(f"图像已保存到: {image_path}") result_data["local_path"] = image_path except Exception as img_err: print(f"保存图像时出错: {str(img_err)}") result["results"].append(result_data) result_idx += 1 return result except Exception as e: print(f"执行AI生成的代码时出错: {str(e)}") import traceback print(f"详细错误: {traceback.format_exc()}") return { "success": False, "error": { "name": type(e).__name__, "value": str(e), "traceback": traceback.format_exc() } } def download_directory_from_sandbox(sandbox, sandbox_dir_path, local_dir_path): """从沙箱下载整个目录内容到本地 Args: sandbox: 沙箱实例 sandbox_dir_path: 沙箱中的目录路径 local_dir_path: 本地保存目录路径 Returns: bool: 是否成功下载所有文件 """ try: print(f"尝试下载目录: {sandbox_dir_path} -> {local_dir_path}") # 确保本地目录存在 os.makedirs(local_dir_path, exist_ok=True) # 列出沙箱中指定目录下的所有文件 try: files = sandbox.files.list(sandbox_dir_path) # print(f"获取到文件列表: {sandbox_dir_path}, 类型: {type(files)}") # if files and len(files) > 0: # print(f"第一个文件类型: {type(files[0])}, 内容: {files[0]}") # # 检查对象属性 # print(f"文件对象可用属性: {dir(files[0])}") except Exception as e: print(f"列出文件时出错: {sandbox_dir_path}, 错误: {str(e)}") return False if not files: print(f"沙箱中目录 {sandbox_dir_path} 为空或不存在") return False downloaded_count = 0 # 定义需要跳过的系统文件 skip_files = {'.bashrc', '.bash_logout', '.profile'} # 遍历并下载每个文件 for file_info in files: try: # 使用dir()查看对象有哪些属性 print(f"文件信息对象属性: {dir(file_info)}") # 尝试安全获取name和type属性 file_name = getattr(file_info, "name", None) if file_name is None: print(f"警告: 无法获取文件名, 跳过此文件") continue file_type = getattr(file_info, "type", "file") # 默认为文件类型 # 如果 file_type 是枚举, 使用其 value 进行判断 type_value = file_type.value if hasattr(file_type, "value") else file_type # 跳过不需要的系统文件或系统目录(隐藏文件/目录) if file_name in skip_files or (file_name.startswith('.') and type_value == 'dir'): print(f"跳过系统文件或目录: {file_name}") continue print(f"处理文件: {file_name}, 类型: {type_value}") sandbox_file_path = f"{sandbox_dir_path}/{file_name}" local_file_path = os.path.join(local_dir_path, file_name) if type_value == 'dir': # 递归下载子目录 print(f"发现子目录: {sandbox_file_path}") if download_directory_from_sandbox(sandbox, sandbox_file_path, local_file_path): downloaded_count += 1 else: # 下载文件 print(f"下载文件: {sandbox_file_path} -> {local_file_path}") if download_file_from_sandbox(sandbox, sandbox_file_path, local_file_path): downloaded_count += 1 except Exception as e: print(f"处理文件时出错: {str(e)}") import traceback print(f"详细错误跟踪: {traceback.format_exc()}") continue if downloaded_count > 0: print(f"从 {sandbox_dir_path} 下载了 {downloaded_count} 个文件/目录到 {local_dir_path}") return True return False except Exception as e: print(f"下载整个目录时出错: {str(e)}") import traceback print(f"详细错误跟踪: {traceback.format_exc()}") ############################################################################## # 检查E2B代码解释器工具是否已注册 ############################################################################## 
print_separator("检查E2B代码解释器工具是否已注册") # 获取所有已注册的工具(以字典格式) registered_tools = get_registered_tools(as_dict=True) # 打印所有已注册的工具 print("\n已注册的工具:") for name, info in registered_tools.items(): print(f"- {name} (类别: {info['category'].value})") # 检查E2B代码解释器工具是否已注册 e2b_tool_name = "e2b_code_interpreter" if e2b_tool_name in registered_tools: print(f"\nE2B代码解释器工具已成功注册: {e2b_tool_name}") else: print(f"\n警告: E2B代码解释器工具未注册") # 手动注册E2B代码解释器工具 print("尝试手动注册E2B代码解释器工具...") try: from core.tools.registry import register_tool e2b_tool = E2BCodeInterpreterTool() register_tool(e2b_tool, ToolCategory.CODE_INTERPRETER) print(f"已手动注册工具: {e2b_tool.name}") except Exception as e: print(f"手动注册E2B代码解释器工具失败: {e}") ############################################################################## # 创建ReactAgent实例 ############################################################################## print_separator("创建ReactAgent实例") # 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") # 从注册表中只获取代码解释器类工具列表 tools_list = get_tools_by_category(ToolCategory.CODE_INTERPRETER) # 打印获取到的代码解释器工具 print("\n获取到的代码解释器工具:") for tool in tools_list: print(f"- {tool.name}: {tool.description}") # 创建ReactAgent实例 react_agent = ReactAgent( model=model, tools=tools_list, name="sandbox_test_agent", # 提示词强调测试沙箱环境的各种功能 prompt=( "你是一位专业的沙箱环境测试专家,负责测试E2B代码解释器沙箱环境的各种功能。\n" "你有强大的代码执行工具可以使用:\n" "- e2b_code_interpreter: 用于在沙箱环境中执行Python代码\n\n" "当进行沙箱环境测试时,请遵循以下方法论:\n" "1. 分析测试需求:理解需要测试的沙箱功能\n" "2. 设计测试用例:针对特定功能设计测试代码\n" "3. 执行测试:使用e2b_code_interpreter工具执行测试代码\n" "4. 分析结果:解释测试结果,判断功能是否正常\n" "5. 记录问题:如有异常,记录问题并提供详细信息\n\n" "重要提示:\n" "- 优先使用e2b_code_interpreter工具执行Python代码\n" "- 测试代码应包含详细注释,解释测试目的和预期结果\n" "- 所有文件和图片必须保存在沙盒环境中的特定目录,不要直接返回图片\n" "- 图片不允许在回复中展示!Images are not allowed in the response!\n" "- 测试应覆盖沙箱的各种功能,包括但不限于:\n" " * 基本Python代码执行\n" " * 文件系统操作(创建、读取、写入文件)\n" " * 包管理(安装和使用第三方包)\n" " * 系统命令执行(使用!前缀执行shell命令)\n" " * 数据处理和可视化\n" " * 异常处理和错误恢复\n" ), ) # 添加调试信息,验证工具列表和沙箱实例的初始状态 print("\n验证ReactAgent工具列表和沙箱实例初始状态:") print(f"react_agent.tools类型: {type(react_agent.tools)}") print(f"react_agent.tools长度: {len(react_agent.tools)}") # 遍历所有工具,检查是否有sandbox属性 for i, tool in enumerate(react_agent.tools): print(f"\n工具[{i}]类型: {type(tool)}") print(f"工具[{i}]名称: {getattr(tool, 'name', '未知')}") print(f"工具[{i}]是否有sandbox属性: {'sandbox' in dir(tool)}") # 如果有sandbox属性,打印沙箱实例信息 if 'sandbox' in dir(tool): print(f"工具[{i}]的sandbox类型: {type(tool.sandbox)}") print(f"工具[{i}]的sandbox是否可用: {getattr(tool, '_is_available', False)}") print(f"工具[{i}]的初始化错误: {getattr(tool, '_init_error', None)}") # 编译Agent agent = react_agent.compile() # # 获取图对象 # graph = agent.get_graph() # # 获取当前文件名(不含路径和扩展名) # current_file = os.path.basename(__file__) # file_name_without_ext = os.path.splitext(current_file)[0] # graph_dir = os.path.join(os.path.dirname(__file__), "graphs") # # 确保 graphs 目录存在 # os.makedirs(graph_dir, exist_ok=True) # # 生成与文件名一致的图片名,并保存到 examples/graphs 目录 # image_data = graph.draw_mermaid_png() # graph_path = os.path.join(graph_dir, f"{file_name_without_ext}.png") # # 保存图片(如果已存在则覆盖) # with open(graph_path, "wb") as f: # f.write(image_data) # print(f"工作流图已保存为 {graph_path}") ############################################################################## # 测试用例1:基本Python代码执行和环境信息 ############################################################################## def run_test_case_1(): print_separator("测试用例1:基本Python代码执行和环境信息") print("\n查询: 测试基本Python代码执行和获取环境信息") # 定义输入 inputs = { "messages": [ HumanMessage(content="请执行一段Python代码,测试基本的数学运算、字符串操作,并获取沙箱环境的系统信息(Python版本、操作系统信息等)。") ] } # 使用stream方法逐步获取中间状态 
final_state = None for partial_state in agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print_separator("测试用例1结果") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) ############################################################################## # 测试用例2:文件系统操作 ############################################################################## def run_test_case_2(): print_separator("测试用例2:文件系统操作") print("\n查询: 测试沙箱环境的文件系统操作") # 定义输入 inputs = { "messages": [ HumanMessage(content="请测试沙箱环境的文件系统操作,包括创建目录、创建文件、写入内容、读取内容、列出目录内容等。创建一个测试目录结构,并将操作结果保存到文件中。文件保存到 /home/user/test_dir") ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print_separator("测试用例2结果") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) # 检查是否有E2B沙箱实例,尝试下载生成的文件 for msg in final_state["messages"]: if isinstance(msg, ToolMessage) and msg.name == "e2b_code_interpreter": try: # 尝试解析工具消息内容 tool_output = json.loads(msg.content) print(f"\n工具消息内容解析成功: {type(tool_output)}") # 检查是否有原始输出 if hasattr(msg, 'raw_output') and msg.raw_output: print(f"\n消息包含raw_output属性: {type(msg.raw_output)}") # 打印react_agent.tools的信息 print(f"\nreact_agent.tools类型: {type(react_agent.tools)}") print(f"react_agent.tools长度: {len(react_agent.tools)}") # 遍历所有工具,检查是否有sandbox属性 for i, tool in enumerate(react_agent.tools): print(f"\n工具[{i}]类型: {type(tool)}") print(f"工具[{i}]名称: {getattr(tool, 'name', '未知')}") print(f"工具[{i}]是否有sandbox属性: {'sandbox' in dir(tool)}") if 'sandbox' in dir(tool): print(f"工具[{i}]的sandbox类型: {type(tool.sandbox)}") # 遍历 react_agent.tools 以查找 E2B 相关工具 sandbox = None for tool in react_agent.tools: if hasattr(tool, "sandbox"): sandbox = tool.sandbox break # 找到后就退出循环 if sandbox: print("\n成功获取沙箱实例!") print(f"沙箱实例类型: {type(sandbox)}") # 从沙箱下载生成的文件 output_dir = os.path.join(os.path.dirname(__file__), "output", "sandbox_test") os.makedirs(output_dir, exist_ok=True) print(f"输出目录已创建: {output_dir}") # 尝试下载测试目录,路径和提示中保持一致 sandbox_test_path = "/home/user/test_dir" print(f"尝试从沙箱下载目录: {sandbox_test_path}") download_directory_from_sandbox(sandbox, sandbox_test_path, os.path.join(output_dir, "test_dir")) else: print("\n错误: 无法获取沙箱实例,没有找到具有sandbox属性的工具") else: print("\n错误: 消息没有raw_output属性") except Exception as e: print(f"处理工具消息时出错: {str(e)}") ############################################################################## # 测试用例3:包管理和第三方库使用 ############################################################################## def run_test_case_3(): print_separator("测试用例3:包管理和第三方库使用") print("\n查询: 测试沙箱环境的包管理和第三方库使用") # 定义输入 inputs = { "messages": [ HumanMessage(content="请测试沙箱环境的包管理功能,安装一个不常见的第三方库(如wordcloud、pycountry等),并使用该库编写一个简单的示例程序。验证包安装和使用是否正常。") ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 
messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print_separator("测试用例3结果") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) ############################################################################## # 测试用例4:Shell命令执行 ############################################################################## def run_test_case_4(): print_separator("测试用例4:Shell命令执行") print("\n查询: 测试沙箱环境的Shell命令执行") # 定义输入 inputs = { "messages": [ HumanMessage(content="请测试沙箱环境中执行Shell命令的功能,使用!前缀执行一系列Linux命令,包括系统信息查询、目录操作、文件查找等。将命令执行结果保存到文件(/home/user/shell_commands_results.txt)中。") ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print_separator("测试用例4结果") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) # 尝试下载生成的文件 for msg in final_state["messages"]: if isinstance(msg, ToolMessage) and msg.name == "e2b_code_interpreter": try: print(f"\n测试用例4: 检查工具消息类型: {type(msg)}") print(f"测试用例4: 工具消息名称: {msg.name}") # 检查react_agent.tools的信息 print(f"\n测试用例4: react_agent.tools类型: {type(react_agent.tools)}") print(f"测试用例4: react_agent.tools长度: {len(react_agent.tools)}") # 遍历 react_agent.tools 以查找 E2B 相关工具 sandbox = None for tool in react_agent.tools: if hasattr(tool, "sandbox"): sandbox = tool.sandbox break # 找到后就退出循环 if sandbox: print("\n测试用例4: 成功获取沙箱实例!") print(f"测试用例4: 沙箱实例类型: {type(sandbox)}") print(f"测试用例4: 沙箱实例属性: {dir(sandbox)[:10]}...") output_dir = os.path.join(os.path.dirname(__file__), "output", "sandbox_test") os.makedirs(output_dir, exist_ok=True) print(f"测试用例4: 输出目录已创建: {output_dir}") # 尝试下载shell命令结果文件,路径和提示中保持一致 sandbox_file_path = "/home/user/shell_commands_results.txt" local_file_path = os.path.join(output_dir, "shell_commands_results.txt") print(f"测试用例4: 尝试下载文件: {sandbox_file_path} -> {local_file_path}") download_file_from_sandbox(sandbox, sandbox_file_path, local_file_path) else: print("\n测试用例4: 错误: 无法获取沙箱实例,没有找到具有sandbox属性的工具") print(f"测试用例4: react_agent.tools的类型和长度: {type(react_agent.tools)}, {len(react_agent.tools)}") except Exception as e: print(f"下载文件时出错: {str(e)}") ############################################################################## # 测试用例5:数据处理和可视化 ############################################################################## def run_test_case_5(): print_separator("测试用例5:数据处理和可视化") print("\n查询: 测试沙箱环境的数据处理和可视化功能") # 定义输入 inputs = { "messages": [ HumanMessage(content=( "请测试沙箱环境的数据处理和可视化功能,生成一些随机数据,使用pandas进行数据处理," "然后使用matplotlib创建多种类型的图表(折线图、柱状图、散点图等)。\n" "严格按照以下要求:\n" "1. 将所有图表保存到 /home/user/visualizations 目录\n" "2. 不要在回复中包含图片 - 图片直接保存到上述目录即可\n" "3. Images are not allowed in the response!\n" "4. 只需描述你做了什么,创建了哪些图表,并说明它们保存在哪里\n" "5. 
请确保目录存在后再保存图片\n" )) ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print_separator("测试用例5结果") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) # 尝试下载生成的图表文件 for msg in final_state["messages"]: if isinstance(msg, ToolMessage) and msg.name == "e2b_code_interpreter": try: # 遍历 react_agent.tools 以查找 E2B 相关工具 sandbox = None for tool in react_agent.tools: if hasattr(tool, "sandbox"): sandbox = tool.sandbox break # 找到后就退出循环 if sandbox: output_dir = os.path.join(os.path.dirname(__file__), "output", "sandbox_test") os.makedirs(output_dir, exist_ok=True) # 针对性地下载可视化目录中的图表 vis_dir = "/home/user/visualizations" local_vis_dir = os.path.join(output_dir, "visualizations") os.makedirs(local_vis_dir, exist_ok=True) print(f"测试用例5: 下载可视化图表目录: {vis_dir} -> {local_vis_dir}") # 尝试列出可视化目录中的文件 try: files = sandbox.files.list(vis_dir) if files: print(f"找到图表文件:") for file_info in files: file_name = getattr(file_info, "name", "未知文件") print(f"- {file_name}") else: print(f"警告: 可视化目录为空或不存在") except Exception as e: print(f"列出可视化目录文件时出错: {str(e)}") # 执行下载 success = download_directory_from_sandbox(sandbox, vis_dir, local_vis_dir) if success: print(f"✅ 成功下载可视化图表") else: print(f"⚠️ 下载可视化图表失败,尝试下载整个用户目录作为备份") download_directory_from_sandbox(sandbox, "/home/user", output_dir) else: print("\n错误: 无法获取沙箱实例,没有找到具有sandbox属性的工具") except Exception as e: print(f"下载文件时出错: {str(e)}") import traceback print(f"错误详情: {traceback.format_exc()}") ############################################################################## # 测试用例6:异常处理和错误恢复 ############################################################################## def run_test_case_6(): print_separator("测试用例6:异常处理和错误恢复") print("\n查询: 测试沙箱环境的异常处理和错误恢复能力") # 定义输入 inputs = { "messages": [ HumanMessage(content="请测试沙箱环境的异常处理和错误恢复能力。编写一段包含各种常见错误的Python代码(如语法错误、除零错误、文件不存在错误等),然后展示如何捕获和处理这些异常。验证沙箱环境是否能正确报告错误并继续执行后续代码。") ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取消息列表 messages = partial_state.get("messages", []) if not messages: continue # 获取最新消息 latest_message = messages[-1] # 使用log_agent_actions函数记录状态 log_agent_actions({"messages": [latest_message]}) # 打印最终回答 print_separator("测试用例6结果") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) ############################################################################## # 主函数 - 运行所有测试用例 ############################################################################## if __name__ == "__main__": print_separator("开始测试E2B沙箱环境") try: # 确保输出目录存在 output_dir = os.path.join(os.path.dirname(__file__), "output", "sandbox_test") os.makedirs(output_dir, exist_ok=True) print(f"创建输出目录: {output_dir}") # 确保可视化输出目录存在 vis_output_dir = os.path.join(output_dir, "visualizations") os.makedirs(vis_output_dir, exist_ok=True) print(f"创建可视化输出目录: {vis_output_dir}") # # 运行测试用例 # # 运行测试用例1:基本Python代码执行和环境信息 # run_test_case_1() # # 运行测试用例2:文件系统操作 # run_test_case_2() # # 运行测试用例3:包管理和第三方库使用 # run_test_case_3() # # 运行测试用例4:Shell命令执行 # 
run_test_case_4() # 运行测试用例5:数据处理和可视化 run_test_case_5() # # 运行测试用例6:异常处理和错误恢复 # run_test_case_6() print_separator("E2B沙箱环境测试完成") print("测试结果已保存到 examples/output/sandbox_test 目录") except Exception as e: print(f"测试过程中出错: {str(e)}") finally: # 关闭E2B沙箱 print("\n正在关闭E2B沙箱...") for tool in react_agent.tools: if hasattr(tool, 'close'): tool.close()
================================================
FILE: examples/12_planning_supervisor_test.py
================================================
from langgraph.prebuilt import create_react_agent from core.agents.react_supervisor_agent import SupervisorAgent from core.agents.research_agent import ResearchAgent from core.agents.base.react_agent import ReactAgent from langchain_openai import ChatOpenAI from langgraph.func import entrypoint, task from langgraph.graph import add_messages from dotenv import load_dotenv from langchain_community.tools import TavilySearchResults load_dotenv() # 自动加载 .env 文件 # 1. 初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") ############################################################################## # Agent 1: Joke Generator (Functional API) ############################################################################## @task def generate_joke(messages): """Generate a short joke (no tool calls).""" system_message = { "role": "system", "content": "You are a witty comedian. Write a short joke." } # 直接调用 model.invoke,拼接 system_message + 用户消息 msg = model.invoke([system_message] + messages) return msg @entrypoint() def joke_agent(state): # 调用上面的函数型任务 joke = generate_joke(state['messages']).result() # 将产物插入消息列表 messages = add_messages(state["messages"], [joke]) return {"messages": messages} joke_agent.name = "joke_agent" ############################################################################## # Agent 2: Research Expert with Tavily Search (Graph API) ############################################################################## # 创建Tavily搜索工具 tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=False, include_images=False, search_depth="advanced" ) # 使用我们自定义的ResearchAgent替代create_react_agent创建的agent research_agent = ResearchAgent( name="research_expert", model=model, max_iterations=5, cache_enabled=True, debug=False ) research_agent_2 = ReactAgent( name="research_expert", model=model, tools=[tavily_search]) ############################################################################## # 使用带有Planning功能的SupervisorAgent ############################################################################## # 创建 SupervisorAgent 实例,启用Planning功能 supervisor = SupervisorAgent( agents=[joke_agent,research_agent_2], model=model, ) ############################################################################## # 测试:复杂请求需要规划和多个步骤 ############################################################################## result = supervisor.run({ "messages": [ { "role": "user", "content": ( "I'm preparing a presentation about tech companies. I need three things: " "1) A joke about tech companies to start with, " "2) The employee count for FAANG, and " "3) A comparison of which company has the most employees."
) } ] }) ############################################################################## # 打印最终对话消息 ############################################################################## for m in result["messages"]: m.pretty_print() # 打印任务列表 print("\n##############################################################################") print("# 最终任务列表") print("##############################################################################") if "plan" in result and result["plan"] and "tasks" in result["plan"]: tasks = result["plan"]["tasks"] print(f"总共 {len(tasks)} 个任务:") for i, task in enumerate(tasks): print(f"\n任务 {i+1}: {task['description']}") print(f" 状态: {task['status']}") print(f" 代理: {task['agent'] if task['agent'] else '未分配'}") print(f" 创建时间: {task['created_at']}") print(f" 完成时间: {task['completed_at'] if task['completed_at'] else '未完成'}") else: print("没有任务列表信息") # 打印原始任务列表(如果存在) if "tasks" in result: print("\n原始任务列表:") for t in result["tasks"]: t.pretty_print() ================================================ FILE: examples/13_multi_agent_roles_test.py ================================================ from langgraph.prebuilt import create_react_agent from core.agents.react_supervisor_agent import SupervisorAgent from core.agents.sub_agents.research_agent import ResearchAgent from core.agents.sub_agents.coder_agent import CoderAgent from core.agents.sub_agents.reporter_agent import ReporterAgent from core.agents.sub_agents.designer_agent import DesignerAgent from core.agents.sub_agents.data_analyst_agent import DataAnalystAgent from langchain_openai import ChatOpenAI from langchain_core.messages import AIMessage, HumanMessage, ToolMessage from langgraph.func import entrypoint, task from langgraph.graph import add_messages from dotenv import load_dotenv from langchain_community.tools import TavilySearchResults import os import logging import sys import io import json from contextlib import redirect_stdout, redirect_stderr load_dotenv() # 自动加载 .env 文件 # 1. 
初始化大模型 model = ChatOpenAI(model="gpt-4o-mini") # 设置日志捕获 class LogCapture: def __init__(self): self.log_buffer = io.StringIO() self.log_content = [] def start_capture(self): self.log_buffer = io.StringIO() return self.log_buffer def stop_capture(self): output = self.log_buffer.getvalue() self.log_content.append(output) return output def get_content(self): return "\n".join(self.log_content) log_capture = LogCapture() ############################################################################## # 从沙箱下载文件到本地的函数 ############################################################################## def download_file_from_sandbox(sandbox, sandbox_path, local_path): """从 e2b 沙箱中下载文件并保存到本地,自动区分文本和二进制文件""" try: print(f"读取文件: {sandbox_path}") # 判断是否为常见二进制文件类型(可自行扩展) binary_extensions = ( '.png', '.jpg', '.jpeg', '.gif', '.pdf', '.svg', '.xlsx', '.xls', '.zip', '.bin', '.pyc', '.pyd', '.pptx', '.docx', '.mp3', '.mp4', '.avi', '.mov', ) is_binary = sandbox_path.lower().endswith(binary_extensions) # 创建目录 os.makedirs(os.path.dirname(local_path), exist_ok=True) if is_binary: print("📦 识别为二进制文件,使用 sandbox.download_file()") content = sandbox.files.read(sandbox_path) # 返回 bytes with open(local_path, 'wb') as f: f.write(content) else: print("📄 识别为文本文件,使用 sandbox.files.read()") content = sandbox.files.read(sandbox_path) # 返回 str with open(local_path, 'w', encoding='utf-8') as f: f.write(content) print(f"✅ 文件已保存到本地: {local_path}") return True except Exception as e: print(f"❌ 下载失败: {e}") return False def download_directory_from_sandbox(sandbox, sandbox_dir_path, local_dir_path): """从沙箱下载整个目录内容到本地 Args: sandbox: 沙箱实例 sandbox_dir_path: 沙箱中的目录路径 local_dir_path: 本地保存目录路径 Returns: bool: 是否成功下载所有文件 """ try: print(f"尝试下载目录: {sandbox_dir_path} -> {local_dir_path}") # 确保本地目录存在 os.makedirs(local_dir_path, exist_ok=True) # 列出沙箱中指定目录下的所有文件 try: files = sandbox.files.list(sandbox_dir_path) except Exception as e: print(f"列出文件时出错: {sandbox_dir_path}, 错误: {str(e)}") return False if not files: print(f"沙箱中目录 {sandbox_dir_path} 为空或不存在") return False downloaded_count = 0 # 定义需要跳过的系统文件 skip_files = {'.bashrc', '.bash_logout', '.profile'} # 遍历并下载每个文件 for file_info in files: try: # 尝试安全获取name和type属性 file_name = getattr(file_info, "name", None) if file_name is None: print(f"警告: 无法获取文件名, 跳过此文件") continue file_type = getattr(file_info, "type", "file") # 默认为文件类型 # 如果 file_type 是枚举, 使用其 value 进行判断 type_value = file_type.value if hasattr(file_type, "value") else file_type # 跳过不需要的系统文件或系统目录(隐藏文件/目录) if file_name in skip_files or (file_name.startswith('.') and type_value == 'dir'): print(f"跳过系统文件或目录: {file_name}") continue print(f"处理文件: {file_name}, 类型: {type_value}") sandbox_file_path = f"{sandbox_dir_path}/{file_name}" local_file_path = os.path.join(local_dir_path, file_name) if type_value == 'dir': # 递归下载子目录 print(f"发现子目录: {sandbox_file_path}") if download_directory_from_sandbox(sandbox, sandbox_file_path, local_file_path): downloaded_count += 1 else: # 下载文件 print(f"下载文件: {sandbox_file_path} -> {local_file_path}") if download_file_from_sandbox(sandbox, sandbox_file_path, local_file_path): downloaded_count += 1 except Exception as e: print(f"处理文件时出错: {str(e)}") import traceback print(f"详细错误跟踪: {traceback.format_exc()}") continue if downloaded_count > 0: print(f"从 {sandbox_dir_path} 下载了 {downloaded_count} 个文件/目录到 {local_dir_path}") return True return False except Exception as e: print(f"下载整个目录时出错: {str(e)}") import traceback print(f"详细错误跟踪: {traceback.format_exc()}") ############################################################################## # 
Agent 2: Research Expert - 使用自定义的ResearchAgent ############################################################################## research_agent = ResearchAgent( name="research_expert", model=model, max_iterations=5, cache_enabled=True, debug=True ) ############################################################################## # Agent 3: Coder - 使用自定义的CoderAgent ############################################################################## from core.tools.e2b_tool import E2BCodeInterpreterTool e2b_tool = E2BCodeInterpreterTool() coder_agent = CoderAgent( name="coder_expert", model=model, tools=[e2b_tool], max_iterations=5, cache_enabled=True, debug=True ) ############################################################################## # Agent 4: Reporter - 使用自定义的ReporterAgent ############################################################################## reporter_agent = ReporterAgent( name="reporter_expert", model=model, max_iterations=5, cache_enabled=True, ) ############################################################################## # Agent 5: Designer - 使用自定义的DesignerAgent ############################################################################## designer_agent = DesignerAgent( name="designer_expert", model=model, max_iterations=5, cache_enabled=True, ) ############################################################################## # Agent 6: Data Analyst - 使用自定义的DataAnalystAgent ############################################################################## data_analyst_agent = DataAnalystAgent( name="data_analyst_expert", model=model, max_iterations=5, cache_enabled=True, ) ############################################################################## # 使用带有Planning功能的SupervisorAgent协调所有角色 ############################################################################## # 创建 SupervisorAgent 实例,启用Planning功能 supervisor = SupervisorAgent( agents=[ research_agent, coder_agent, reporter_agent, designer_agent, data_analyst_agent, ], model=model, enable_planning=True, output_mode="last_message" ) # 获取当前文件名(不含路径和扩展名) current_file = os.path.basename(__file__) file_name_without_ext = os.path.splitext(current_file)[0] logs_dir = os.path.join(os.path.dirname(__file__), "logs") # 创建图表输出文件路径 os.makedirs(logs_dir, exist_ok=True) # 创建Markdown输出文件路径 markdown_path = os.path.join(logs_dir, f"{file_name_without_ext}.md") ############################################################################## # 测试:复杂请求需要规划和多个步骤 ############################################################################## def save_markdown_log(): """将执行结果保存为Markdown文件""" with open(markdown_path, "w", encoding="utf-8") as f: f.write(f"# 执行结果: {file_name_without_ext}\n\n") f.write("## 图表\n\n") f.write("## 执行日志\n\n") f.write("```\n") f.write(log_capture.get_content()) f.write("\n```\n") print(f"执行日志已保存到 {markdown_path}") if __name__ == "__main__": try: # 开始捕获输出 log_buffer = log_capture.start_capture() with redirect_stdout(log_buffer), redirect_stderr(log_buffer): print(f"开始执行 {current_file} 测试...") # 测试1:需要研究和编码的任务 print("\n## 测试1:需要研究和编码的任务") final_state = supervisor.run({ "messages": [ { "role": "user", "content": ( "我需要一个Python爬虫来获取 https://www.paulgraham.com/articles.html 所有articles列表,并将结果保存为CSV文件,放在/home/user下面。" "并将你测试通过的爬虫代码返回给我。" "请确保你的代码能够正常运行。" "如果遇到问题,请重试。" ) } ] }) print("\n测试1结果:") for m in final_state["messages"]: m.pretty_print() # 遍历 react_agent.tools 以查找 E2B 相关工具 try: # 遍历 react_agent.tools 以查找 E2B 相关工具 sandbox = None for tool in coder_agent.tools: if hasattr(tool, "sandbox"): sandbox = tool.sandbox break # 找到后就退出循环 if 
sandbox: # 设定输出目录 output_dir = os.path.join(os.getcwd(), "examples/output/sandbox_files") os.makedirs(output_dir, exist_ok=True) # 直接下载主要工作目录 print("\n从沙箱下载文件到本地...") download_directory_from_sandbox(sandbox, "/home/user", output_dir) # 下载临时目录中可能的图表和数据文件 # download_directory_from_sandbox(sandbox, "/tmp", output_dir) print(f"\n文件已保存到目录: {output_dir}") sandbox.close() except Exception as e: print(f"从沙箱下载文件时出错: {str(e)}") finally: # 停止捕获并保存结果 log_capture.stop_capture() save_markdown_log() ================================================ FILE: examples/14_mcp_client_fetch_test.py ================================================ import os import sys import asyncio import traceback from typing import Dict, Optional, Type from dotenv import load_dotenv # 在这里添加项目根目录到路径,方便导入 sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) load_dotenv() from langchain_openai import ChatOpenAI from langgraph.prebuilt import create_react_agent from langchain_core.tools import BaseTool from langchain_core.messages import HumanMessage try: from pydantic.v1 import BaseModel, Field except ImportError: from pydantic import BaseModel, Field # type: ignore from core.mcp.client import MCPClient from core.mcp.config_loader import load_config, MCPConfig, StdioConfig from core.llm.llm_manager import LLMManager try: from mcp.types import CallToolRequest CALL_TOOL_REQ_AVAILABLE = True except ImportError: CallToolRequest = None CALL_TOOL_REQ_AVAILABLE = False # 这是唯一保留的 fetch schema try: class FetchInputSchema(BaseModel): url: str = Field(..., description="URL to fetch") max_length: Optional[int] = Field(default=5000) start_index: Optional[int] = Field(default=0) raw: Optional[bool] = Field(default=False) FETCH_SCHEMA_AVAILABLE = True except Exception: FetchInputSchema = None FETCH_SCHEMA_AVAILABLE = False CENTRAL_CONFIG_PATH = os.path.join(os.path.dirname(__file__), "..", "core", "mcp", "mcp_server_config.json") LLM_ID_FOR_TESTING = "openai_gpt4o_mini" llm_manager = LLMManager() class MCPToolRunner(BaseTool): name: str = "needs_override" description: str = "needs_override" args_schema: Optional[Type[BaseModel]] = None client: MCPClient = Field(exclude=True) class Config: arbitrary_types_allowed = True async def _arun(self, **kwargs) -> str: if not self.client or not self.client.session: return f"ERROR: MCP Client session inactive for {self.name}." if not CALL_TOOL_REQ_AVAILABLE: return "ERROR: CallToolRequest unavailable." try: print(f" [_arun:{self.name}] Sending MCP request with args: {kwargs}") result_message = await asyncio.wait_for( self.client.session.call_tool(self.name, kwargs), timeout=120.0 ) # 简化: 只检查 result 和 error if hasattr(result_message, "result"): return str(result_message.result) elif hasattr(result_message, "error"): return f"Tool Error: {result_message.error.message}" else: return "Unknown response" except asyncio.TimeoutError: return "Error: Timeout." 
async def run_fetch_test(server_config_key: str, all_configs: Dict[str, MCPConfig]):
    print(f"\n=== Running STDIO BaseTool Test for Server '{server_config_key}' (Tool: 'fetch') ===")
    if not FETCH_SCHEMA_AVAILABLE:
        print("ERROR: Fetch Schema missing.")
        return False
    if not CALL_TOOL_REQ_AVAILABLE:
        print("ERROR: CallToolRequest unavailable.")
        return False
    server_config = all_configs.get(server_config_key)
    if not server_config:
        print(f"ERROR: Config for '{server_config_key}' not found.")
        return False
    if not isinstance(server_config.connection, StdioConfig):
        print(f"ERROR: Config '{server_config_key}' not STDIO.")
        return False
    try:
        model = llm_manager.get_model(LLM_ID_FOR_TESTING)
        print(f"Using LLM: {getattr(model, 'model_name', LLM_ID_FOR_TESTING)}")
    except ValueError as e:
        print(f"Error getting LLM: {e}.")
        return False

    test_success = False
    async with MCPClient(server_config) as client:
        if not client.session:
            print("ERROR: MCP session not established!")
            return False
        try:
            runner = MCPToolRunner(
                client=client,
                name="fetch",
                description="Fetches URL content as markdown.",
                args_schema=FetchInputSchema
            )
            tools = [runner]
        except Exception as e_inst:
            print(f"ERROR: Failed to instantiate MCPToolRunner: {e_inst}")
            return False

        agent = create_react_agent(model, tools)
        query = (
            "Use the fetch tool to get the content of https://www.google.com "
            "and tell me its title (first 50 chars)."
        )
        print(f"\nQuery: {query}")
        try:
            response = await asyncio.wait_for(
                agent.ainvoke({"messages": [{"role": "user", "content": query}]}),
                timeout=180.0
            )
            print("\nAgent Final Response:")
            if response and "messages" in response and response["messages"]:
                response_content = response["messages"][-1].content
                print(response_content)
                if "google" in response_content.lower():
                    print("\n✅ Test PASS")
                    test_success = True
                else:
                    print("\n❌ Test FAIL (title not found)")
                    test_success = False
            else:
                print("No valid response from agent.")
                test_success = False
        except Exception as e:
            print(f"Exception: {e}")
            test_success = False
    return test_success


async def main():
    print("Starting a simplified MCP Integration Test for 'fetch_via_uvx' only...")
    try:
        all_configs = load_config(CENTRAL_CONFIG_PATH)
        print(f"Loaded {len(all_configs)} server configs.")
    except Exception as e:
        print(f"Error loading config: {e}")
        return
    # Only test fetch_via_uvx
    result = await run_fetch_test("fetch_via_uvx", all_configs)
    if result:
        print("\nALL GOOD: 'fetch' test passed.")
    else:
        print("\nTEST FAILED: 'fetch' test didn't pass.")
    print("Done.")


if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: examples/15_mcp_agent_test.py
================================================
# examples/15_mcp_agent_test.py (final version - BaseTool subclass)
import os
import sys
import asyncio
import json
from dotenv import load_dotenv
import traceback
from typing import List, Dict, Any, Optional, Type

# --- Prerequisites ---
# 1. Make sure core/mcp/client.py and core/mcp/config_loader.py are up to date
#    (including the AsyncExitStack and import fixes).
# 2. Make sure core/mcp/config.json exists and contains a "fetch_via_uvx" entry
#    (using uvx + stdio).
# 3. Make sure uv (`pip install uv`) and mcp-server-fetch are installed.
# 4. Make sure the OpenAI API key (or another LLM key) is set in .env or the environment.
# 5. Setting the LangSmith environment variables is recommended for detailed agent tracing.
# ---

# Add the project root to sys.path
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
load_dotenv()

# --- Core imports ---
# LangChain
from langchain_openai import ChatOpenAI
from langgraph.prebuilt import create_react_agent
from langchain_core.tools import BaseTool
from langchain_core.messages import HumanMessage

try:
    # Try Pydantic v1 first (the version LangChain commonly uses)
    from langchain_core.pydantic_v1 import BaseModel, Field
except ImportError:
    try:
        # Fall back to Pydantic v2 if v1 is unavailable
        from pydantic import BaseModel, Field  # type: ignore
    except ImportError:
        print("CRITICAL ERROR: Pydantic (v1 or v2) not found.")
        sys.exit(1)

# MCP client/config
try:
    from core.mcp.client import MCPClient
except ImportError:
    print("CRITICAL ERROR: Cannot import MCPClient."); sys.exit(1)
try:
    from core.mcp.config_loader import load_config, MCPConfig, StdioConfig
except ImportError:
    print("CRITICAL ERROR: Cannot import config loader."); sys.exit(1)

# LLM
from core.llm.llm_manager import LLMManager

# MCP types
try:
    from mcp.types import CallToolRequest
    CALL_TOOL_REQ_AVAILABLE = True
except ImportError:
    CallToolRequest = None
    CALL_TOOL_REQ_AVAILABLE = False
# ---

# --- Fetch tool schema definition ---
FETCH_SCHEMA_AVAILABLE = False
FetchInputSchema = None
try:
    class FetchInputSchema(BaseModel):  # uses the BaseModel imported above
        url: str = Field(..., description="URL to fetch")
        max_length: Optional[int] = Field(default=5000, description="Maximum number of characters to return")
        start_index: Optional[int] = Field(default=0, description="Start content from this character index")
        raw: Optional[bool] = Field(default=False, description="Get raw content without markdown conversion")
    FETCH_SCHEMA_AVAILABLE = True
except Exception as e_pyd_fetch:
    print(f"ERROR defining FetchInputSchema: {e_pyd_fetch}")
# ---

# --- Global settings ---
# **Important**: make sure this path points at your central config file
CENTRAL_CONFIG_PATH = os.path.join(os.path.dirname(__file__), "..", "core", "mcp", "mcp_server_config.json")
# OpenAI models are usually the most stable choice here
LLM_ID_FOR_TESTING = "openai_gpt4o_mini"
# Key of the server to test in config.json
SERVER_KEY_TO_TEST = "fetch_via_uvx"
# Name of the tool to test
TOOL_NAME_TO_TEST = "fetch"
# Correct schema for the tool under test
CORRECT_SCHEMA_FOR_TOOL = FetchInputSchema
# Description of the tool under test
TOOL_DESCRIPTION = "Fetches web content as markdown. Input requires 'url' (string) and optional 'max_length', 'start_index', 'raw'."
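# (Illustrative assumption) The LangSmith tracing recommended in the prerequisites
# above is enabled through environment variables, typically:
#   LANGCHAIN_TRACING_V2=true
#   LANGCHAIN_API_KEY=<your key>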
# --- Everything MCP server settings ---
EVERYTHING_SERVER_KEY = "everything"
EVERYTHING_ECHO_TOOL = "echo"
EVERYTHING_ADD_TOOL = "add"

# --- Everything MCP tool schema definitions ---
ECHO_SCHEMA_AVAILABLE = False
EchoInputSchema = None
try:
    class EchoInputSchema(BaseModel):
        message: str = Field(..., description="Message to echo back")
    ECHO_SCHEMA_AVAILABLE = True
except Exception as e_pyd_echo:
    print(f"ERROR defining EchoInputSchema: {e_pyd_echo}")

ADD_SCHEMA_AVAILABLE = False
AddInputSchema = None
try:
    class AddInputSchema(BaseModel):
        a: float = Field(..., description="First number")
        b: float = Field(..., description="Second number")
    ADD_SCHEMA_AVAILABLE = True
except Exception as e_pyd_add:
    print(f"ERROR defining AddInputSchema: {e_pyd_add}")

llm_manager = LLMManager()


# --- Standard BaseTool subclass that bridges calls to MCP ---
class MCPToolRunner(BaseTool):
    """Standard BaseTool implementation that invokes a server-side tool over MCP."""

    # --- Class attributes (overridden at instantiation time) ---
    name: str = "mcp_tool_runner"  # default name
    description: str = "Runs a tool via MCP"
    args_schema: Optional[Type[BaseModel]] = None

    # --- Instance attributes ---
    client: MCPClient = Field(exclude=True)  # holds the client reference

    # Pydantic config (adjust to the BaseModel version you use)
    class Config:
        arbitrary_types_allowed = True

    async def _arun(self, **kwargs) -> str:
        """Async execution: build the MCP request and call client.session.call_tool."""
        if not self.client or not self.client.session:
            return f"ERROR: MCP Client session inactive for {self.name}."
        if not CALL_TOOL_REQ_AVAILABLE:
            return "ERROR: CallToolRequest unavailable."
        try:
            # kwargs are the arguments LangChain validated against args_schema
            print(f"  [_arun:{self.name}] Preparing MCP request with args: {kwargs}")
            # No need to build a CallToolRequest object; pass the tool name and args directly
            print(f"  [_arun:{self.name}] Calling tool '{self.name}' with args: {kwargs}")
            result_message = await asyncio.wait_for(
                self.client.session.call_tool(self.name, kwargs),
                timeout=120.0  # generous network/execution timeout
            )

            # Handle the result -- simplified logic that checks the `content` attribute first
            print(f"  [_arun:{self.name}] MCP Response received, type: {type(result_message)}")

            # Check for a `content` attribute first (matches the response shape seen in the logs)
            if hasattr(result_message, 'content'):
                content = result_message.content
                print(f"  [_arun:{self.name}] Found content attribute, type: {type(content)}")
                # If content is a non-empty list
                if isinstance(content, list) and len(content) > 0:
                    first_item = content[0]
                    print(f"  [_arun:{self.name}] Content is a list, first item type: {type(first_item)}")
                    # Try the `text` attribute
                    if hasattr(first_item, 'text'):
                        print(f"  [_arun:{self.name}] First item has text attribute, returning text")
                        return first_item.text
                    else:
                        print(f"  [_arun:{self.name}] First item has no text attribute, converting to string")
                        return str(first_item)
                elif hasattr(content, 'text'):
                    print(f"  [_arun:{self.name}] Content has text attribute, returning text")
                    return content.text
                else:
                    print(f"  [_arun:{self.name}] Content has no text attribute, converting to string")
                    return str(content)
            # Fall back to a `result` attribute if there is no `content`
            elif hasattr(result_message, 'result'):
                res_val = result_message.result
                print(f"  [_arun:{self.name}] Found result attribute: {str(res_val)[:500]}...")
                return str(res_val) if not isinstance(res_val, str) else res_val
            elif hasattr(result_message, 'error'):
                err_msg = result_message.error.message
                print(f"  [_arun:{self.name}] MCP Tool Error: {err_msg}")
                # For an agent, returning the error is usually easier to handle than raising
                return f"Tool Error: {err_msg}"
            else:
                # Dump the full response object to help diagnose the problem
                print(f"  [_arun:{self.name}] Unknown MCP response format. Full response object: {result_message}")
                print(f"  [_arun:{self.name}] Response type: {type(result_message)}")
                print(f"  [_arun:{self.name}] Response dir: {dir(result_message)}")
                # Try to extract more information
                response_details = ""
                for attr in dir(result_message):
                    if not attr.startswith('_'):
                        try:
                            value = getattr(result_message, attr)
                            if not callable(value):
                                response_details += f"\n  - {attr}: {value}"
                        except Exception as attr_err:
                            response_details += f"\n  - {attr}: [Error accessing: {attr_err}]"
                print(f"  [_arun:{self.name}] Response details: {response_details}")
                return f"Unknown response from MCP tool {self.name}. Details: {response_details}"
        except asyncio.TimeoutError:
            print(f"  [_arun:{self.name}] MCP call timeout.")
            return f"Error: Timeout calling MCP tool {self.name}."
        except Exception as e:
            print(f"  [_arun:{self.name}] Unexpected error during MCP call: {e}")
            print(traceback.format_exc())
            # Return the traceback in the error string to ease debugging
            return f"Unexpected Error calling {self.name}: {e}\n{traceback.format_exc()}"

    def _run(self, **kwargs) -> str:
        """Sync execution (simple implementation that defers to the async method)."""
        print(f"  [_run:{self.name}] Running async method via asyncio.run()...")
        try:
            # Note: calling asyncio.run inside an already-running event loop raises.
            # A better approach is to check the current loop or use anyio/nest_asyncio,
            # but to satisfy BaseTool we keep it simple; agents that only use the async
            # path are unaffected. If an agent forces the sync path, more elaborate
            # handling is needed.
            # return asyncio.run(self._arun(**kwargs))
            # The safer option is to signal that sync execution is unsupported:
            return "Synchronous execution not fully supported, please use async."
        except Exception as e:
            print(f"  [_run:{self.name}] Error: {e}")
            return f"Error in sync wrapper: {e}"
# ---
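# A minimal alternative sketch (an assumption, not part of the original test):
# _run could detect a running loop via asyncio.get_running_loop(), which raises
# RuntimeError when no loop is active, and only then fall back to asyncio.run():
#
#   def _run(self, **kwargs) -> str:
#       try:
#           asyncio.get_running_loop()
#       except RuntimeError:
#           return asyncio.run(self._arun(**kwargs))
#       return "Sync execution inside a running event loop is unsupported; use async."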
# --- Main test logic ---
async def run_fetch_test():
    """Run the fetch server test (BaseTool subclass method)."""
    print(f"\n=== Running Fetch Server Test (BaseTool Subclass Method) ===")
    # Check dependencies and schema definitions
    if not FETCH_SCHEMA_AVAILABLE:
        print("ERROR: FetchInputSchema not available."); return False
    if not CALL_TOOL_REQ_AVAILABLE:
        print("ERROR: CallToolRequest unavailable."); return False

    # Load the config
    config: Optional[MCPConfig] = None
    try:
        all_configs = load_config(CENTRAL_CONFIG_PATH)
        config = all_configs.get(SERVER_KEY_TO_TEST)
        if not config:
            print(f"ERROR: Config key '{SERVER_KEY_TO_TEST}' not found in '{CENTRAL_CONFIG_PATH}'."); return False
        if not isinstance(config.connection, StdioConfig):
            print("ERROR: Config connection is not STDIO."); return False
        print(f"Successfully loaded config for '{SERVER_KEY_TO_TEST}'.")
    except Exception as e_load:
        print(f"ERROR loading config: {e_load}"); return False

    # Get the LLM
    try:
        model = llm_manager.get_model(LLM_ID_FOR_TESTING)
        print(f"Using LLM: {getattr(model, 'model_name', LLM_ID_FOR_TESTING)}")
    except ValueError as e:
        print(f"Error getting LLM: {e}."); return False

    test_success = False
    # Connect with MCPClient (it starts the server according to the config)
    async with MCPClient(config) as client:
        print("\nMCPClient context entered.")
        if not client.session:
            print("ERROR: MCP session not established!"); return False

        # --- Instantiate our MCPToolRunner ---
        try:
            print(f"Instantiating MCPToolRunner for '{TOOL_NAME_TO_TEST}'...")
            mcp_tool_instance = MCPToolRunner(
                client=client,  # inject the client
                name=TOOL_NAME_TO_TEST,
                description=TOOL_DESCRIPTION,
                args_schema=CORRECT_SCHEMA_FOR_TOOL
            )
            tools = [mcp_tool_instance]
            print("Tool instance created successfully.")
        except Exception as e_inst:
            print(f"ERROR instantiating MCPToolRunner: {e_inst}"); return False
        # ---

        # --- Agent execution ---
        agent = create_react_agent(model, tools)  # the agent uses this standard tool
        query = "Use the fetch tool to get the main content (first 2000 chars) from https://developer.mozilla.org/en-US/docs/Web/HTML"
        print(f"\nRunning Agent Query...")
        print(f"Query: {query}")
        print("--- NOTE: Enable LangSmith for detailed tracing! ---")
        try:
            response = await asyncio.wait_for(
                agent.ainvoke({"messages": [{"role": "user", "content": query}]}),
                timeout=180.0
            )
            print(f"\nAgent Final Response:")
            if response and "messages" in response and response["messages"]:
                response_content = response["messages"][-1].content
                print(response_content)
                # Check that content was fetched and no error was reported
                contains_error = (
                    "error" in response_content.lower()
                    or "fail" in response_content.lower()
                    or "issue" in response_content.lower()
                    or "apologi" in response_content.lower()
                    or "unable" in response_content.lower()
                    or "tool error" in response_content.lower()
                )
                contains_expected = "HTML" in response_content
                if not contains_error and contains_expected:
                    print(f"\n✅ Test PASS: Agent successfully used tool and got expected content.")
                    test_success = True
                else:
                    print(f"\n❌ Test FAIL: Agent reported error or didn't get expected content.")
                    test_success = False
            else:
                print("Agent returned no valid response."); test_success = False
        except asyncio.TimeoutError:
            print("Agent execution timed out"); test_success = False
        except Exception as e:
            print(f"Agent execution failed: {e}")
            print(f"Traceback:\n{traceback.format_exc()}")
            test_success = False
        # ---
    # `async with` calls client.close() automatically
    print(f"\n--- Fetch Server Test Result: {'PASS' if test_success else 'FAIL'} ---")
    return test_success


async def run_everything_test():
    """Run the Everything MCP server test (BaseTool subclass method)."""
    print(f"\n=== Running Everything MCP Server Test (BaseTool Subclass Method) ===")
    # Check dependencies and schema definitions
    if not ECHO_SCHEMA_AVAILABLE:
        print("ERROR: EchoInputSchema not available."); return False
    if not ADD_SCHEMA_AVAILABLE:
        print("ERROR: AddInputSchema not available."); return False
    if not CALL_TOOL_REQ_AVAILABLE:
        print("ERROR: CallToolRequest unavailable."); return False

    # Load the config
    config: Optional[MCPConfig] = None
    try:
        all_configs = load_config(CENTRAL_CONFIG_PATH)
        config = all_configs.get(EVERYTHING_SERVER_KEY)
        if not config:
            print(f"ERROR: Config key '{EVERYTHING_SERVER_KEY}' not found in '{CENTRAL_CONFIG_PATH}'."); return False
        if not isinstance(config.connection, StdioConfig):
            print("ERROR: Config connection is not STDIO."); return False
        print(f"Successfully loaded config for '{EVERYTHING_SERVER_KEY}'.")
    except Exception as e_load:
        print(f"ERROR loading config: {e_load}"); return False

    # Get the LLM
    try:
        model = llm_manager.get_model(LLM_ID_FOR_TESTING)
        print(f"Using LLM: {getattr(model, 'model_name', LLM_ID_FOR_TESTING)}")
    except ValueError as e:
        print(f"Error getting LLM: {e}."); return False

    test_success = False
    # Connect with MCPClient (it starts the server according to the config)
    async with MCPClient(config) as client:
        print("\nMCPClient context entered for Everything MCP.")
        if not client.session:
            print("ERROR: MCP session not established!"); return False

        # --- Instantiate MCPToolRunner instances for the echo and add tools ---
        try:
            print(f"Instantiating MCPToolRunner for '{EVERYTHING_ECHO_TOOL}'...")
            echo_tool = MCPToolRunner(
                client=client,  # inject the client
                name=EVERYTHING_ECHO_TOOL,
                description="Echoes back the input message",
                args_schema=EchoInputSchema
            )
            print(f"Instantiating MCPToolRunner for '{EVERYTHING_ADD_TOOL}'...")
            add_tool = MCPToolRunner(
                client=client,  # inject the client
                name=EVERYTHING_ADD_TOOL,
                description="Adds two numbers together",
                args_schema=AddInputSchema
            )
            tools = [echo_tool, add_tool]
            print("Tool instances created successfully.")
        except Exception as e_inst:
            print(f"ERROR instantiating MCPToolRunner: {e_inst}"); return False
        # ---

        # --- Agent execution ---
        agent = create_react_agent(model, tools)  # the agent uses these tools
        query = (
            "First, use the echo tool to echo back the message 'Hello from Everything MCP!'. "
            "Then, use the add tool to calculate 42 + 58."
        )
        print(f"\nRunning Agent Query...")
        print(f"Query: {query}")
        print("--- NOTE: Enable LangSmith for detailed tracing! ---")
        try:
            response = await asyncio.wait_for(
                agent.ainvoke({"messages": [{"role": "user", "content": query}]}),
                timeout=180.0
            )
            print(f"\nAgent Final Response:")
            if response and "messages" in response and response["messages"]:
                response_content = response["messages"][-1].content
                print(response_content)
                # Check that both tools succeeded and no error was reported
                contains_error = (
                    "error" in response_content.lower()
                    or "fail" in response_content.lower()
                    or "issue" in response_content.lower()
                    or "apologi" in response_content.lower()
                    or "unable" in response_content.lower()
                    or "tool error" in response_content.lower()
                )
                contains_echo = "Hello from Everything MCP!" in response_content
                contains_add = "100" in response_content
                if not contains_error and contains_echo and contains_add:
                    print(f"\n✅ Test PASS: Agent successfully used both tools and got expected content.")
                    test_success = True
                else:
                    print(f"\n❌ Test FAIL: Agent reported error or didn't get expected content.")
                    print(f"  - Contains error: {contains_error}")
                    print(f"  - Contains echo response: {contains_echo}")
                    print(f"  - Contains add result: {contains_add}")
                    test_success = False
            else:
                print("Agent returned no valid response."); test_success = False
        except asyncio.TimeoutError:
            print("Agent execution timed out"); test_success = False
        except Exception as e:
            print(f"Agent execution failed: {e}")
            print(f"Traceback:\n{traceback.format_exc()}")
            test_success = False
        # ---
    # `async with` calls client.close() automatically
    print(f"\n--- Everything MCP Server Test Result: {'PASS' if test_success else 'FAIL'} ---")
    return test_success


async def main():
    """Entry point -- run all tests."""
    print("Starting MCP Integration Tests...")
    # Run the fetch test
    fetch_success = await run_fetch_test()
    # Run the Everything MCP test
    everything_success = await run_everything_test()
    print("\n" + "=" * 20 + " FINAL TEST SUMMARY " + "=" * 20)
    print(f"  Fetch Server Test:   {'PASS' if fetch_success else 'FAIL'}")
    print(f"  Everything MCP Test: {'PASS' if everything_success else 'FAIL'}")
    print("=" * 20 + " MCP Integration Test Finished " + "=" * 20)


if __name__ == "__main__":
    # Simplified dependency check
    print("--- Dependency Check ---")
    deps_ok = True
    try:
        import mcp; print("mcp available: True")
    except ImportError:
        print("mcp available: False"); deps_ok = False
    if CALL_TOOL_REQ_AVAILABLE:
        print("CallToolRequest available: True")
    else:
        print("CallToolRequest available: False"); deps_ok = False  # required
    try:
        import langgraph; print("langgraph available: True")
    except ImportError:
        print("langgraph available: False"); deps_ok = False
    try:
        import langchain_openai; print("langchain_openai available: True")
    except ImportError:
        print("langchain_openai available: False"); deps_ok = False
    try:
        import dotenv; print("dotenv available: True")
    except ImportError:
        print("dotenv available: False"); deps_ok = False
    try:
        import pydantic; print("pydantic available: True")
    except ImportError:
        print("pydantic available: False"); deps_ok = False
    try:
        from core.mcp.client import MCPClient; print("MCPClient available: True")
    except ImportError:
        print("MCPClient available: False"); deps_ok = False
    try:
        from core.mcp.config_loader import load_config; print("config_loader available: True")
    except ImportError:
        print("config_loader available: False"); deps_ok = False
    if not FETCH_SCHEMA_AVAILABLE:
        print("FetchInputSchema available: False"); deps_ok = False
    else:
        print("FetchInputSchema available: True")
    if not ECHO_SCHEMA_AVAILABLE:
        print("EchoInputSchema available: False"); deps_ok = False
    else:
        print("EchoInputSchema available: True")
    if not ADD_SCHEMA_AVAILABLE:
        print("AddInputSchema available: False"); deps_ok = False
    else:
        print("AddInputSchema available: True")
    print(f"------------------------")
    if not deps_ok:
        print("CRITICAL ERROR: Necessary dependencies missing.")
        sys.exit(1)
    asyncio.run(main())
print("EchoInputSchema available: False"); deps_ok=False else: print("EchoInputSchema available: True") if not ADD_SCHEMA_AVAILABLE: print("AddInputSchema available: False"); deps_ok=False else: print("AddInputSchema available: True") print(f"------------------------") if not deps_ok: print("CRITICAL ERROR: Necessary dependencies missing.") sys.exit(1) asyncio.run(main()) ================================================ FILE: examples/16_google_a2a/README.md ================================================ # LangGraph Agent 与 A2A 协议集成框架 ## 概述 本项目提供了一个将 **LangGraph Agent**(特别是基于 ReAct 模式并能调用工具的 Agent)与 **A2A (Agent-to-Agent) 协议** 相集成的框架和示例。目标是展示如何将一个用 LangGraph 构建的复杂 Agent 能力,通过标准化的 A2A 接口暴露给外部客户端或其他 Agent。 此框架的核心在于 `AgentTaskManager`,它充当了 A2A 协议层与具体 Agent 实现之间的桥梁。项目包含了一个完整的端到端示例,其中 `CurrencyAgent`(使用 `create_react_agent` 构建,并带有计算器和搜索工具)通过 `A2AServer` 提供服务,并提供了两个不同的客户端示例 (`client_example.py` 和 `currency_agent_test.py`) 来演示如何与之交互。 关键技术栈包括: * **A2A 协议:** 定义交互规范。 * **LangGraph:** 用于构建具备状态管理和工具调用能力的 Agent。 * **`create_react_agent`:** LangGraph 提供的预构建 ReAct Agent 实现(作为示例)。 * **Pydantic:** 用于定义和验证 A2A 协议中的数据结构 (`core/a2a/types.py`)。 * **Starlette/Uvicorn:** 作为底层 Web 框架运行 A2A 服务器 (`core/a2a/server/server.py`)。 * **OpenAI API:** 作为 LangGraph Agent 使用的后端大语言模型(可替换)。 ## 特性 * **A2A 协议兼容:** 提供符合 A2A 规范的服务端点 (`/.well-known/agent.json` 和主任务端点)。 * **LangGraph Agent 集成:** 可将任意(满足特定接口要求的)LangGraph Agent 作为 A2A 服务的核心处理逻辑。 * **工具使用:** 集成的 Agent 能够根据需要调用外部工具(示例中为计算器和搜索)。 * **同步任务处理:** 支持客户端发送任务并等待最终结果。 * **流式基础:** 包含了处理流式请求和响应的框架(Agent 端流式逻辑需开发者实现)。 * **类型安全:** 使用 Pydantic 进行严格的数据校验。 * **环境配置:** 支持通过 `.env` 文件配置 API 密钥等敏感信息。 * **客户端示例:** 提供了基础和场景化的客户端示例代码。 ## 目录结构 ``` . ├── core/ # 核心 A2A 协议实现 │ └── a2a/ │ ├── client/ │ │ └── client.py # A2AClient 客户端库实现 │ ├── server/ │ │ ├── server.py # A2AServer HTTP 服务器实现 │ │ └── task_manager.py # TaskManager 基础接口 (被 AgentTaskManager 使用) │ ├── agent_task_manager.py # AgentTaskManager 实现 (连接 A2A 与 LangGraph) │ └── types.py # A2A 协议的 Pydantic 模型定义 ├── examples/ # 示例代码 │ └── a2a/ │ ├── langgraph_integration.py # 服务端设置和示例 LangGraph Agent (CurrencyAgent) 定义 │ ├── client_example.py # 基础 A2A 客户端使用示例脚本 │ └── currency_agent_test.py # 场景化 A2A 客户端测试脚本 ├── .env # 存储环境变量 (例如 OPENAI_API_KEY) - *需要自行创建* ├── requirements.txt # Python 依赖项列表 (假设存在) └── README.md # 本文档 ``` ## 核心组件说明 * **`core/a2a/types.py`:** 定义所有 A2A 数据结构,是协议的基础和校验依据。 * **`core/a2a/server/server.py` (`A2AServer`):** 基于 Starlette 的 HTTP 服务器,处理 A2A JSON-RPC 请求路由,将请求交给 `AgentTaskManager`。通过 `.start()` 方法启动。 * **`core/a2a/agent_task_manager.py` (`AgentTaskManager`):** **核心适配器**。连接 A2A 层和 Agent 层。它接收来自 `A2AServer` 的请求,管理任务状态,并调用注入的 Agent 实例的 `invoke` 或 `stream` 方法。 * **`examples/a2a/langgraph_integration.py`:** 包含 `CurrencyAgent` (使用 `create_react_agent` 的示例 Agent) 的定义,以及如何配置和启动 `A2AServer` 来运行这个 Agent 的完整脚本。 * **`core/a2a/client/client.py` (`A2AClient`):** 基础 A2A 客户端库。 * **`examples/a2a/client_example.py`:** 一个简单的脚本,演示如何使用 `A2AClient` 发送基本请求。 * **`examples/a2a/currency_agent_test.py`:** 一个更复杂的客户端脚本,包含多个测试场景,用于测试服务器端 Agent 的不同交互模式。 ## 先决条件 * Python (推荐 3.10 或更高版本) * `pip` (Python 包安装器) * 虚拟环境 (强烈推荐) * 大语言模型 API Key (例如 OpenAI API Key) ## 安装与设置 1. **克隆仓库:** ```bash git clone cd ``` 2. **创建并激活虚拟环境:** ```bash uv venv source .venv/bin/activate ``` 3. **安装依赖项:** ```bash uv sync ``` 4. **设置环境变量:** * 在项目根目录下创建 `.env` 文件。 * 添加所需的 API Key,例如: ```dotenv OPENAI_API_KEY="sk-..." ``` ## 运行示例 1. **启动 A2A 服务器:** * 在终端中,激活虚拟环境后运行: ```bash python -m examples.a2a.langgraph_integration ``` * 服务器将在 `http://127.0.0.1:8000` 启动并监听。 2. 
## Prerequisites

* Python (3.10 or later recommended)
* `pip` (the Python package installer)
* A virtual environment (strongly recommended)
* An LLM API key (e.g. an OpenAI API key)

## Installation and Setup

1. **Clone the repository:**
   ```bash
   git clone <repository-url>
   cd <repository-directory>
   ```

2. **Create and activate a virtual environment:**
   ```bash
   uv venv
   source .venv/bin/activate
   ```

3. **Install the dependencies:**
   ```bash
   uv sync
   ```

4. **Set the environment variables:**
   * Create a `.env` file in the project root.
   * Add the required API keys, for example:
     ```dotenv
     OPENAI_API_KEY="sk-..."
     ```

## Running the Examples

1. **Start the A2A server:**
   * In a terminal with the virtual environment activated, run:
     ```bash
     python -m examples.a2a.langgraph_integration
     ```
   * The server starts and listens on `http://127.0.0.1:8000`.

2. **Run an A2A client:**
   * Open a **new** terminal and activate the virtual environment.
   * Run either client example:
     * **Basic example:**
       ```bash
       python -m examples.a2a.client_example
       ```
     * **Scenario-based tests:**
       ```bash
       python -m examples.a2a.currency_agent_test
       ```

3. **Expected output:**
   * The **server terminal** logs incoming requests, LLM calls, and tool invocations (when triggered).
   * The **client terminal** shows tasks being sent, status polling (for synchronous tasks), and the received results or (simulated) streaming events. `currency_agent_test.py` prints results per scenario.

---

## **Important: Guide to Integrating a New LangGraph Agent**

If you have built a new LangGraph-based agent and want to plug it into this A2A framework, follow these steps and conventions:

### 1. The interface your agent class must implement

Your new agent class (say `MyNewAgent`) will be called by `AgentTaskManager`. It **must** therefore implement the following methods and attributes:

* **`__init__(self, llm, ...)`:**
  * The constructor; initializes whatever the agent needs, such as the LLM instance and the tool list.
  * **Key point:** build or obtain your LangGraph **Runnable** here (e.g. via `create_react_agent` or a hand-built `StateGraph().compile()`) and store it on the instance (e.g. `self.agent_runnable`).
* **`invoke(self, query: str, session_id: Optional[str] = None) -> str`:**
  * Handles synchronous A2A `tasks/send` requests.
  * Receives the plain-text user query `query` (and optional `session_id`) from `AgentTaskManager`.
  * **Internally it should:**
    * Wrap `query` in the input format your LangGraph Runnable expects. For agents built on `create_react_agent`, or anything message-list based, that is usually `{"messages": [("user", query)]}`. Include the `session_id` if your agent needs it.
    * Call the Runnable's `.invoke()` with that input dict.
    * Parse the result dict. For a ReAct agent the final text answer usually sits in the content of the last message of the `messages` list; write the logic to extract it.
  * **Return value:** **must** be a **string** containing the final answer.
* **`stream(self, query: str, session_id: Optional[str] = None) -> AsyncIterable[Dict[str, Any]]`:**
  * Handles streaming A2A `tasks/sendSubscribe` requests.
  * Receives `query` and `session_id`.
  * **Must** be an **async generator** (`async def` containing `yield`).
  * **Internally it should:**
    * Prepare the input for the Runnable's streaming call (usually the same shape as for `invoke`, e.g. `{"messages": [("user", query)]}`).
    * Call a streaming method on the Runnable, e.g. `self.agent_runnable.astream(...)` or `self.agent_runnable.astream_log(...)`.
    * Iterate with `async for chunk in ...:` over the streamed chunks.
    * **Parse each `chunk`**: the chunk format depends on the method you call (`astream` vs `astream_log`) and on the graph's structure. Parse the chunks (state updates, log patches, ...) to extract meaningful intermediate or final content.
    * **`yield` dicts in the expected shape**: for every update you want to push to the client, yield a dict with the following keys (consumed by `AgentTaskManager._run_streaming_agent`):
      * `"content"`: `str` -- the text produced by the current step.
      * `"is_task_complete"`: `bool` -- whether this is the final output / end signal of the task.
      * `"require_user_input"`: `bool` -- whether the task pauses and needs user input.
  * **Return value:** an async iterable (created automatically by `async def` + `yield`).
* **`SUPPORTED_CONTENT_TYPES: List[str]` (class attribute):**
  * The list of output content types the agent supports; for text-centric agents this is usually `["text"]`. `AgentTaskManager` uses it to validate the `acceptedOutputModes` requested by clients.
### 2. Keeping `AgentState` consistent

If you build the LangGraph graph by hand, the `AgentState` you define (and pass to `StateGraph`) must be consistent with how your `invoke` and `stream` methods handle input and output. In particular, if you rely on a `messages` list for conversation history or I/O, `AgentState` must define it accordingly.

### 3. Integration steps

1. **Create the agent class:**
   * Add a new Python file to your project (e.g. `my_new_agent.py`).
   * Define your agent class (e.g. `MyNewAgent`) and make sure it implements the `__init__`, `invoke`, and `stream` methods and the `SUPPORTED_CONTENT_TYPES` attribute described above.
   * Build or load your LangGraph Runnable inside `__init__`.
2. **Adapt the server startup script (e.g. `examples/a2a/langgraph_integration.py`):**
   * **Import** your new agent class: `from my_new_agent import MyNewAgent`.
   * **Instantiate** it: `my_agent = MyNewAgent(llm)` (pass whatever dependencies it needs, such as `llm`).
   * **Update the `AgentCard`**: adjust `name`, `description`, and the `skills` list to reflect the new agent. Make sure each `AgentSkill` has a unique `id` and the right `name`.
   * **Instantiate `AgentTaskManager`** with your agent instance: `task_manager = AgentTaskManager(my_agent)`.
   * **Instantiate `A2AServer`** with the updated `agent_card` and `task_manager`.
3. **Run the server:**
   * Start the adapted script: `python -m examples.a2a.your_server_script`.
4. **Test:**
   * Use `client_example.py` or `currency_agent_test.py` (you may need to adjust the query or the `skill_name` in the `metadata`) to send requests to the new server and verify that your agent works over the A2A protocol.

### Example Agent Skeleton

```python
# my_new_agent.py
import asyncio
import logging
from typing import List, Optional, AsyncIterable, Dict, Any, Tuple, TypedDict

from langchain_core.language_models import BaseChatModel  # example LLM type
from langgraph.graph.state import StateGraph  # if building the graph by hand
# from langgraph.prebuilt import create_some_agent  # if using a prebuilt agent

logger = logging.getLogger(__name__)


# 1. Define the state your agent uses (if needed)
class MyAgentState(TypedDict):
    messages: List[Tuple[str, str]]
    # ... other state fields


class MyNewAgent:
    SUPPORTED_CONTENT_TYPES: List[str] = ["text"]

    def __init__(self, llm: BaseChatModel):
        self.llm = llm
        # TODO: build or load your LangGraph Runnable here,
        # e.g.: self.agent_runnable = self._build_my_graph()
        # or:   self.agent_runnable = create_some_agent(llm, tools)
        self.agent_runnable = self._get_placeholder_runnable()  # example
        logger.info("MyNewAgent initialized.")

    def _get_placeholder_runnable(self):
        # A mock Runnable -- replace it with a real LangGraph Runnable
        class PlaceholderRunnable:
            def invoke(self, input_dict):
                logger.info(f"PlaceholderRunnable received invoke: {input_dict}")
                query = input_dict.get("messages", [("", "")])[-1][1]
                return {"messages": [("assistant", f"Mock reply to '{query}'")]}

            async def astream(self, input_dict):
                logger.info(f"PlaceholderRunnable received astream: {input_dict}")
                query = input_dict.get("messages", [("", "")])[-1][1]
                yield {"messages": [("assistant", f"Mock stream chunk 1 for '{query}' ...")]}
                await asyncio.sleep(0.5)
                yield {"messages": [("assistant", f"Mock stream chunk 2 for '{query}' -- done.")]}

        return PlaceholderRunnable()

    # def _build_my_graph(self):
    #     # Implement this if you build the graph by hand
    #     # workflow = StateGraph(MyAgentState)
    #     # ... add nodes, edges ...
    #     # return workflow.compile()
    #     pass

    def invoke(self, query: str, session_id: Optional[str] = None) -> str:
        logger.debug(f"[MyNewAgent.invoke] query: '{query}', session_id: '{session_id}'")
        # 1. Prepare the input
        invoke_input = {"messages": [("user", query)]}
        # 2. Call the Runnable
        try:
            result = self.agent_runnable.invoke(invoke_input)
            logger.debug(f"[MyNewAgent.invoke] Runnable result: {result}")
            # 3. Parse the result
            final_output = "Error: could not parse the agent response."
            if isinstance(result, dict) and isinstance(result.get("messages"), list) and result["messages"]:
                last_message = result["messages"][-1]
                if isinstance(last_message, tuple) and len(last_message) == 2:
                    final_output = last_message[1]
                elif hasattr(last_message, 'content'):
                    final_output = last_message.content
            return str(final_output)
        except Exception as e:
            logger.error(f"[MyNewAgent.invoke] Error: {e}", exc_info=True)
            raise  # re-raise so the TaskManager can handle it
    async def stream(self, query: str, session_id: Optional[str] = None) -> AsyncIterable[Dict[str, Any]]:
        logger.debug(f"[MyNewAgent.stream] query: '{query}', session_id: '{session_id}'")
        # 1. Prepare the input
        stream_input = {"messages": [("user", query)]}
        # 2. Call the Runnable's streaming method
        try:
            # use astream or astream_log
            async for chunk in self.agent_runnable.astream(stream_input):
                logger.debug(f"[MyNewAgent.stream] Received chunk: {chunk}")
                # 3. Parse the chunk and yield a dict in the expected shape.
                # The parsing logic depends heavily on your graph and streaming method;
                # extract content, is_task_complete, require_user_input from the actual chunk.

                # --- a **highly simplified** example parser ---
                content_to_yield = ""
                is_complete = False        # decide from the chunk whether the task is really done
                is_input_required = False  # decide from the chunk whether input is needed

                # Try to pull the latest 'messages' content out of the chunk
                if isinstance(chunk, dict) and isinstance(chunk.get("messages"), list) and chunk["messages"]:
                    last_message = chunk["messages"][-1]
                    if isinstance(last_message, tuple) and len(last_message) == 2:
                        content_to_yield = last_message[1]
                    elif hasattr(last_message, 'content'):
                        content_to_yield = last_message.content

                if content_to_yield:  # only yield when there is content
                    # In a real implementation you need more robust logic for is_task_complete,
                    # e.g. checking whether the graph reached the END node or a specific final node state.
                    yield {
                        "content": content_to_yield,
                        "is_task_complete": is_complete,          # must be set correctly
                        "require_user_input": is_input_required   # must be set correctly
                    }
                # --- end of the simplified example ---

            # **Important**: after the loop, if the task did finish, yield one final update
            # (unless the last yield above already had is_task_complete=True), e.g.:
            # final_result = await self.agent_runnable.ainvoke(stream_input)  # may need one more invoke for the final state
            # final_text = ...  # parse the final text
            # yield {"content": final_text, "is_task_complete": True, "require_user_input": False}
        except Exception as e:
            logger.error(f"[MyNewAgent.stream] Error: {e}", exc_info=True)
            # Raising inside the stream can break the SSE connection; yielding an error is an option:
            yield {
                "content": f"Error while handling the streaming request: {e}",
                "is_task_complete": True,  # mark the task as failed and finished
                "require_user_input": False
            }
```

## Current Status and Limitations

* Synchronous task execution, including LLM and tool calls from the LangGraph agent, is implemented and verified.
* The A2A server and client infrastructure is in place.
* **Agent-side streaming (`CurrencyAgent.stream`) is currently simulated** and does not call LangGraph's streaming interface; real streaming updates are not implemented yet.
* The current agent implementation (`CurrencyAgent`) does not support multi-turn clarification that requires state across requests.
* Error handling could be further improved.
* Task storage is in-memory only (`InMemoryTaskManager`).

## Future Directions

* **Real streaming output:** implement `stream` in the agent class per the guide above, calling LangGraph's `astream` or `astream_log` and yielding dicts in the A2A shape.
* **Multi-turn conversations:** change `AgentState` to accumulate message history (e.g. `Annotated[List[BaseMessage], operator.add]`) and adapt the agent's `invoke` and `stream` methods to use that history; the agent may also need to return an `input-required` state. A minimal sketch of such a state follows below.
* **Better error handling:** more detailed, user-friendly reporting for network problems, agent execution errors, tool call failures, and validation errors.
* **Persistent task storage:** replace `InMemoryTaskManager`.
* **Configuration management:** externalize the configuration.
* **Multi-skill support:** add routing logic.
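As a concrete illustration of the multi-turn direction above, a message-accumulating state could look like this (a minimal sketch following the `Annotated`/`operator.add` suggestion; not yet wired into `CurrencyAgent`):

```python
import operator
from typing import Annotated, List, TypedDict

from langchain_core.messages import BaseMessage


class MultiTurnAgentState(TypedDict):
    # operator.add makes LangGraph append new messages instead of replacing them
    messages: Annotated[List[BaseMessage], operator.add]
```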
================================================
FILE: examples/16_google_a2a/__init__.py
================================================
# examples/a2a/__init__.py
"""
A2A protocol + LangGraph integration examples

This directory contains examples and documentation for integrating the A2A
protocol with LangGraph agents.
"""


================================================
FILE: examples/16_google_a2a/agent_task_manager_test.py
================================================
# examples/a2a/agent_task_manager_test.py
import os
import sys
import asyncio
import logging
from typing import TypedDict, Any, List, Optional, Tuple

# Add the project root to sys.path
sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))

# Load environment variables
from dotenv import load_dotenv
load_dotenv()

# A2A components
from core.a2a.types import (
    TaskState, TaskStatus, Task, Artifact, Message,
    SendTaskRequest, SendTaskResponse, SendTaskStreamingRequest,
    TaskSendParams, JSONRPCResponse
)
from core.a2a.agent_task_manager import AgentTaskManager

# LangChain / LLM components
from langchain_core.tools import tool
from langchain_openai import ChatOpenAI
from langgraph.graph import END, StateGraph
from langgraph.prebuilt import create_react_agent

# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)


# Define a couple of simple tools
@tool
def search(query: str) -> str:
    """Search the internet for information."""
    return f"These are the search results for '{query}'."


@tool
def calculator(expression: str) -> str:
    """Evaluate a math expression."""
    try:
        result = eval(expression)
        return f"Result: {result}"
    except Exception as e:
        return f"Calculation error: {e}"


# A simple LangGraph agent state
class AgentState(TypedDict):
    messages: List[Tuple[str, str]]
    session_id: Optional[str]  # keep session_id


class TestAgent:
    """Agent used by the tests."""

    # Supported content types
    SUPPORTED_CONTENT_TYPES = ["text"]

    def __init__(self, llm=None):
        if llm is None:
            try:
                llm = ChatOpenAI(model="gpt-4o-mini")
            except Exception as e:
                print(f"Warning: could not create the OpenAI LLM ({e}); falling back to mock mode")
                from langchain.llms.fake import FakeListLLM
                llm = FakeListLLM(responses=["This is a mocked LLM response"])
        self.tools = [search, calculator]
        self.agent = create_react_agent(llm, self.tools)
        self.graph = self._build_graph()

    def _build_graph(self):
        """Build the agent's workflow graph."""
        workflow = StateGraph(AgentState)
        workflow.add_node("agent", self.agent)
        workflow.set_entry_point("agent")
        workflow.add_edge("agent", END)
        return workflow.compile()

    def invoke(self, query: str, session_id: str = None) -> str:
        """Call the agent synchronously."""
        # The compiled graph uses the `messages`-based AgentState, so wrap the
        # query as a message and read the final answer back out of the last message.
        result = self.graph.invoke({"messages": [("user", query)], "session_id": session_id})
        last_message = result["messages"][-1]
        return last_message.content if hasattr(last_message, "content") else str(last_message[1])

    async def stream(self, query: str, session_id: str = None):
        """Call the agent in streaming mode (simulated)."""
        # Simulated streaming output
        chunks = [
            "Processing your request...",
            "Searching for relevant information...",
            "Found some results, organizing them...",
            f"Here is the information about '{query}': this is a simulated streaming response."
        ]
        for i, chunk in enumerate(chunks):
            is_last = i == len(chunks) - 1
            yield {
                "content": chunk,
                "is_task_complete": is_last,
                "require_user_input": False
            }
            await asyncio.sleep(0.5)  # simulate latency


# Test the AgentTaskManager's synchronous task handling
async def test_sync_task():
    print("\n=== Testing synchronous task handling ===\n")
    # Create the agent and the AgentTaskManager
    agent = TestAgent()
    task_manager = AgentTaskManager(agent)

    # Build the task request
    task_id = "test_sync_task_1"
    session_id = "test_session_1"
    content = [{"type": "text", "text": "Compute 123 + 456"}]
    task_params = TaskSendParams(
        id=task_id,
        sessionId=session_id,
        message=Message(role="user", parts=content),
        acceptedOutputModes=["text"],
        historyLength=10
    )
    request = SendTaskRequest(id="req1", params=task_params)

    # Send the task
    response = await task_manager.on_send_task(request)

    # Print the result
    print(f"Task ID: {task_id}")
    print(f"Response type: {type(response)}")
    if hasattr(response, "error") and response.error:
        print(f"Error: {response.error}")
    else:
        print("Task completed successfully")

    # Fetch the task
    task = task_manager.tasks.get(task_id)
    if task:
        print(f"Task state: {task.status.state}")
        if task.artifacts:
            for artifact in task.artifacts:
                for part in artifact.parts:
                    if part.get("type") == "text":
                        print(f"Task result: {part.get('text')}")


# Test the AgentTaskManager's streaming task handling
async def test_streaming_task():
    print("\n=== Testing streaming task handling ===\n")
    # Create the agent and the AgentTaskManager
    agent = TestAgent()
    task_manager = AgentTaskManager(agent)

    # Build the task request
    task_id = "test_stream_task_1"
    session_id = "test_session_1"
    content = [{"type": "text", "text": "Search for information about artificial intelligence"}]
    task_params = TaskSendParams(
        id=task_id,
        sessionId=session_id,
        message=Message(role="user", parts=content),
        acceptedOutputModes=["text"],
        historyLength=10
    )
    request = SendTaskStreamingRequest(id="req2", params=task_params)

    # Send the streaming task
    response_generator = await task_manager.on_send_task_subscribe(request)

    # Check the response type
    if isinstance(response_generator, JSONRPCResponse):
        print(f"Error: {response_generator.error}")
        return

    # Consume the streaming responses
    print("Receiving streaming responses:")
    async for response in response_generator:
        if hasattr(response, "error") and response.error:
            print(f"Streaming response error: {response.error}")
        else:
            result = response.result
            if hasattr(result, "status") and result.status and result.status.message:
                for part in result.status.message.parts:
                    # Access the part's `type` and `text` attributes directly
                    if hasattr(part, 'type') and part.type == "text":
                        text_content = getattr(part, 'text', '')  # read text safely
                        print(f"Streaming update: {text_content}")
{text_content}") # --- 修改结束 --- if hasattr(result, "artifact") and result.artifact: for part in result.artifact.parts: # --- 修改开始 --- # 直接访问对象的属性 type 和 text if hasattr(part, 'type') and part.type == "text": text_content = getattr(part, 'text', '') # 安全获取 text print(f"流式结果: {text_content}") # --- 修改结束 --- if hasattr(result, "final") and result.final: print("流式响应结束") # 主函数 async def main(): print("=== AgentTaskManager 测试 ===\n") # 测试同步任务 await test_sync_task() # 测试流式任务 await test_streaming_task() # 运行测试 if __name__ == "__main__": asyncio.run(main()) ================================================ FILE: examples/16_google_a2a/client_example.py ================================================ # examples/a2a/client_example.py import os import sys import asyncio import json import logging # 添加 logging from typing import Dict, Any, List, Optional from uuid import uuid4 # 用于生成示例 Task ID # 添加项目根目录到路径 sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))) # 导入环境变量 from dotenv import load_dotenv load_dotenv() # 导入A2A客户端和类型 from core.a2a.client.client import A2AClient # 导入 Message 和 TextPart 以构建请求,导入响应类型以进行类型提示 from core.a2a.types import ( Part, TextPart, Message, TaskState, # 添加 TaskState SendTaskResponse, GetTaskResponse, SendTaskStreamingResponse, Task, # 添加 Task JSONRPCError # 添加 JSONRPCError ) # 配置日志 logging.basicConfig(level=logging.INFO) # 可以改为 DEBUG 获取更详细客户端日志 logger = logging.getLogger(__name__) # 示例: 使用A2A客户端连接到A2A服务器 async def run_a2a_client(): print("\n=== 运行A2A客户端示例 ===\n") # 创建A2A客户端 client = A2AClient(url="http://127.0.0.1:8000") # 指向你的服务器地址 # 发送同步任务 await send_sync_task(client) # 发送流式任务 await send_streaming_task(client) # --- 修正发送同步任务 --- async def send_sync_task(client: A2AClient): print("\n=== 发送同步任务 ===\n") query = "请计算 123 + 456 的结果" task_id = "client_sync_" + uuid4().hex # 生成一个唯一的任务 ID try: # 1. 构建 Message 对象 message = Message(role="user", parts=[TextPart(text=query)]) # 2. 构建 TaskSendParams 对应的 payload 字典 (添加 id) payload_dict = { "id": task_id, # --- 添加必需的 id 字段 --- "sessionId": "client_session_sync_1", "message": message.model_dump(), "acceptedOutputModes": ["text"], "metadata": {"skill_name": "react_query"} } logger.debug(f"Sending sync task with payload: {payload_dict}") # 3. 调用 send_task,传入 payload 字典 response: SendTaskResponse = await client.send_task(payload=payload_dict) logger.debug(f"Send task response: {response}") # 4. 处理响应 if response.error: # 类型提示帮助访问属性 error: JSONRPCError = response.error print(f"发送任务时出错: Code={error.code}, Message={error.message}") return # SendTaskResponse 的 result 是 Task 对象或 None if not response.result: print(f"发送任务成功,但响应中未包含任务详情: {response}") # 我们可以继续使用我们发送的 task_id 来查询状态 elif response.result.id != task_id: # 理论上服务器应该使用或确认客户端提供的 ID logger.warning(f"服务器返回的任务ID '{response.result.id}' 与客户端发送的ID '{task_id}' 不匹配。") task_id = response.result.id # 以服务器返回的为准(如果存在) print(f"任务已发送,ID: {task_id}") # --- 轮询等待任务完成 --- print("等待任务完成...") task_result: Optional[Task] = None # 用于存储最终的任务对象 for attempt in range(10): # 最多尝试 10 次 await asyncio.sleep(2) # 等待 2 秒 # 5. 构建 get_task 的 payload get_payload = {"id": task_id} logger.debug(f"Getting task with payload: {get_payload} (Attempt {attempt+1})") # 6. 
            # 6. Fetch the task (pass the payload dict)
            get_response: GetTaskResponse = await client.get_task(payload=get_payload)
            logger.debug(f"Get task response: {get_response}")
            if get_response.error:
                error: JSONRPCError = get_response.error
                print(f"Error getting the task: Code={error.code}, Message={error.message}")
                return  # stop polling on error
            if not get_response.result:
                print(f"get_task succeeded but returned no task details: {get_response}")
                continue  # keep polling
            task_result = get_response.result  # the Task object
            print(f"  Current task state: {task_result.status.state}")
            # Stop when the task completed, failed, was canceled, or needs input
            if task_result.status.state in [TaskState.COMPLETED, TaskState.FAILED, TaskState.CANCELED, TaskState.INPUT_REQUIRED]:
                break
        else:
            print("The task did not finish within the allotted time.")
            return

        # 7. Handle the final task result (via attribute access)
        if task_result.status.state == TaskState.COMPLETED and task_result.artifacts:
            print("Task completed successfully. Results:")
            for artifact in task_result.artifacts:
                if artifact.parts:
                    for part in artifact.parts:
                        if isinstance(part, TextPart):
                            print(f"  - {part.text}")
        elif task_result.status.state == TaskState.FAILED:
            error_msg = "Unknown error"
            if task_result.status.message and task_result.status.message.parts:
                # Assume the error text lives in the first TextPart
                if isinstance(task_result.status.message.parts[0], TextPart):
                    error_msg = task_result.status.message.parts[0].text
            print(f"Task failed: {error_msg}")
        else:
            print(f"Final task state: {task_result.status.state}")
    except Exception as e:
        logger.error(f"Exception while sending/handling the sync task: {e}", exc_info=True)
        print(f"Sending the sync task failed: {e}")


# --- Sending a streaming task (corrected) ---
async def send_streaming_task(client: A2AClient):
    print("\n=== Sending a streaming task ===\n")
    query = "Please search for the latest developments in artificial intelligence"
    task_id = "client_stream_" + uuid4().hex  # generate an ID for the streaming task
    try:
        # 1. Build the Message object
        message = Message(role="user", parts=[TextPart(text=query)])
        # 2. Build the payload dict matching TaskSendParams (including the required id)
        payload_dict = {
            "id": task_id,  # --- the required id field ---
            "sessionId": "client_session_stream_1",
            "message": message.model_dump(),
            "acceptedOutputModes": ["text"],
            "metadata": {"skill_name": "react_query"}
        }
        logger.debug(f"Sending streaming task with payload: {payload_dict}")
        print(f"Task sent, ID: {task_id}")  # for streaming tasks the ID is known upfront
        # 3. Call send_task_streaming (no await here); it returns an async generator
        event_stream_generator = client.send_task_streaming(payload=payload_dict)
        # 4. Consume the streaming events with async for
        print("Receiving streaming responses:")
        async for event_response in event_stream_generator:  # iterate the async generator correctly
            logger.debug(f"Received stream event: {event_response}")
            # Check the whole response for errors
            if event_response.error:
                error: JSONRPCError = event_response.error
                print(f"Error during streaming: Code={error.code}, Message={error.message}")
                continue  # or break
            # Extract the event payload
            event = event_response.result
            if not event:
                logger.warning("Received stream response with empty result.")
                continue
            # Handle message parts in status-update events
            if hasattr(event, "status") and event.status and event.status.message:
                if event.status.message.parts:
                    for part in event.status.message.parts:
                        if isinstance(part, TextPart):
                            print(f"  Streaming update: {part.text}")
            # Handle artifact-update events
            if hasattr(event, "artifact") and event.artifact:
                print("  Received artifact:")
                if event.artifact.parts:
                    for part in event.artifact.parts:
                        if isinstance(part, TextPart):
                            print(f"  Streaming result (TextPart): {part.text}")
            # Check the end-of-stream flag
            if hasattr(event, "final") and event.final:
                print("End-of-stream flag received.")
        print("Streaming task handled.")
    except Exception as e:
        logger.error(f"Exception while sending/handling the streaming task: {e}", exc_info=True)
        print(f"Sending the streaming task failed: {e}")


# Entry point
if __name__ == "__main__":
    # Run the top-level coroutine with asyncio.run
    asyncio.run(run_a2a_client())


================================================
FILE: examples/16_google_a2a/currency_agent_test.py
================================================
# examples/a2a/currency_agent_test.py
import os
import sys
import asyncio
import json
import logging
from typing import Dict, Any, List, Optional
from uuid import uuid4  # import uuid

# Add the project root to sys.path
sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))

# Load environment variables
from dotenv import load_dotenv
load_dotenv()

# A2A client and the types it needs
from core.a2a.client.client import A2AClient
from core.a2a.types import (
    Part, TextPart, Message,
    TaskState,
    SendTaskResponse, GetTaskResponse,
    Task,
    JSONRPCError,
    SendTaskStreamingResponse  # streaming response type
)

# Configure logging (switch to DEBUG for detailed logs)
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)


# Scenario 1: synchronous request -- currency-conversion/calculator query (corrected)
async def test_sync_currency_conversion(client: A2AClient):
    print("\n=== Scenario 1: synchronous request -- agent invocation (calculator) ===")
    # query = "How much is the exchange rate for 1 USD to INR?"  # this query would need the search tool
    query = "Compute 58 * 34"  # use the calculator tool to guarantee a result
    task_id = "test_sync_" + uuid4().hex  # client-generated task ID
    try:
        # 1. Build the Message object
        message = Message(role="user", parts=[TextPart(text=query)])
        # 2. Build the payload dict matching TaskSendParams
        payload_dict = {
            "id": task_id,
            "sessionId": "test_session_sync_1",
            "message": message.model_dump(),  # serialize to a dict
            "acceptedOutputModes": ["text"],
            "metadata": {"skill_name": "react_query"}  # must match the skill name/id in the AgentCard
        }
        logger.debug(f"Sending sync task with payload: {payload_dict}")
        # 3. Send the task with the payload dict
        response: SendTaskResponse = await client.send_task(payload=payload_dict)
        logger.debug(f"Send task response: {response}")
        # 4. Handle the response
        if response.error:
            error: JSONRPCError = response.error
            print(f"Error sending the task: Code={error.code}, Message={error.message}")
            return None
        if not response.result:
            print(f"Task sent, but no task details received: {response}")
            # keep polling with the task_id we sent
        elif response.result.id != task_id:
            logger.warning(f"Server-returned task ID '{response.result.id}' does not match the client-sent ID '{task_id}'.")
            task_id = response.result.id  # prefer the server's ID
        print(f"Task sent, ID: {task_id}")
        # 5. Poll until the task finishes
        print("Waiting for the task to complete...")
        task_result: Optional[Task] = None
        for attempt in range(10):
            await asyncio.sleep(2)
            get_payload = {"id": task_id}
            logger.debug(f"Getting task with payload: {get_payload} (Attempt {attempt+1})")
            get_response: GetTaskResponse = await client.get_task(payload=get_payload)
            logger.debug(f"Get task response: {get_response}")
            if get_response.error:
                error: JSONRPCError = get_response.error
                print(f"Error getting the task: Code={error.code}, Message={error.message}")
                return None
            if not get_response.result:
                print(f"get_task succeeded but returned no task details: {get_response}")
                continue
            task_result = get_response.result
            print(f"  Current task state: {task_result.status.state.value}")  # use .value for the enum value
            if task_result.status.state in [TaskState.COMPLETED, TaskState.FAILED, TaskState.CANCELED]:
                break
        else:
            print("The task did not finish within the allotted time.")
            return None

        # 6. Handle the final task result (attribute access)
        if task_result.status.state == TaskState.COMPLETED and task_result.artifacts:
            print("Task completed successfully. Results:")
            for artifact in task_result.artifacts:
                if artifact.parts:
                    for part in artifact.parts:
                        if isinstance(part, TextPart):  # check the type
                            print(f"  - {part.text}")  # access the attribute
        elif task_result.status.state == TaskState.FAILED:
            error_msg = "Unknown error"
            if task_result.status.message and task_result.status.message.parts:
                if isinstance(task_result.status.message.parts[0], TextPart):
                    error_msg = task_result.status.message.parts[0].text
            print(f"Task failed: {error_msg}")
        else:
            print(f"Final task state: {task_result.status.state.value}")
        return task_result
    except Exception as e:
        logger.error(f"Exception while handling the sync task: {e}", exc_info=True)
        print(f"Sending the sync task failed: {e}")
        return None


# Scenario 2: multi-turn conversation -- incomplete information (corrected, with known limitations)
async def test_multi_turn_conversation(client: A2AClient):
    print("\n=== Scenario 2: multi-turn conversation (the agent may not support it) ===")
    print("Note: the current server-side agent implementation may not support true multi-turn state.")
    # --- First turn ---
    session_id = "test_session_multi_" + uuid4().hex  # unique session ID for the conversation
    query1 = "How much is 100 US dollars?"  # deliberately omit the target currency
    task_id_1 = "test_multi_1_" + uuid4().hex
    try:
        print(f"\nFirst turn (Session: {session_id}): sending '{query1}'")
        # 1a. Build the Message and payload
        message1 = Message(role="user", parts=[TextPart(text=query1)])
        payload_dict1 = {
            "id": task_id_1,
            "sessionId": session_id,  # pass the session ID
            "message": message1.model_dump(),
            "acceptedOutputModes": ["text"],
            "metadata": {"skill_name": "react_query"}
        }
        logger.debug(f"Sending multi-turn task 1 with payload: {payload_dict1}")
        # 1b. Send the task
        response1: SendTaskResponse = await client.send_task(payload=payload_dict1)
        logger.debug(f"Send task 1 response: {response1}")
        if response1.error:
            error: JSONRPCError = response1.error
            print(f"Error sending the first-turn task: Code={error.code}, Message={error.message}")
            return None
        if response1.result:
            task_id_1 = response1.result.id  # use the server-confirmed ID
        print(f"First-turn task sent, ID: {task_id_1}")
        # 1c. Poll for the result
        print("Waiting for the first-turn response...")
        task1_result: Optional[Task] = None
        for attempt in range(5):  # fewer polling attempts here
            await asyncio.sleep(2)
            get_payload1 = {"id": task_id_1}
            get_response1: GetTaskResponse = await client.get_task(payload=get_payload1)
            if get_response1.result:
                task1_result = get_response1.result
                print(f"  Current task state: {task1_result.status.state.value}")
                if task1_result.status.state != TaskState.WORKING:
                    break
        else:
            print("The first-turn task did not finish (or start) within the allotted time.")
            return None
        # 1d. Check whether the agent asked for more input
        # (the current agent will likely just complete or fail instead)
        if task1_result.status.state == TaskState.INPUT_REQUIRED and task1_result.status.message:
            print("The agent asked for more information:")
            for part in task1_result.status.message.parts:
                if isinstance(part, TextPart):
                    print(f"  Agent: {part.text}")

            # --- Second turn ---
            query2 = "Japanese yen"  # supply the target currency
            task_id_2 = "test_multi_2_" + uuid4().hex
            print(f"\nSecond turn (Session: {session_id}): sending '{query2}'")
            # 2a. Build the Message and payload
            message2 = Message(role="user", parts=[TextPart(text=query2)])
            payload_dict2 = {
                "id": task_id_2,
                "sessionId": session_id,  # must reuse the same session ID
                "message": message2.model_dump(),
                "acceptedOutputModes": ["text"],
                "metadata": {"skill_name": "react_query"}
            }
            logger.debug(f"Sending multi-turn task 2 with payload: {payload_dict2}")
            # 2b. Send the task
            response2: SendTaskResponse = await client.send_task(payload=payload_dict2)
            logger.debug(f"Send task 2 response: {response2}")
            if response2.error:
                error: JSONRPCError = response2.error
                print(f"Error sending the second-turn task: Code={error.code}, Message={error.message}")
                return None
            if response2.result:
                task_id_2 = response2.result.id
            print(f"Second-turn task sent, ID: {task_id_2}")
            # 2c. Poll for the final result
            print("Waiting for the second-turn task to complete...")
            task2_result: Optional[Task] = None
            for attempt in range(10):
                await asyncio.sleep(2)
                get_payload2 = {"id": task_id_2}
                get_response2: GetTaskResponse = await client.get_task(payload=get_payload2)
                if get_response2.result:
                    task2_result = get_response2.result
                    print(f"  Current task state: {task2_result.status.state.value}")
                    if task2_result.status.state != TaskState.WORKING:
                        break
            else:
                print("The second-turn task did not finish within the allotted time.")
                return None
            # 2d. Handle the final result
            if task2_result.status.state == TaskState.COMPLETED and task2_result.artifacts:
                print("Multi-turn task completed successfully. Final results:")
                for artifact in task2_result.artifacts:
                    if artifact.parts:
                        for part in artifact.parts:
                            if isinstance(part, TextPart):
                                print(f"  - {part.text}")
            else:
                print(f"Final state of the second-turn task: {task2_result.status.state.value}")
            return task2_result
        elif task1_result.status.state == TaskState.COMPLETED:
            print("The agent completed the task in the first turn (it may have used a default currency or reported that it cannot answer):")
            if task1_result.artifacts:
                for artifact in task1_result.artifacts:
                    if artifact.parts:
                        for part in artifact.parts:
                            if isinstance(part, TextPart):
                                print(f"  - {part.text}")
            return task1_result
        else:
            print(f"The first-turn task did not request input; final state: {task1_result.status.state.value}")
            return task1_result
    except Exception as e:
        logger.error(f"Exception during the multi-turn conversation: {e}", exc_info=True)
        print(f"Multi-turn conversation test failed: {e}")
        return None


# Scenario 3: streaming response (corrected)
async def test_streaming_response(client: A2AClient):
    print("\n=== Scenario 3: streaming response (the agent side is mocked) ===")
    # query = "What are the current exchange rates between USD, EUR, and JPY?"
    query = "Write a short poem about spring in Chinese"  # a query better suited to streaming
    task_id = "test_stream_" + uuid4().hex
    try:
        # 1. Build the Message and payload
        message = Message(role="user", parts=[TextPart(text=query)])
        payload_dict = {
            "id": task_id,
            "sessionId": "test_session_stream_1",
            "message": message.model_dump(),
            "acceptedOutputModes": ["text"],
            "metadata": {"skill_name": "react_query"}
        }
        logger.debug(f"Sending streaming task with payload: {payload_dict}")
        print(f"Task sent, ID: {task_id}")
        # 2. Call send_task_streaming (no await) and iterate with async for
        event_stream_generator = client.send_task_streaming(payload=payload_dict)
        print("Receiving streaming responses:")
        async for event_response in event_stream_generator:
            logger.debug(f"Received stream event: {event_response}")
            if event_response.error:
                error: JSONRPCError = event_response.error
                print(f"Error during streaming: Code={error.code}, Message={error.message}")
                continue
            event = event_response.result
            if not event:
                logger.warning("Received stream response with empty result.")
                continue
            # Handle status-update events
            if hasattr(event, "status") and event.status and event.status.message:
                if event.status.message.parts:
                    for part in event.status.message.parts:
                        if isinstance(part, TextPart):
                            print(f"  Streaming update: {part.text}")
            # Handle artifact events
            if hasattr(event, "artifact") and event.artifact:
                # print("  Received artifact:")  # printing this repeatedly is noisy, so it stays commented out
                if event.artifact.parts:
                    for part in event.artifact.parts:
                        if isinstance(part, TextPart):
                            print(f"  Streaming result: {part.text}")
            # Check the end-of-stream flag
            if hasattr(event, "final") and event.final:
                print("End-of-stream flag received.")
        print("Streaming task handled.")
        return True
    except Exception as e:
        logger.error(f"Exception while handling the streaming task: {e}", exc_info=True)
        print(f"Sending the streaming task failed: {e}")
        return False


# Entry point (corrected)
async def main():
    print("=== LangGraph Agent A2A protocol tests ===\n")
    # This script exercises three interaction scenarios against the LangGraph agent:
    # 1. synchronous request -- agent invocation (calculator)
    # 2. multi-turn conversation -- incomplete information (the agent may not support it)
    # 3. streaming response -- live status updates (mocked on the agent side)

    # Create the A2A client
    client = A2AClient(url="http://127.0.0.1:8000")
    # (The get_agent_info call was removed; to verify the server is online, just send a simple task.)
    print("Trying to reach the server and run the tests...")
    print("-" * 30)
    # Run the scenarios
    await test_sync_currency_conversion(client)
    print("-" * 30)
    # Note: the multi-turn test depends on the agent's conversation-state handling
    await test_multi_turn_conversation(client)
    print("-" * 30)
    await test_streaming_response(client)
    print("-" * 30)
    print("All test scenarios finished.")


# Run the tests
if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: examples/16_google_a2a/currency_agent_test_README.md
================================================
# LangGraph Agent A2A Protocol Interaction Tests

## Overview

This test script (`examples/a2a/currency_agent_test.py`) demonstrates, through concrete interaction scenarios, how to use the A2A client to talk to the LangGraph agent service started earlier via `langgraph_integration.py`. It covers a synchronous request (involving a tool call), an attempted multi-turn conversation, and receiving a (simulated) streaming response.

## Test Scenarios

The script contains three main scenarios:

1. **Scenario 1: synchronous request -- agent invocation (with a tool)**
   * **Goal:** send a request that the agent can only fulfil by calling an internal tool (the calculator in this example).
   * **Flow:** the client sends a calculation task -> the server-side agent (LangGraph ReAct) parses it -> calls the `calculator` tool -> gets the result -> the LLM composes the answer -> the server returns the final result -> the client polls for it and prints it.
   * **Expected:** the client receives the agent's correct computed result.

2. **Scenario 2: multi-turn conversation attempt (limited by the current agent)**
   * **Goal:** exercise the client-side request pattern for multi-step interactions (using `sessionId`) and observe how the current agent responds.
   * **Flow:**
     * First turn: the client sends an underspecified query (e.g. "How much is 100 US dollars?" with no target currency) together with a `sessionId`.
     * The client polls for the result.
     * **Note:** *with the current agent implementation (`CurrencyAgent` built on `create_react_agent`, whose `invoke` does not handle conversation history specially), the agent will most likely not return an `input-required` state asking for more information; instead it will either attempt an answer or say it cannot, and mark the task `completed` or `failed`.*
     * (In the ideal flow, if the agent returned `input-required`, the client would send a second request with the missing information under the same `sessionId`.)
   * **Expected:** the client correctly sends requests with a `sessionId` and handles the agent's final response, even if the agent does not enter a multi-turn clarification state. This scenario mainly validates the client's multi-turn request mechanics and documents the agent's current behavior.

3. **Scenario 3: streaming response (mocked on the agent side)**
   * **Goal:** test the client's ability to consume A2A streaming responses (Server-Sent Events).
   * **Flow:** the client sends a query suited to streaming -> the server-side `AgentTaskManager` calls `CurrencyAgent.stream` -> **note:** *`CurrencyAgent.stream` is currently a mock that emits canned text chunks rather than calling LangGraph's streaming interface* -> the client receives and prints the simulated stream events.
   * **Expected:** the client connects to the SSE endpoint and receives and prints the (simulated) streaming events. The payload shape every scenario sends is shown below.
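All three scenarios build the same payload shape; here is a representative example (a sketch mirroring the script's `payload_dict`, with an illustrative task ID):

```python
from uuid import uuid4
from core.a2a.types import Message, TextPart

task_id = "test_sync_" + uuid4().hex
message = Message(role="user", parts=[TextPart(text="Compute 58 * 34")])
payload_dict = {
    "id": task_id,                        # client-generated task ID
    "sessionId": "test_session_sync_1",   # groups the turns of one conversation
    "message": message.model_dump(),
    "acceptedOutputModes": ["text"],
    "metadata": {"skill_name": "react_query"},  # must match the AgentCard skill
}
```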
## Running the Tests

### Prerequisites

* Python (3.10 or later recommended)
* All required Python dependencies installed per the project's `requirements.txt`.
* A valid `OPENAI_API_KEY` (or the API key for whichever LLM you use) configured in the `.env` file at the project root.

### Steps

1. **Start the A2A server:**
   * Make sure you are in the project root.
   * In a terminal, run (if it is not already running):
     ```bash
     python -m examples.a2a.langgraph_integration
     ```
   * The server should start and listen on `http://127.0.0.1:8000`.

2. **Run this test script:**
   * Open **another** terminal.
   * Make sure you are in the project root with the same virtual environment activated.
   * Run the test script:
     ```bash
     python -m examples.a2a.currency_agent_test
     ```

## Sample Test Output (from actual runs)

The output below shows the expected format, reflecting the agent's current actual behavior:

### Synchronous request (calculator call)

```
=== Scenario 1: synchronous request -- agent invocation (calculator) ===
Task sent, ID: test_sync_...
Waiting for the task to complete...
  Current task state: completed
Task completed successfully. Results:
  - 58 * 34 is 1972.
```

### Multi-turn conversation (agent finishes in the first turn)

```
=== Scenario 2: multi-turn conversation (the agent may not support it) ===
Note: the current server-side agent implementation may not support true multi-turn state.

First turn (Session: test_session_multi_...): sending 'How much is 100 US dollars?'
First-turn task sent, ID: test_multi_1_...
Waiting for the first-turn response...
  Current task state: completed
The agent completed the task in the first turn (it may have used a default currency or reported that it cannot answer):
  - I cannot currently tell you exactly what 100 US dollars is worth. Please consult up-to-date exchange rates or a currency conversion tool for an accurate result.
```

*(The agent's exact wording may vary between LLM calls.)*

### Streaming response (mocked on the agent side)

```
=== Scenario 3: streaming response (the agent side is mocked) ===
Task sent, ID: test_stream_...
Receiving streaming responses:
  Streaming update: Processing your request...
  Streaming result: Here is the information about 'Write a short poem about spring in Chinese': this is a simulated response, because real streaming is not implemented.
End-of-stream flag received.
Streaming task handled.
```

## Notes

* Make sure the environment variables in `.env` are set before running the tests.
* The script connects to `http://127.0.0.1:8000` by default. If your server uses a different address or port, change the `A2AClient` URL in the script.
* If the connection fails or a test errors out, first check that the A2A server is up and running, and inspect the server-side logs.

---

## Naming and Differences Between the Two Client Examples

The project ships two client example files, each with a different focus:

1. **`examples/a2a/client_example.py` -> "Basic Client Example"**
   * **Purpose:** a **basic demonstration** of the core `A2AClient` methods (`send_task`, `get_task`, `send_task_streaming`) in their simplest usage.
   * **Characteristics:** short, straightforward code whose main goal is to show how to issue the different kinds of A2A requests and handle the simplest successful responses. Includes a simple polling loop.

2. **`examples/a2a/currency_agent_test.py` -> "Scenario-based Test Client"**
   * **Purpose:** **functional testing and scenario demonstration**. It defines concrete interaction scenarios against the integrated LangGraph agent (synchronous tool call, attempted multi-turn dialogue, streaming consumption) to validate the end-to-end flow and observe the agent's behavior in specific situations.
   * **Characteristics:** clearly split into per-scenario test functions with more concrete queries (some mocked, or exposing the agent's limitations); output is organized per scenario. It also polls, and exercises multi-turn state passing via `sessionId`.

**Summary of the differences:**

| Aspect         | `client_example.py` (basic example)     | `currency_agent_test.py` (scenario-based tests)                  |
| :------------- | :-------------------------------------- | :---------------------------------------------------------------- |
| **Goal**       | Demonstrate basic client API usage      | Test/demonstrate specific interaction scenarios                    |
| **Structure**  | Simple sequential calls                 | Functions split by test scenario                                   |
| **Complexity** | Low; core API calls                     | Somewhat higher; scenario logic (e.g. the multi-turn attempt)      |
| **Queries**    | Generic examples (calculation, search)  | Scenario-specific (calculation, underspecified query, streaming-friendly query) |
| **Focus**      | How to call the API                     | Agent behavior per scenario and end-to-end validation              |


================================================
FILE: examples/16_google_a2a/langgraph_integration.py
================================================
# examples/a2a/langgraph_integration.py
import os
import sys
import asyncio  # still potentially used by dependencies, so keep the import
import logging
# Make sure List, Tuple, Optional, TypedDict are imported
from typing import Dict, Any, List, Optional, AsyncIterable, Union, TypedDict, Tuple

# Add the project root to sys.path
sys.path.append(os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))

# Load environment variables
from dotenv import load_dotenv
load_dotenv()

# A2A components (imported from this project's structure)
from core.a2a.types import (
    AgentCard, AgentCapabilities, AgentSkill,
    Task, TaskState, TaskStatus,
    Artifact, Message, TextPart,  # TextPart may no longer be used directly
    JSONRPCResponse, InvalidParamsError, InternalError,
    SendTaskRequest, SendTaskResponse, TaskSendParams
)
from core.a2a.server.server import A2AServer
from core.a2a.agent_task_manager import AgentTaskManager

# LangChain / LLM components
from langchain_openai import ChatOpenAI
from langchain_core.tools import tool
# StateGraph and END are no longer used directly, but keep the import
from langgraph.graph import END, StateGraph
from langgraph.prebuilt import create_react_agent

# Configure logging (switch to DEBUG for more detail)
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)
# --- Tool definitions (unchanged) ---
@tool
def search(query: str) -> str:
    """Search the internet for information."""
    # A real implementation would call an actual search engine API
    logger.info(f"Tool 'search' called with query: {query}")
    return f"These are mocked search results for '{query}'."


@tool
def calculator(expression: str) -> str:
    """Evaluate a math expression."""
    logger.info(f"Tool 'calculator' called with expression: {expression}")
    try:
        # Note: using eval in production is very dangerous; this is for demonstration only.
        # Restrict eval so that only simple math is possible.
        allowed_names = {
            k: v for k, v in __import__("math").__dict__.items() if not k.startswith("_")
        }
        allowed_names.update({"abs": abs, "int": int, "float": float})  # common helpers
        code = compile(expression, "<string>", "eval")
        for name in code.co_names:
            if name not in allowed_names:
                raise NameError(f"Use of name '{name}' not allowed")
        result = eval(code, {"__builtins__": {}}, allowed_names)
        return f"Result: {result}"
    except NameError as e:
        logger.error(f"Calculation error (NameError): {e} in expression '{expression}'")
        return f"Calculation error: name not allowed ({e})"
    except Exception as e:
        logger.error(f"Calculation error: {e} in expression '{expression}'")
        return f"Calculation error: {e}"
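# Illustrative sanity checks (an assumption about usage, not part of the original script;
# LangChain tools created with @tool accept a dict input via .invoke):
#   calculator.invoke({"expression": "sqrt(16) + 2"})      # -> "Result: 6.0" (math names allowed)
#   calculator.invoke({"expression": "__import__('os')"})  # -> rejected, name not in allowed_names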
        logger.warning("[CurrencyAgent.stream] Stream method is currently mocked.")
        # --- 模拟实现 ---
        yield {
            "content": "正在处理您的请求...",
            "is_task_complete": False,
            "require_user_input": False
        }
        await asyncio.sleep(0.5)
        final_simulated_answer = f"关于 '{query}' 的信息如下:这是一个模拟的回应,因为真实流未实现。"
        yield {
            "content": final_simulated_answer,
            "is_task_complete": True,
            "require_user_input": False
        }
        # --- 模拟结束 ---

# --- A2A 服务器设置 (修正函数定义和 AgentCard) ---
# 将函数改为同步定义 (def 而不是 async def)
def setup_a2a_server():
    """设置并返回 A2A 服务器实例 (同步函数)"""
    print("\n=== 配置 LangGraph A2A 服务器 ===\n")

    # 创建LLM
    try:
        llm = ChatOpenAI(model="gpt-4o-mini")
        logger.info("Using OpenAI LLM: gpt-4o-mini")
    except Exception as e:
        print(f"警告: 无法创建OpenAI LLM ({e}),将使用模拟模式")
        from langchain.llms.fake import FakeListLLM
        llm = FakeListLLM(responses=["这是一个模拟的LLM响应"])
        logger.info("Using FakeListLLM (simulation mode)")

    # 创建 Agent 实例
    agent = CurrencyAgent(llm)

    # 创建 Agent 卡片 (添加缺失字段)
    agent_card = AgentCard(
        name="LangGraph ReAct Agent",
        description="一个使用LangGraph ReAct处理查询并调用工具的Agent",
        url="http://127.0.0.1:8000/agent",  # Agent 的访问 URL (示例)
        version="0.1.0",  # Agent 的版本号
        capabilities=AgentCapabilities(  # 设置 Agent 的能力
            streaming=False,  # 当前 stream 是模拟的,设为 False
            pushNotifications=False  # 假设不支持推送
        ),
        skills=[  # skills 列表在 AgentCard 顶层
            AgentSkill(
                id="react_query_skill",  # 技能的唯一 ID
                name="react_query",
                description="处理自然语言查询,可使用搜索和计算器工具",
                inputModes=["text"],
                outputModes=["text"]
            )
        ]
        # 其他可选字段可以按需添加
    )

    # 创建 AgentTaskManager
    task_manager = AgentTaskManager(agent)

    # 创建A2A服务器实例 (不在此处设置 host/port)
    server = A2AServer(agent_card=agent_card, task_manager=task_manager)
    print("A2A服务器实例已创建。")
    return server  # 返回实例

# --- 主函数入口 (修正启动逻辑) ---
if __name__ == "__main__":
    try:
        # 调用同步函数来设置服务器
        server_instance = setup_a2a_server()

        # 定义 HOST 和 PORT
        HOST = "127.0.0.1"
        PORT = 8000
        print(f"准备启动A2A服务器,监听地址 http://{HOST}:{PORT}")

        # 在调用 start 前设置 host 和 port
        # (或者修改 A2AServer 的 __init__ 让其接受 host/port)
        server_instance.host = HOST
        server_instance.port = PORT

        # 启动服务器 (调用同步的 start 方法)
        server_instance.start()
    except KeyboardInterrupt:
        print("\n服务器已手动停止。")
    except Exception as e:
        # 捕获设置或启动过程中的其他异常
        logger.error(f"启动服务器时发生未处理的异常: {e}", exc_info=True)



================================================
FILE: examples/TODO_computer_tool_demo.py
================================================
from typing import Annotated

from langchain_core.messages import HumanMessage
from langchain_openai import ChatOpenAI
# StateGraph/END/START 来自 langgraph.graph (而非 langchain_core.runnables.graph)
from langgraph.graph import END, START, StateGraph
# Command 位于 langgraph.types,InjectedState 位于 langgraph.prebuilt
from langgraph.prebuilt import InjectedState, ToolNode
from langgraph.types import Command

# Import our custom computer tool
# TODO: MarinaBox - Import our custom computer tool
from marinabox import mb_start_computer, mb_stop_computer, mb_use_computer_tool

# Set up model with tools
model = ChatOpenAI(model="gpt-3.5-turbo-0125", temperature=0)
# 假设 mb_use_computer_tool 为返回工具实例的工厂;若其本身就是工具,请直接传入 mb_use_computer_tool
tools = [mb_use_computer_tool()]
model_with_tools = model.bind_tools(tools)

# Define workflow nodes
def should_continue(state: Annotated[dict, InjectedState()]):
    messages = state["messages"]
    if len(messages) > 0:
        last_message = messages[-1]
        if last_message.tool_calls:
            return Command(goto="tool_node")
        else:
            return Command(goto="stop_computer")
    return Command(goto="stop_computer")

def call_model(state: Annotated[dict, InjectedState()]):
    input_message = input("Enter your message: ")
    if input_message != "stop_computer":
        messages = [HumanMessage(content=input_message)]
        response = model_with_tools.invoke(messages)
        return {"messages": [response], "session_id": state.get("session_id")}
    else:
        return {"messages": [], "session_id": state.get("session_id")}

# Set up workflow
workflow = StateGraph(dict)
workflow.add_node("start_computer", mb_start_computer)
workflow.add_node("agent", call_model)
workflow.add_node("tool_node", ToolNode(tools=tools))
workflow.add_node("stop_computer", mb_stop_computer)
workflow.add_node("should_continue", should_continue)

# Define workflow edges
workflow.add_edge(START, "start_computer")
workflow.add_edge("start_computer", "agent")
workflow.add_edge("tool_node", "agent")
workflow.add_edge("agent", "should_continue")
workflow.add_edge("stop_computer", END)

# Compile and run workflow
app = workflow.compile()

if __name__ == "__main__":
    # messages 应为消息列表而非字符串
    app.invoke({"messages": []})



================================================
FILE: examples/__init__.py
================================================



================================================
FILE: examples/state_based_supervisor_examples/01_simple.py
================================================
import asyncio
import json
import os
import re
import time
from datetime import datetime
from typing import Literal, List, Dict, Any, Optional, cast

# --- LangChain / LangGraph ---
try:
    # 使用 langchain_openai (或你选择的模型提供商)
    from langchain_openai import ChatOpenAI
except ImportError:
    ChatOpenAI = None
    print("Warning: langchain_openai not installed.")

# 核心消息类型
from langchain_core.messages import HumanMessage, AIMessage, BaseMessage, ToolMessage
# LangChain 工具相关
from langchain_core.tools import tool, BaseTool

# --- OpenAI 错误处理 ---
try:
    from openai import RateLimitError
except ImportError:
    class RateLimitError(Exception):
        pass

# --- 内部模块导入 (请确保路径正确) ---
try:
    # 假设这些是你当前的路径
    from core.agents.sb_supervisor_agent import SupervisorAgent
    # state_schema 位于 state_based_supervisor 包下 (见项目目录结构)
    from core.agents.state_based_supervisor.state_schema import PlanningAgentState
    from core.agents.base.react_agent import ReactAgent  # 导入 ReactAgent
    # 导入 StreamUpdate (如果需要在最终状态中检查它,但这里主要关注消息)
    # from core.agents.supervisor.schemas import StreamUpdate
except ImportError as e:
    print(f"Error importing agent components: {e}")
    print("Please ensure paths like 'core.agents.sb_supervisor_agent' are correct.")

import traceback

# --- 定义 Web Search 工具 ---
# 使用 @tool 装饰器明确这是一个工具
@tool
def web_search(query: str) -> str:
    """Search the web for current information about a given query. Use this for recent events, data, or facts."""
    print(f"--- TOOL CALLED: web_search(query='{query}') ---")  # 添加日志确认工具被调用
    # Mocked data - 实际使用时会调用 Tavily 或其他搜索引擎
    if "apple" in query.lower() and "headcount" in query.lower() and "2024" in query:
        return (
            "According to recent (mocked) reports for 2024, Apple's headcount is approximately 164,000 employees globally."
        )
    elif "joke" in query.lower():
        # 这个工具不适合讲笑话
        return "I am a web search tool, I cannot tell jokes."
    else:
        return f"Mock search results for query: '{query}'. Found relevant information on various websites."
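# (补充示例,假设性草图) @tool 装饰后的 web_search 是一个标准的 LangChain 工具对象,
# 接入 Supervisor 之前可以先单独调用做冒烟测试,确认输入/输出格式,例如:
#
#   print(web_search.invoke({"query": "apple headcount 2024"}))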
# --- 主执行逻辑 --- async def main(): # --- 初始化 LLM (确保 API Key 在环境中) --- try: model_name = os.getenv("LLM_MODEL_NAME", "gpt-4o") print(f"Using LLM: {model_name}") if not ChatOpenAI: raise ImportError("ChatOpenAI not available.") # 使用温度稍高的模型可能有助于 ReAct 思考和调用工具 model = ChatOpenAI(model=model_name, temperature=0.2) except Exception as e: print(f"Failed to initialize ChatOpenAI model: {e}") return # --- 实例化 Agents --- try: # research_agent 现在有了一个明确定义的 web_search 工具 research_agent = ReactAgent( name="research_expert", tools=[web_search], # <--- 传入工具列表 model=model, # 添加明确的 Prompt 引导工具使用 prompt=( "You are a research expert. Use available tools to find information. " "You have access to 'web_search'. Use it for questions about current data, facts, or events." ), max_context_tokens=8000 ) all_agents = [research_agent] # --- 实例化 Supervisor --- supervisor = SupervisorAgent( agents=all_agents, model=model, # Supervisor 使用相同的模型 state_schema=PlanningAgentState, include_agent_name="inline" # checkpointer=... ) except Exception as e: print(f"Failed to initialize agents or supervisor: {e}") traceback.print_exc() return # --- 准备初始请求 --- # 用户请求包含两个意图:讲笑话 + 查信息 user_request = ( "Hi! I'd like to start with a short joke to lighten the mood, " "then please check Apple's headcount in 2024. Summarize both." ) print(f"Initial Request: '{user_request}'") # --- 准备初始状态 --- initial_graph_state: PlanningAgentState = { "messages": [HumanMessage(content=user_request)], # 使用 HumanMessage "plan": None, "error": None } # --- 执行 Supervisor (使用 ainvoke) --- final_state: Optional[Dict[str, Any]] = None error_occurred: Optional[Exception] = None config = {"recursion_limit": 100} try: print("\n--- Invoking Supervisor Agent (ainvoke) ---") final_state = await supervisor.ainvoke(initial_graph_state, config=config) print("\n--- Supervisor Agent Invocation Complete ---") # --- 错误处理 --- except RateLimitError as e: error_occurred = e; print(f"\n!!! OpenAI Quota Error: {e}") except Exception as e: error_occurred = e; print(f"\n!!! 
Error during graph execution: {e}"); traceback.print_exc() # --- 处理并打印最终结果 --- if error_occurred: print("\n--- Graph Execution INTERRUPTED or FAILED ---") else: print("\n--- Graph Execution Finished ---") if not final_state: print("Error: No final state available.") return print("\n--- FINAL STATE ---") # 打印错误(如果在状态中记录了) if final_state.get("error"): print(f"\nERROR RECORDED IN STATE: {final_state['error']}") # 打印计划 final_plan = final_state.get('plan') if final_plan: print("\nFinal Plan State:", json.dumps(final_plan, indent=2, default=str)) else: print("\nFinal Plan State: Not available.") # 打印消息历史 final_messages = final_state.get("messages", []) if final_messages: print("\nFinal Message History (Last 10):") for m in final_messages[-10:]: try: if hasattr(m, 'pretty_print'): m.pretty_print() else: print(json.dumps(m, indent=2, default=str)) print("-" * 10) except Exception as print_err: print(f"Error printing final message: {print_err}") else: print("\nFinal Message History: Empty.") print("\n--- END OF TEST ---") if __name__ == "__main__": try: asyncio.run(main()) except KeyboardInterrupt: print("\nExecution interrupted by user.") except Exception as e: print(f"\nAn unexpected top-level error occurred: {e}") traceback.print_exc() ================================================ FILE: examples/state_based_supervisor_examples/02_tavily.py ================================================ # main.py (用于测试 State-Based Supervisor 和 ReactAgent) import asyncio import json import os from typing import Dict, Any, Optional from langchain_community.tools import TavilySearchResults # --- LangChain / LangGraph --- # 假设模型直接在此初始化或从别处导入 from dotenv import load_dotenv load_dotenv() # 自动加载 .env 文件 try: from langchain_openai import ChatOpenAI # 或者你使用的其他模型 except ImportError: ChatOpenAI = None print("Warning: langchain_openai not installed.") # 核心消息类型 from langchain_core.messages import HumanMessage, AIMessage, BaseMessage, ToolMessage # --- OpenAI 错误处理 --- try: from openai import RateLimitError except ImportError: class RateLimitError(Exception): pass # --- 内部模块导入 (请确保路径正确) --- try: # 从你提供的 core.agents... 
路径导入 from core.agents.sb_supervisor_agent import SupervisorAgent # 你的 Supervisor 实现 from core.agents.state_based_supervisor.state_schema import PlanningAgentState # 包含 Plan 的状态 from core.agents.base.react_agent import ReactAgent # 你的 ReactAgent 实现 from core.llm.llm_manager import LLMManager # LLM 管理器 # (如果你的子 Agent 有更具体的类,在这里导入它们) # 例如: # from core.agents.researcher import ResearchAgent # from core.agents.coder import CoderAgent # --- 如果没有具体子 Agent 类,使用 ReactAgent 作为示例 --- # (确保 ReactAgent 可以被直接实例化用于测试) if not issubclass(ReactAgent, object): # 简单检查 ReactAgent 是否有效 raise ImportError("ReactAgent class not found or invalid.") except ImportError as e: print(f"Error importing agent components: {e}") print("Please ensure paths like 'core.agents.sb_supervisor_agent' are correct relative to your execution path.") import traceback # --- 主执行函数 (简化版,只关注最终结果) --- async def run_supervisor_test(supervisor_agent: SupervisorAgent, initial_state: Dict[str, Any]): """Executes the supervisor graph using ainvoke and prints the final state.""" print("--- Starting Supervisor Graph Test ---") # 获取初始消息列表,检查是否为空 messages_list = initial_state.get("messages", []) initial_query = "N/A" # 默认值 if messages_list: first_message = messages_list[0] # 检查第一个消息是否有 content 属性 (更健壮) if hasattr(first_message, 'content'): initial_query = first_message.content else: # 如果第一个元素不是预期的消息对象,记录一下 print(f"Warning: First item in initial messages is not a standard message object: {type(first_message)}") initial_query = str(first_message) # 尝试转换为字符串 print(f"Initial Query: '{initial_query}'") print("-" * 30) config = {"recursion_limit": 100} # 使用较高的递归限制 final_state: Optional[Dict[str, Any]] = None error_occurred: Optional[Exception] = None try: print("--- Invoking Supervisor Agent (ainvoke) ---") # 直接调用 ainvoke 获取最终状态 final_state = await supervisor_agent.ainvoke(initial_state, config=config) print("--- Supervisor Agent Invocation Complete ---") # --- 错误处理 --- except RateLimitError as e: error_occurred = e print("\n" + "="*40 + "\n!!! OpenAI API Error: Insufficient Quota !!!\n" + "="*40) print("Execution stopped. Check OpenAI plan/billing.") print(f"Original error: {e}") except TypeError as e: error_occurred = e print("\n" + "="*40 + "\n!!! TypeError During Graph Execution !!!\n" + "="*40) print(f"Error details: {e}") if "synchronous function provided" in str(e): print("Hint: Ensure all graph nodes support async or run the graph synchronously if needed.") traceback.print_exc() except Exception as e: error_occurred = e print("\n" + "="*40 + "\n!!! 
An Unexpected Error Occurred !!!\n" + "="*40) print(f"Error type: {type(e).__name__}\nError details: {e}") traceback.print_exc() # --- Process Final State --- if error_occurred: print("\n--- Graph Execution INTERRUPTED or FAILED ---") else: print("\n--- Graph Execution Finished ---") if not final_state: # 如果 ainvoke 返回 None 或在出错前未赋值 (理论上 ainvoke 会抛错或返回字典) print("Error: No final state available (Execution might have failed early).") # 尝试从 supervisor agent 获取最后状态 (如果 checkpointer 可用且实现了 get_state) if hasattr(supervisor_agent, 'checkpointer') and supervisor_agent.checkpointer and hasattr(supervisor_agent.checkpointer, 'get'): try: # 需要知道配置中的 thread_id (这里假设是 'test_thread') last_checkpoint = supervisor_agent.checkpointer.get({"configurable": {"thread_id": "test_thread"}}) if last_checkpoint: print("Attempting to display last known checkpoint state:") final_state = last_checkpoint.get('channel_values', {}) else: print("Could not retrieve last checkpoint state.") except Exception as cp_err: print(f"Error retrieving checkpoint state: {cp_err}") # 即使出错,也尝试打印 final_state (可能是包含错误信息的状态) if final_state and isinstance(final_state, dict): print("\n--- FINAL STATE ---") # 1. 打印错误信息 (如果存在) if final_state.get("error"): print(f"\nERROR RECORDED IN STATE: {final_state['error']}") # 2. 打印最终消息历史 (尝试 pretty_print) final_messages = final_state.get("messages", []) if final_messages and isinstance(final_messages, list): print("\nFinal Message History (Last ~10):") for m in final_messages[-10:]: # 只打印最后一部分 try: if hasattr(m, 'pretty_print'): m.pretty_print() else: # Fallback for dict or other types print(json.dumps(m, indent=2, default=str)) print("-" * 10) except Exception as print_err: print(f"Error printing final message: {print_err}") else: print("\nFinal Message History: Not available or empty.") # 3. 打印最终计划状态 final_plan = final_state.get('plan') if final_plan and isinstance(final_plan, dict): print("\nFinal Plan State:") print(json.dumps(final_plan, indent=2, default=str)) else: print("\nFinal Plan State: Not available or not generated.") else: print("\n--- No Final State Could Be Displayed ---") print("\n--- END OF TEST ---") return final_state # --- Main Execution Block --- async def main(): # --- 1. 初始化 LLM 管理器 (它会自动注册配置好的模型) --- try: model_manager = LLMManager() # 可以选择打印一下注册了哪些模型 print("Registered Models:", json.dumps(model_manager.list_models(), indent=2)) print("Capability Mapping:", model_manager.list_capabilities()) except Exception as e: print(f"Failed to initialize LLMManager: {e}") return # --- 2. 实例化 Agents (使用 ModelManager 获取模型) --- try: # 获取默认模型用于基础任务 grok = model_manager.get_model("xai_grok") # 获取 ID 由 config 或第一个注册的决定 deepseek_v3 = model_manager.get_model("deepseek_v3") # 获取 DeepSeek 模型 # 创建Tavily搜索工具 tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=False, include_images=False, search_depth="advanced" ) # 确保 ReactAgent 使用与 Supervisor 兼容的状态 (例如 BasicAgentState) # 或者 Supervisor 能够处理不同类型的子 Agent 状态返回 researcher_system_prompt = """You are a research expert. Use available tools to find the most up-to-date information to answer the user's query. 
You have access to a 'tavily_search_results_json' tool.""" research_agent = ReactAgent( name="research_expert", tools=[tavily_search], description="Research expert with access to Tavily search.", model=deepseek_v3, prompt=researcher_system_prompt, ) all_agents = [research_agent] # 只包含一个子 Agent 用于测试 # --- 实例化 Supervisor (使用 PlanningAgentState) --- supervisor = SupervisorAgent( agents=all_agents, model=deepseek_v3, # Supervisor 使用的 LLM state_schema=PlanningAgentState, # 明确 Supervisor 使用 Planning 状态 # enable_planning=True, # 不再需要此参数,因为 state_schema 暗示了规划 include_agent_name="inline" # 推荐 # checkpointer=... # 添加 Checkpointer 以测试持久化 ) except Exception as e: print(f"Failed to initialize agents or supervisor: {e}") import traceback traceback.print_exc() return # --- 获取用户输入 --- topic = input("Please enter the initial request for the supervisor: ") if not topic: print("No request entered. Exiting.") return # --- 准备初始状态 (使用 PlanningAgentState) --- initial_graph_state: PlanningAgentState = { "messages": [HumanMessage(content=topic)], # 确保是 HumanMessage 对象 "plan": None, # 初始没有计划 "error": None } # --- 运行测试 --- await run_supervisor_test(supervisor, initial_graph_state) if __name__ == "__main__": try: asyncio.run(main()) except KeyboardInterrupt: print("\nExecution interrupted by user.") except Exception as e: print(f"\nAn unexpected top-level error occurred: {e}") traceback.print_exc() ================================================ FILE: examples/state_based_supervisor_examples/03_multi_agents.py ================================================ # main.py (Multi-Agent Test with State-Based Supervisor) import asyncio import json import os import re import time import traceback # 导入 traceback from datetime import datetime from typing import Dict, Any, Optional, List, Literal, cast # --- LangChain / LangGraph / OpenAI Imports --- from langchain_core.messages import HumanMessage, AIMessage, BaseMessage, ToolMessage # --- Agent 和工具导入 (确保路径正确) --- try: from core.agents.sb_supervisor_agent import SupervisorAgent # 替换为你的 SupervisorAgent 类路径 from core.agents.state_based_supervisor.state_schema import PlanningAgentState from core.agents.base.react_agent import ReactAgent # 导入 ReactAgent 基类 # 导入所有重构后的子 Agent 类 from core.agents.sub_agents.research_agent import ResearchAgent # 假设路径 from core.agents.sub_agents.coder_agent import CoderAgent # 假设路径 from core.agents.sub_agents.reporter_agent import ReporterAgent # 假设路径 from core.agents.sub_agents.designer_agent import DesignerAgent # 假设路径 from core.agents.sub_agents.data_analyst_agent import DataAnalystAgent # 假设路径 # 导入工具注册表函数和枚举 from core.tools.registry import get_tools_by_category, ToolCategory, register_tool # 导入 register_tool from core.llm.llm_manager import LLMManager # LLM 管理器 # 导入特定工具实例或类 (如果 Registry 没有预注册所有工具) from langchain_community.tools.tavily_search import TavilySearchResults # 示例 # from core.tools.e2b_tool import E2BCodeInterpreterTool # 示例 # from core.tools.replicate_flux_tool import ReplicateFluxImageTool # 示例 # --- 确保工具已注册 --- # 运行 registry 初始化 (通常在 core/tools/__init__.py 中完成) try: import core.tools # 尝试导入以触发 __init__.py 中的注册 print("Tool registry potentially initialized.") except ImportError: print("Warning: Could not import 'core.tools' to initialize registry.") except Exception as reg_err: print(f"Error during tool registry initialization: {reg_err}") # (可选) 在这里可以检查或手动注册缺失的核心工具 # Example: Check and register Tavily if not present if not any(getattr(t, 'name', '') == 'tavily_search_results_json' for t in get_tools_by_category(ToolCategory.SEARCH)): 
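        # (补充说明) any(...) 检查会遍历 SEARCH 分类下已注册的工具名称,
        # 仅当 Tavily 尚未注册时才进入下面的手动注册分支,避免重复注册。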
try: print("Attempting to register TavilySearchResults...") tavily_tool = TavilySearchResults(max_results=3) register_tool(tavily_tool, ToolCategory.SEARCH) except Exception as e: print(f"Warning: Failed to register TavilySearchResults manually: {e}") # ... 检查并注册其他必要的工具 ... except ImportError as e: print(f"Error importing agent/tool components: {e}") print("Please ensure all agent/tool class paths and registry setup are correct.") exit(1) # --- 助手函数 --- def slugify(text: str) -> str: """Converts text to a safe filename part.""" # ... (保持不变) ... if not text: return "no_topic" text = text.lower(); text = re.sub(r'\s+', '_', text) text = re.sub(r'[^\w\-]+', '', text); text = text.strip('_') return text[:100] if text else "sanitized_topic" # --- 主研究/测试函数 --- async def run_supervisor_test(supervisor_agent: SupervisorAgent, initial_state: Dict[str, Any]): """Executes the supervisor graph using ainvoke and prints the final state.""" print("\n--- Starting Supervisor Graph Execution ---") initial_query = initial_state.get("messages", [{}])[0].content if initial_state.get("messages") and hasattr(initial_state.get("messages")[0], 'content') else "N/A" print(f"Initial Query: '{initial_query}'") print("-" * 30) config = {"recursion_limit": 100} # 保持较高的递归限制 final_state: Optional[Dict[str, Any]] = None error_occurred: Optional[Exception] = None try: print("--- Invoking Supervisor Agent (ainvoke) ---") # 直接调用 ainvoke 获取最终状态 final_state = await supervisor_agent.ainvoke(initial_state, config=config) print("--- Supervisor Agent Invocation Complete ---") # --- 错误处理 --- except Exception as e: error_occurred = e; print(f"\n!!! Error during graph execution: {e}"); traceback.print_exc() # --- 处理最终状态 --- if error_occurred: print("\n--- Graph Execution INTERRUPTED or FAILED ---") else: print("\n--- Graph Execution Finished ---") if not final_state: print("Error: No final state available (Execution might have failed early).") # 尝试从 checkpointer 获取最后状态 (如果配置了) # ... (checkpoint retrieval logic - optional) ... 
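        # (补充示例,假设性草图) 可参照 02_tavily.py 中同名函数的做法,
        # 从 checkpointer 恢复最后一次检查点状态,例如:
        #
        #   if getattr(supervisor_agent, 'checkpointer', None):
        #       ckpt = supervisor_agent.checkpointer.get(
        #           {"configurable": {"thread_id": "test_thread"}})
        #       if ckpt:
        #           final_state = ckpt.get('channel_values', {})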
return None print("\n--- FINAL STATE ---") # 打印错误 (如果在状态中记录了) if final_state.get("error"): print(f"\nERROR RECORDED IN STATE: {final_state['error']}") # 打印计划 final_plan = final_state.get('plan') if final_plan and isinstance(final_plan, dict): print("\nFinal Plan State:") print(json.dumps(final_plan, indent=2, default=str)) else: print("\nFinal Plan State: Not available or not generated.") # 打印最终消息历史 final_messages = final_state.get("messages", []) if final_messages and isinstance(final_messages, list): print("\nFinal Message History (Last 10):") for m in final_messages[-10:]: try: if hasattr(m, 'pretty_print'): m.pretty_print() else: print(json.dumps(m, indent=2, default=str)) # Fallback print("-" * 10) except Exception as print_err: print(f"Error printing final message: {print_err}") else: print("\nFinal Message History: Empty.") # --- 保存最终报告 (如果 Reporter Agent 被调用且成功) --- # 检查最后一条消息是否来自 Reporter final_report_content = None if final_messages and isinstance(final_messages[-1], AIMessage) and final_messages[-1].name == "reporter_expert": final_report_content = final_messages[-1].content print("\n--- Final Report Found from Reporter Agent ---") if not error_occurred and final_report_content and isinstance(final_report_content, str) and "Failed" not in final_report_content: print("\n--- Saving Final Output to Markdown ---") try: markdown_content = final_report_content # 获取原始请求作为文件名基础 initial_query_text = final_state.get('messages', [{}])[0].content if final_state.get('messages') and hasattr(final_state.get('messages')[0], 'content') else 'unknown_request' topic_slug = slugify(initial_query_text) timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") filename = f"multi_agent_report_{topic_slug}_{timestamp}.md" script_dir = os.path.dirname(os.path.abspath(__file__)) output_dir = os.path.join(script_dir, "Output") os.makedirs(output_dir, exist_ok=True) filepath = os.path.join(output_dir, filename) with open(filepath, "w", encoding="utf-8") as f: f.write(markdown_content) print(f"Successfully saved output to: {filepath}") except Exception as e: print(f"Error saving output to Markdown: {e}") elif error_occurred: print("\nFinal Report: Not saved due to execution error.") else: print("\nFinal Report: Not generated or not found.") print("\n--- END OF TEST ---") return final_state # --- Main Execution Block --- async def main(): # --- 1. 初始化 LLM 管理器 --- try: model_manager = LLMManager() print("Registered Models:", json.dumps(model_manager.list_models(), indent=2)) except Exception as e: print(f"Failed to initialize LLMManager: {e}") return # --- 2. 实例化所有 Agents --- try: # 获取模型实例 # 确保 'deepseek_v3' 和 'gpt-4o' 是你 LLMManager 中有效的 ID deepseek_model = model_manager.get_model("deepseek_v3") gpt4o_model = model_manager.get_model("openai_gpt4o") # 多模态模型 # 实例化 ResearchAgent research_agent = ResearchAgent( model=deepseek_model, ) # 实例化 CoderAgent coder_agent = CoderAgent( model=deepseek_model, ) # 实例化 ReporterAgent reporter_agent = ReporterAgent( model=deepseek_model ) # 实例化 DesignerAgent designer_agent = DesignerAgent( model=gpt4o_model, ) # 实例化 DataAnalystAgent data_analyst_agent = DataAnalystAgent( model=deepseek_model, ) # --- 3. 组合 Agent 列表 --- all_agents = [ research_agent, coder_agent, reporter_agent, designer_agent, data_analyst_agent, ] # --- 4. 实例化 Supervisor --- supervisor = SupervisorAgent( agents=all_agents, model=deepseek_model, # Supervisor 自身使用的模型 # model = gpt4o_model, state_schema=PlanningAgentState, include_agent_name="inline" # checkpointer=... 
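            # (假设性示例) 如需持久化,可 from langgraph.checkpoint.memory import MemorySaver
            # 并传入 checkpointer=MemorySaver()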
            # 可选: 添加 Checkpointer 实现持久化
        )
    except Exception as e:
        print(f"Failed to initialize agents or supervisor: {e}")
        traceback.print_exc()
        return

    # --- 5. 获取用户输入 ---
    topic = input("Please enter the initial request for the supervisor: ")
    if not topic:
        print("No request entered. Using default topic.")
        topic = """我需要获取法国巴黎当前的实时气温。请按以下步骤操作:
1. 首先,帮我调研一个可以免费获取巴黎当前天气数据的 API (例如 Open-Meteo, WeatherAPI.com 或其他类似的),重点是找到获取当前气温的 API 端点(endpoint URL)以及如何构造请求(如果可能,选择不需要 API key 的)。
2. 然后,编写一个 Python 脚本,使用 'requests' 库来调用上一步找到的 API 端点,并从中提取出巴黎当前的温度(摄氏度)。
3. 使用你的代码执行工具来运行这个 Python 脚本。
4. 最后,告诉我你找到的当前巴黎温度是多少。"""

    # --- 6. 准备初始状态 ---
    initial_graph_state: PlanningAgentState = {
        "messages": [HumanMessage(content=topic)],
        "plan": None,
        "error": None
    }

    # --- 7. 运行测试 ---
    await run_supervisor_test(supervisor, initial_graph_state)

if __name__ == "__main__":
    try:
        asyncio.run(main())
    except KeyboardInterrupt:
        print("\nExecution interrupted by user.")
    except Exception as e:
        print(f"\nAn unexpected top-level error occurred: {e}")
        traceback.print_exc()



================================================
FILE: examples/web_agents/README.md
================================================
# Web Agents

这个目录包含可以通过web界面加载的代理示例。每个子目录代表一个独立的代理实现,可以被server.py动态加载。

## 目录结构

每个代理应遵循以下结构:

```
agent_name/
    __init__.py   # 包含get_graph()函数,返回编译好的LangGraph
    README.md     # 代理的说明文档
```

## 接口规范

每个代理必须实现以下接口:

```python
def get_graph():
    """返回编译好的LangGraph实例"""
    # 构建并返回图
    return compiled_graph
```



================================================
FILE: examples/web_agents/README_SPEC.md
================================================
# Web Agent 开发规范

## 1. 概述

本规范旨在统一Web Agent的开发流程和命名约定,确保前后端协同工作,避免出现前端组件无法正确显示后端数据的问题。本文档基于实际开发经验,特别强调前后端节点命名一致性的重要性。

## 2. 前后端交互核心机制

### 2.1 关键概念

- **节点名称匹配**: 前端渲染组件时,会根据后端节点的名称来选择对应的组件进行渲染
- **状态数据结构**: 后端节点生成的状态数据必须符合前端组件期望的结构
- **渲染函数**: 前端的`renderNode`函数是连接后端节点和前端组件的关键桥梁

### 2.2 渲染流程

1. 后端节点执行并生成状态数据
2. 前端通过`useLangGraphAgent`钩子接收节点数据
3. 前端的`renderNode`函数根据节点名称选择对应组件
4. 组件根据状态数据进行渲染

## 3. 节点命名规范

### 3.1 关键节点命名

所有Web Agent必须在图结构中包含处理消息的节点,这些节点名称必须与前端`renderNode`函数中的case语句匹配:

```python
# 后端节点命名 - 必须与前端renderNode函数中的case匹配
builder.add_node("agent", agent_function)  # 或其他在前端已注册的节点名称
```

**重要提示**: 前端`page.tsx`中的`renderNode`函数定义了可识别的节点名称。目前支持的节点名称有:

- `__start__`
- `agent` (替代了原来的`chatbot`)
- `weather`
- `reminder`
- `research`
- `search`
- `report`

如果后端使用了其他节点名称,必须在前端的`renderNode`函数中添加对应的case语句。

### 3.2 状态字段命名

- 状态字段名称应与前端组件期望的字段名称保持一致
- 使用蛇形命名法(snake_case)命名状态字段
- 复杂数据结构应使用数组形式,即使只有一个元素

### 3.3 必要的状态字段

每个Web Agent必须在`agent-types.ts`文件中定义其状态接口,并确保后端发送的状态与此接口匹配:

```typescript
export interface AgentState extends WithMessages {
  // 定义Agent特有的状态字段
  weather_forecast?: WeatherForecast[];
  research_status?: ResearchStatus[];
  // 其他状态字段
}
```

## 4. 前端组件规范

### 4.1 组件结构

- 主组件应根据节点名称渲染不同的子组件
- 子组件应检查所需状态字段是否存在,并提供合理的默认行为

```typescript
export default function renderNode(checkpoint, node) {
  switch (node.name) {
    case '__start__':
    case 'agent': // 注意:这里使用'agent'替代了原来的'chatbot'
      return <ChatbotNode />;
    case 'weather':
      return <WeatherNode />;
    // 其他节点类型
    default:
      return null;
  }
}
```

### 4.2 组件注册

所有Web Agent的节点组件必须在`page.tsx`的`renderNode`函数中正确注册:

```typescript
const renderNode = (checkpoint, node) => {
  switch (node.name) {
    // 确保这里的节点名称与后端图定义中的节点名称一致
    case '__start__':
    case 'agent': // 注意:这里使用'agent'替代了原来的'chatbot'
      return <ChatbotNode />;
    case 'weather':
      return <WeatherNode />;
    case 'reminder':
      return <Reminder />;
    case 'research':
    case 'search':
    case 'report':
      return <ResearchNode />;
    // 添加新节点类型的渲染逻辑
    default:
      return null;
  }
}
```

## 5. 后端图结构规范

### 5.1 节点函数

- 节点函数应使用适当的参数来处理状态
- 消息处理必须在与前端匹配的节点中进行

```python
async def agent(state):  # 注意:这里使用'agent'替代了原来的'chatbot'
    # 处理消息并返回结果
    return {"messages": [...]}  # 必须包含messages字段
```

### 5.2 图构建

- 图必须包含与前端匹配的节点,用于处理消息
- 必须实现`get_graph()`函数返回编译好的图实例

```python
def get_graph():
    """返回编译好的LangGraph实例"""
    builder = StateGraph(State)  # State 为你定义的图状态类型
    builder.add_node("agent", agent)  # 注意:这里使用'agent'替代了原来的'chatbot'
    # 添加边和其他节点
    graph = builder.compile(checkpointer=MemorySaver())
    return graph
```

## 6. 开发流程

### 6.1 新建Web Agent流程

1. 在`examples/web_agents/`下创建新的Agent目录
2. 创建`graph.py`文件,实现Agent的图结构,确保节点名称与前端`renderNode`函数中的case语句匹配
3. 在`web/app/chat/[id]/agent-types.ts`中添加Agent所需的状态接口
4. 在`web/app/chat/[id]/components/`下创建Agent的组件
5. 在`web/app/chat/[id]/page.tsx`的`renderNode`函数中注册Agent的节点组件(如果使用新的节点名称)

### 6.2 测试验证

在提交代码前,必须进行以下测试:

1. 确认后端图结构中的节点名称与前端`renderNode`函数中的case语句匹配
2. 验证前端组件能正确渲染不同类型的节点
3. 检查状态字段名称与前端组件期望的字段名称一致

## 7. 常见问题与解决方案

### 7.1 前端不显示消息问题

如果前端不显示消息内容,请检查:

1. 后端图结构中的节点名称是否与前端`renderNode`函数中的case语句匹配
2. 前端`renderNode`函数是否正确处理了对应的节点名称
3. 消息是否正确包含在state的messages字段中

### 7.2 状态更新不生效

确保状态更新时,字段名称与前端期望的字段名称一致,并且数据结构符合前端组件的预期。

### 7.3 添加新节点类型

如果需要添加新的节点类型,必须:

1. 在后端图结构中定义新节点
2. 在前端`page.tsx`的`renderNode`函数中添加对应的case语句
3. 创建新节点对应的前端组件
4. 在`agent-types.ts`中添加新节点所需的状态接口

---

遵循本规范可以有效避免前后端不一致导致的显示问题,提高Web Agent的开发效率和质量。



================================================
FILE: examples/web_agents/__init__.py
================================================
# Web Agents Package
# This package contains web agents that can be loaded by the server



================================================
FILE: examples/web_agents/research_assistant/README.md
================================================
# 研究助手

这是一个强大的研究助手代理,可以帮助用户进行在线研究、信息收集和报告生成。

## 功能

- 在线搜索信息
- 提取和总结网页内容
- 生成研究报告
- 实时显示研究进度

## 使用方法

用户可以通过自然语言与代理交互,例如:

- "帮我研究人工智能在医疗领域的应用"
- "查找关于气候变化的最新研究"
- "总结量子计算的基本原理"

## 技术实现

该代理使用LangGraph构建,结合了Supervisor和React模式,包含以下节点:

- supervisor: 协调整个研究流程
- search: 执行在线搜索
- extract: 提取网页内容
- analyze: 分析收集的信息
- report: 生成研究报告

研究过程中会实时更新状态,让用户了解当前进度。



================================================
FILE: examples/web_agents/research_assistant/__init__.py
================================================
# Research Assistant Agent
# This module provides a research assistant agent that can crawl websites and extract content

from .graph import get_graph

__all__ = ["get_graph"]



================================================
FILE: examples/web_agents/research_assistant/graph.py
================================================
from langgraph.prebuilt import create_react_agent
from langchain_openai import ChatOpenAI
from typing import Dict, Any
from dotenv import load_dotenv
from langchain_community.tools import TavilySearchResults
from langgraph.checkpoint.memory import MemorySaver
from core.tools.e2b_tool import E2BCodeInterpreterTool
from core.tools.registry import register_tool, ToolCategory
from core.llm.llm_manager import LLMManager

load_dotenv()  # 自动加载 .env 文件

# 初始化大模型
model = LLMManager().get_model("deepseek_v3")

# 创建Tavily搜索工具
tavily_search = TavilySearchResults(
    max_results=3,
    include_answer=True,
    include_raw_content=False,
    include_images=False,
    search_depth="advanced"
)

# 创建E2B代码解释器工具
e2b_code_interpreter = E2BCodeInterpreterTool()

research_agent = create_react_agent(
    model=model,
    tools=[tavily_search, e2b_code_interpreter],
    name="research_expert",
    # Prompt 告诉它是一个研究型 Agent,可调用 tavily_search 和 e2b_code_interpreter
    prompt=(
        "你是一位世界级的研究专家和数据分析师,擅长信息检索和数据分析。你有两个强大的工具可以使用:\n"
        "1. 'tavily_search_results_json':用于搜索网络获取实时信息\n"
        "2.
'e2b_code_interpreter':用于执行Python代码,支持数据分析和可视化\n\n" "当面对问题时,请遵循以下方法论:\n" "1. 分析问题:理解用户的需求和问题本质\n" "2. 制定计划:确定需要搜索哪些信息,以及是否需要进行数据分析\n" "3. 执行搜索:使用tavily_search_results_json工具获取最新信息\n" "4. 数据分析:如果需要,使用e2b_code_interpreter工具编写和执行Python代码进行数据分析和可视化\n" "5. 综合信息:将搜索结果和数据分析结果综合成一个连贯的回答\n\n" "重要提示:\n" "- 对于信息检索任务,使用tavily_search_results_json工具,并在回答中引用来源URL\n" "- 对于数据分析和可视化任务,使用e2b_code_interpreter工具执行Python代码\n" "- 在使用代码解释器时,确保导入必要的库(如pandas, matplotlib, numpy等)\n" "- 在代码中添加详细注释,解释关键步骤\n" "- 执行代码后,解释结果含义和见解" ), checkpointer=MemorySaver(), ) def get_graph(): return research_agent ================================================ FILE: examples/web_agents/weather_agent/README.md ================================================ # 天气代理 这是一个简单的天气查询代理,可以回答用户关于天气的问题,并提供天气预报信息。 ## 功能 - 查询当前天气 - 创建提醒 ## 使用方法 用户可以通过自然语言与代理交互,例如: - "今天北京的天气怎么样?" - "帮我设置一个提醒,明天早上8点去开会" ## 技术实现 该代理使用LangGraph构建,包含以下节点: - chatbot: 处理用户输入并生成回复 - weather: 处理天气查询请求 - reminder: 处理提醒创建请求 ================================================ FILE: examples/web_agents/weather_agent/__init__.py ================================================ # Weather Agent Example # This is a simple weather agent that can be loaded by the server import operator from typing import Literal, TypedDict, Any, Annotated from dotenv import load_dotenv from langchain_openai import ChatOpenAI from langgraph.graph import StateGraph, MessagesState, START, END from langgraph.checkpoint.memory import MemorySaver from langgraph.types import StreamWriter, interrupt, Send from langchain_core.messages import ToolMessage from langchain_core.tools import tool import random import asyncio load_dotenv() class Weather(TypedDict): location: str search_status: str result: str class State(MessagesState): weather_forecast: Annotated[list[Weather], operator.add] class WeatherInput(TypedDict): location: str tool_call_id: str class ToolNodeArgs(TypedDict): name: str args: dict[str, Any] id: str @tool async def weather_tool(query: str) -> str: """Call to get current weather""" return "Sunny" @tool async def create_reminder_tool(reminder_text: str) -> str: """Call to create a reminder""" return "Reminder created" async def weather(input: WeatherInput, writer: StreamWriter): location = input["location"] tool_call_id = input["tool_call_id"] # Send custom event to the client. It will update the state of the last checkpoint and all child nodes. # Note: if there are multiple child nodes (e.g. parallel nodes), the state will be updated for all of them. writer({"weather_forecast": [ {"location": location, "search_status": f"Checking weather in {location}"}]}) await asyncio.sleep(2) weather = random.choice(["Sunny", "Cloudy", "Rainy", "Snowy"]) return {"messages": [ToolMessage(content=weather, tool_call_id=tool_call_id)], "weather_forecast": [{"location": location, "search_status": "", "result": weather}]} async def reminder(input: ToolNodeArgs): res = interrupt(input['args']['reminder_text']) tool_answer = "Reminder created." if res == 'approve' else "Reminder creation cancelled by user." 
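    # 说明: interrupt() 会在此暂停图的执行,把 reminder_text 发给客户端等待确认;
    # 客户端恢复执行时传回的值即为 res,这里约定 'approve' 表示用户批准创建提醒。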
return {"messages": [ToolMessage(content=tool_answer, tool_call_id=input["id"])]} async def chatbot(state: State): llm = ChatOpenAI( model="gpt-4o-mini").bind_tools([weather_tool, create_reminder_tool]) response = await llm.ainvoke(state["messages"]) return {"messages": [response]} def tool_router(state: State) -> Literal["weather", "reminder", "__end__"]: messages = state["messages"] last_message = messages[-1] if last_message.tool_calls: if last_message.tool_calls[0]["name"] == "weather_tool": return "weather" elif last_message.tool_calls[0]["name"] == "create_reminder_tool": return "reminder" return "__end__" # Chatbot node router. Based on tool calls, creates the list of the next parallel nodes. def assign_tool(state: State) -> Literal["weather", "reminder", "__end__"]: messages = state["messages"] last_message = messages[-1] if last_message.tool_calls: send_list = [] for tool in last_message.tool_calls: if tool["name"] == 'weather_tool': send_list.append( Send('weather', {'location': tool['args']['query'], 'tool_call_id': tool['id']})) elif tool["name"] == 'create_reminder_tool': send_list.append(Send('reminder', tool)) return send_list if len(send_list) > 0 else "__end__" return "__end__" def get_graph(): """Return the compiled graph for this agent""" builder = StateGraph(State) builder.add_node("chatbot", chatbot) builder.add_node("weather", weather) builder.add_node("reminder", reminder) builder.add_edge(START, "chatbot") builder.add_conditional_edges("chatbot", assign_tool) builder.add_edge("weather", "chatbot") builder.add_edge("reminder", "chatbot") builder.add_edge("chatbot", END) memory = MemorySaver() return builder.compile(checkpointer=memory) ================================================ FILE: instructions/00.Langgraph 和 React Agent.md ================================================ # 一、LangGraph 的核心思想 LangGraph 是一个可以让开发者以**图(Graph)**的方式来编排对话式AI流程的库,提供了以下能力: 1. **状态驱动**:在传统的对话模型中,我们经常需要维护对话上下文、剩余步骤等各种内部变量。LangGraph 将这些变量统一到一个“状态(State)”里,并约定任何节点的输入/输出都以“状态(State)”的形式表示。 2. **可视化执行流**:LangGraph 将对话/工具调用/自定义逻辑封装成“节点(Node)”与“边(Edge)”。当图被编译后,执行流会在节点之间穿梭,处理对话消息、调用工具、终止或转向某些分支。 3. **可组合**:你可以把一个复杂的对话逻辑拆分为多个可复用的子图,每个子图都可以独立进行单元测试或复用在更大的图中。 4. **多步思考 + 工具调用**:通过 ReAct Agent(一个经典的多步推理+工具调用范式),LangGraph 可以帮助你自动管理**多次**调用语言模型及其衍生工具的过程——只要你把“工具”注册到图里。 在使用时,你基本会经历如下步骤: 1. **定义状态模式(state schema)**:说明 state 中必须包含哪些字段(如:对话消息 `messages`,剩余可用步骤 `remaining_steps`,等等)。 2. **定义节点(Node)**:比如一个负责调用LLM的节点、一个负责执行特定工具的节点、或者你自定义的Python逻辑节点。 3. **连接边(Edges)**:决定每个节点之后,下一步走到哪个节点;也可以做条件分支或循环。 4. **编译图(Compile)**:LangGraph 会把你的“编排逻辑”转换为一个 LangChain 兼容的“可调用对象(CompiledGraph)”。 5. 
**执行或流式执行**:可以直接一次性 `graph.invoke(...)` 得到最终结果,也可以使用 `graph.stream(...)` 流式获取每个“阶段性状态(partial state)” 。 --- # 二、LangGraph 核心概念详解 LangGraph 构建的是一个"流程图",每个智能体(agent)或功能模块(tool调用、分支逻辑)都是这个流程图的一个节点(node)。让我们深入理解其中的核心概念: ## 2.1 Graph:有状态的数据流图 Graph 是整个 Agent 系统的执行框架,定义了哪些模块怎么串联、怎么流转。你构建的 graph 是一个有向图: ```python graph = StateGraph(state_schema=MyState) # 添加节点 graph.add_node("supervisor", supervisor_runnable) graph.add_node("writer", writer_runnable) # 添加边来连接节点 graph.add_edge("supervisor", "writer") graph.add_edge("writer", "supervisor") ``` LangGraph 根据这些连接关系来控制执行流程,决定在某个节点执行完后下一步应该去哪里。 ## 2.2 Node:图中的"一个执行单元" 每个 node 是图中的一个处理模块(通常就是一个智能体)。它接受一个输入 state,做点事情,然后返回一个新的 state: ```python def my_node(state: dict) -> dict: # 处理 state 中的数据 new_state = state.copy() # 修改状态内容 new_state["some_key"] = "new_value" return new_state ``` 节点可以是: - 函数(同步或异步) - LLM Agent(如 create_react_agent 返回的) - 包装后的 Agent(如 MemorySlidingReactAgent) ## 2.3 State:每一轮节点处理的输入/输出 每轮调用,LangGraph 会传递一个 "state"(字典类型)给当前节点。这个 state 中可以包含: - `messages`: 当前对话历史(主上下文)【默认】 - `memory`: 你自定义的长期记忆(可以注入系统提示) - `todo_list`, `current_task`: 其他任务状态 - 任何你自定义的字段 每个节点执行后,返回新的 state: ```python def writer(state): new_msg = generate_chapter(state["current_task"]) state["messages"].append({"role": "assistant", "content": new_msg}) return state ``` ## 2.4 Runnable:Node 的运行接口 LangGraph 要求,每个节点(node)必须是可以运行的,也就是说:你交给 `add_node()` 的对象必须有 `.invoke(state)` 或 `.ainvoke(state)` 方法。 比如: - 函数本身(它会自动包装成 Runnable) - Agent(React agent 本身就支持 `.invoke`) - `RunnableCallable(...)` 是 LangGraph 用来显式包装函数的工具 举个例子: ```python def my_function(state: dict) -> dict: # 处理逻辑 return state runnable = RunnableCallable(my_function, async_version) graph.add_node("writer", runnable) ``` ## 2.5 执行流程 LangGraph 的执行流程大致如下: ``` LangGraph Graph: [START] ↓ [Supervisor Node] ↓ [Writer Node] ↓ [Supervisor Node] ↓ [END] ``` 每次节点执行时: 1. 传入当前 state 2. `.invoke(state)` 被调用 3. 返回更新后的 state 4. 下一节点接着执行 ## 2.6 概念类比 | LangGraph 概念 | 类比 | |----------------|------| | Graph | 工作流程图/数据流图 | | Node | 每个处理步骤/智能体 | | State | 当前上下文与执行状态(黑匣子) | | Runnable | 每个节点"能被执行"的接口定义 | --- # 三、ReAct Agent 与 create_react_agent 概念 ## 3.1 什么是 ReAct Agent “ReAct” 是一种典型的LLM多步推理与工具调用策略。它主要包含两部分: 1. **Reasoning**:先让语言模型(LLM)进行一步推理,产出一个潜在的思考过程以及可能的工具调用。 2. **Acting**:如果模型说“我要调用某个工具”,则执行该工具,得到结果,再把结果加入对话,然后让模型再次 Reason,看看是否还需要再调用工具,或输出最后的答案。 这个循环可以**多次往返**,直到模型不再调用工具,输出最终结果。 ## 3.2 create_react_agent 做了什么 `create_react_agent(...)` 是 LangGraph 中的一个快捷方法,用于**快速创建**一个可执行的“ReAct风格”图(Graph): - **自动添加“agent节点”**:用来调用你的语言模型(并在对话中发出可能的工具调用)。 - **自动添加“tools节点”**:如果 agent 的输出中含有工具调用(tool_calls),则会交给 tools 节点逐个执行,并把执行结果以 `ToolMessage` 的形式返回到对话中。 - **自动在 agent ↔ tools 之间连线**:只要 agent 产生了工具调用,就进入 tools;tools 执行完返回消息后,再回到 agent;直到不再有工具调用为止。 - **可选 structured output**:如果你传入了 `response_format` 参数,LangGraph 会在最后一步生成一个结构化输出(“JSON Schema”、“Pydantic”、“OpenAI function schema”等),以便你获取可解析的最终结果。 - **控制“剩余步骤”**:Agent 每次回答后会检查是否还可以继续调用工具,或者是否需要中止并返回错误(“抱歉,需要更多步骤”)。 因此,调用 `create_react_agent(...)` 得到的结果,是一个**已经配置好**的 “CompiledGraph”。这个图中带有 “agent” 节点(LLM) 和 “tools” 节点(调用工具),以及检查**是否还有工具要调**的逻辑。你可以直接拿这个对象执行,获得一个 ReAct 流程的多轮对话+工具使用。 --- # 四、执行流程:从输入到输出 创建好 ReAct 图后,你给它一个输入状态(最少包含 `"messages"`,如 `{"messages": [("user", "Hello!")]}`)。执行过程大体是: 1. **entry point: "agent"** 进入 agent 节点,它会从 state["messages"] 中取出消息,交给 LLM 生成一个 AIMessage。如果 AIMessage 包含 tool_calls,那么 state 会更新多一些字段,比如 `messages` 后面多了这个 AIMessage。 2. **检查是否要调用工具** - 如果 `tool_calls` 不为空,则顺着 edges 进入 "tools" 节点。 - 如果没有 tool_calls,则表示 agent 没有想调用任何工具 -> 流程会判断是否要去 “generate_structured_response” 或 “END”。 3. 
**tools 节点执行** "tools" 节点会去匹配 agent 要调用的工具,比如: ```json { "name": "search_tool", "args": {"query": "something"}, "id": "call_abc123" } ``` 然后运行相应的 Python 函数,得到结果后,包装成 `ToolMessage`,附加回 state["messages"] 列表里。 - 如果 agent 一次性请求了多个工具,在 v1 版本中则会并行执行,再把返回结果依次追加到 messages 里。 - 在 v2 版本中,LangGraph 会拆分 tool_calls 分批执行。 4. **回到 agent** 现在 agent 再次拿到新的 state["messages"](多了“ToolMessage”),就会针对最新的对话上下文重新进行思考——是否要再调用别的工具、或者是否直接产出最终回答? 5. **循环,直到不再调用工具** 只要 AIMessage 继续发出 tool_calls,就进入 Tools 节点;Tools 执行完再回到 Agent 节点。这一过程可能多次往返。(如果你设定了 `remaining_steps`,LangGraph 在每一轮都会减少1,直到不足时终止或报错,避免死循环。) 6. **可选:结构化输出** 在最后如果 `response_format` 存在,图会跳到“generate_structured_response”节点,再次对(几乎)所有对话做一次 LLM 调用,要求 LLM 产出符合**你给定schema**的 JSON,并存入 `structured_response` 字段中。然后再返回 END。 7. **结束** 整个 ReAct 流程完成后,图会返回一个最终状态,如: ```python { "messages": [ # 所有对话消息(包含了Human/AI/Tools等), ..., AIMessage(content="Here is the final answer", tool_calls=[]) ], "remaining_steps": 2, "structured_response": { ... } # 如果使用了response_format } ``` 你可以从中拿到想要的最终 AI 回答。 --- # 五、如何查看“中间推理”或“工具调用”? 从 **langgraph 0.3** 开始,`create_react_agent` 及其返回的 Graph 已经**不再支持** `graph.add_state_change_listener` 或在函数参数里传入 `callbacks`。如果你想**监听**或**打印** Agent 的中间思考、工具调用等过程,最好的方式是 **使用 `graph.stream(...)`**——它会在每一小步执行结束后产出一个“部分状态( partial_state )”,你可以在循环里进行日志记录、可视化或其他操作。示例: ```python graph = create_react_agent(model, tools=[...], prompt="...") inputs = { "messages": [ ("user", "请分析特斯拉2025年的发展预期,包括新车型计划、销量目标、技术创新和市场扩张战略。") ] } for partial_state in graph.stream(inputs, stream_mode="values"): messages = partial_state["messages"] last_msg = messages[-1] if last_msg.type == "ai": print("[AIMessage] => ", last_msg.content) if last_msg.tool_calls: print("AI wants to call tools:", last_msg.tool_calls) elif last_msg.type == "tool": print("[ToolMessage] => Name:", last_msg.name, "Content:", last_msg.content) elif last_msg.type == "human": print("[User] => ", last_msg.content) # 最后一次迭代时,partial_state 就是最终结果 final_answer = partial_state["messages"][-1].content print("最终回答:", final_answer) ``` 这样就能够**在每一次** Agent 或 Tools 完成后都获取状态,不需要“回调监听器”。 --- # 六、关于一些进阶用法 1. **`interrupt_before` / `interrupt_after`** 如果你希望在“agent”节点**执行前**或者**后**打断,可以设置这两个可选参数,比如: ```python create_react_agent( model, tools=[...], interrupt_before=["tools"], interrupt_after=["agent"], ... ) ``` 当执行流程跑到 agent 或 tools 时,会先/后给你一个“交互点”机会,你可以在**流式**执行中察觉到这个点,或者抛出异常提前终止等。但是它比较适合做“用户确认”或“调试介入”,而不是实时日志。 2. **`checkpointer` / `store`** - `checkpointer` 主要用来将单个“线程”(单条对话)的状态进行保存、恢复,可以在多回合对话里保留上下文。 - `store` 提供了更跨线程或跨用户的持久化能力。 通过把 `store` 绑定到 Graph,工具调用里还可以使用 `InjectedStore`,把数据写入或读取到 store 中(如相当于“全局数据库”)。 3. **`response_format`** 如果你想让最终输出符合某种 JSON Schema 或 Pydantic 验证,可以这样写: ```python from langchain_core.prompts import ChatPromptTemplate from pydantic import BaseModel, Field class TeslaPlan(BaseModel): new_models: list[str] = Field(..., description="新车型列表") sales_target: int = Field(..., description="预计销量") technology_innovations: str market_strategy: str my_response_format = TeslaPlan graph = create_react_agent( model, tools, prompt="你是一个专业汽车分析师。", response_format=my_response_format ) ``` 当 ReAct 流程结束后,LangGraph 会调用一次 LLM 并要求它返回符合 `TeslaPlan` 的 JSON。最终的 `state["structured_response"]` 就是一个 Python 字典或 Pydantic 实例。 4. **`version="v1" / "v2"`** - **v1**: 工具调用是“把当前 AIMessage 中的所有 tool_calls 一次性并行执行” → tools → 再回到 agent。 - **v2**: 更细粒度地把每个 tool_call 拆开,每个都进入一个独立的 ToolNode 实例。如果一个 AIMessage 里有 3 个 tool_calls,就会做 3 次独立的“tools执行→回到agent”循环**(通过 Send API)**。这种方式可以在多工具协作里更灵活,也可以插入更多自定义逻辑,但要做好相应的结构化处理。 --- # 七、常见问题与答疑 1. 
**Q: 我在旧版本使用 `graph.add_state_change_listener` 或 `callbacks`,现在为什么报错?** A: 因为新的 LangGraph 0.3 取消了这种回调API,推荐使用 `graph.stream(...)` 在每一步迭代中自行处理日志或监听逻辑。 2. **Q: 如果不想每次都多轮循环,而只想 LLMC 接受一次输入就结束,怎么做?** A: 你可以传递 `tools=[]`(空)到 `create_react_agent`,这样它就生成一个不支持工具调用的图;agent 只会输出一次,然后就结束。此时相当于纯LLM调用。 3. **Q: 要怎么限制调用工具的次数?** A: 你可以在输入的 `state` 里设置 `remaining_steps`,或自定义 `AgentState` 包含 `remaining_steps=3` 一类初始值,每次 agent节点执行后,LangGraph 会自动减少1。用完就不会再允许工具调用了。 4. **Q: ReAct 会在同一个消息里多次请求调用工具吗?** A: 是可能的。尤其是当 LLM 在回答中生成多个 tool_calls,就会全部执行。你可以在 `v1` 模式下并行运行它们,也可以在 `v2` 模式下逐个执行。 5. **Q: structured response 里的提示是如何工作的?** A: 当 `response_format` 是 `(system_prompt, schema)` 这种 tuple 时,LangGraph 会在最后的 LLM 调用里给一个额外的 system_prompt,引导 LLM 返回符合 schema 的 JSON。这样可以做更严格的结构化要求。 --- # 八、总结 - **LangGraph** 是一个以“图”来编排对话和工具调用的框架; - **create_react_agent** 是“快捷构造 ReAct 风格图”的核心函数,一次性帮你搭建“agent(LLM) ↔ tools(工具节点) ↔ agent”循环; - 执行时默认从 `agent` 开始,如果 `AIMessage` 包含 `tool_calls` 就调用 `tools` 并注入结果,直到不再有工具调用; - 可以**流式**(`graph.stream(...)`) 或**一次性**(`graph.invoke(...)`)获取结果; - 要想查看中间推理和调用日志,使用 `stream` 在每一步循环里记录; - 可选地,你能通过 `interrupt_before` / `interrupt_after` 或 `checkpointer` / `store` 等更高级特性进一步定制执行流程或存储/恢复状态。 这就是从**原理**到**源码**再到**执行流程**的完整解析。希望能帮助你在实际项目里更好地运用 `create_react_agent` 和 LangGraph! ================================================ FILE: instructions/01.supervisor_pattern.md ================================================ # Supervisor 模式:多智能体协作的核心实现 ## 1. 引言 在人工智能领域,多智能体系统(Multi-Agent System)是一种将复杂任务分解为多个专业智能体协同完成的架构模式。本文将详细介绍我们在 Mentis 项目中实现的 Supervisor(监督者)模式,这是一种高效组织和协调多个智能体的方法。 ## 2. 多智能体系统的基本概念 多智能体系统由多个具有不同专业能力的智能体组成,每个智能体负责特定的任务领域。在这种系统中,智能体之间需要有效地协作和通信,以完成复杂的任务。 在我们的实现中,主要包含以下角色: - **Supervisor(监督者)**:负责任务分发、协调和结果整合的中央控制智能体 - **Specialized Agents(专业智能体)**:具有特定领域专长的执行智能体 ## 3. Supervisor 模式的工作流程 ### 3.1 基本工作流程 Supervisor 模式的工作流程如下: 1. 用户向系统提交请求 2. Supervisor 接收请求并进行任务分析 3. Supervisor 决定调用哪个专业智能体处理任务 4. 专业智能体执行任务并返回结果 5. Supervisor 接收结果,可能进一步调用其他智能体 6. Supervisor 整合所有结果并返回给用户 ### 3.2 控制权转移机制 Supervisor 模式的核心是控制权的转移机制。在我们的实现中,这通过 `handoff` 工具实现: 1. Supervisor 通过调用特定的 `handoff` 工具将控制权转移给目标智能体 2. 目标智能体完成任务后,通过 `handoff_back_messages` 将控制权返回给 Supervisor 3. 这种机制确保了在任何时刻只有一个智能体在处理任务,避免了冲突 ## 4. Supervisor 的核心实现 ### 4.1 核心代码分析 在 `supervisor.py` 中,`create_supervisor` 函数是实现 Supervisor 模式的核心: ```python def create_supervisor( agents: list[Pregel], *, model: LanguageModelLike, tools: list[BaseTool | Callable] | None = None, prompt: Prompt | None = None, # ... 其他参数 ... ) -> StateGraph: # 检查智能体名称唯一性 agent_names = set() for agent in agents: if agent.name is None or agent.name == "LangGraph": raise ValueError("Please specify a name when you create your agent...") if agent.name in agent_names: raise ValueError(f"Agent with name '{agent.name}' already exists...") agent_names.add(agent.name) # 为每个智能体创建 handoff 工具 handoff_tools = [create_handoff_tool(agent_name=agent.name) for agent in agents] all_tools = (tools or []) + handoff_tools # 绑定工具到模型 model = model.bind_tools(all_tools) # 创建 supervisor 智能体 supervisor_agent = create_react_agent( name=supervisor_name, model=model, tools=all_tools, prompt=prompt, # ... 其他参数 ... 
) # 构建状态图 builder = StateGraph(state_schema, config_schema=config_schema) builder.add_node(supervisor_agent, destinations=tuple(agent_names) + (END,)) builder.add_edge(START, supervisor_agent.name) # 添加智能体节点和边 for agent in agents: builder.add_node( agent.name, _make_call_agent( agent, output_mode, add_handoff_back_messages, supervisor_name, ), ) builder.add_edge(agent.name, supervisor_agent.name) return builder ``` ### 4.2 智能体调用机制 `_make_call_agent` 函数负责创建智能体调用的包装函数: ```python def _make_call_agent( agent: Pregel, output_mode: OutputMode, add_handoff_back_messages: bool, supervisor_name: str, ) -> Callable[[dict], dict] | RunnableCallable: # ... 参数验证 ... def _process_output(output: dict) -> dict: messages = output["messages"] # 根据输出模式处理消息 if output_mode == "full_history": pass elif output_mode == "last_message": messages = messages[-1:] # 添加控制权返回消息 if add_handoff_back_messages: messages.extend(create_handoff_back_messages(agent.name, supervisor_name)) return { **output, "messages": messages, } def call_agent(state: dict) -> dict: output = agent.invoke(state) return _process_output(output) # ... 异步版本 ... return RunnableCallable(call_agent, acall_agent) ``` ### 4.3 设计亮点与最佳实践 Supervisor 模式的实现包含了多个多智能体系统设计的黄金经验,以下是关键设计亮点: #### 4.3.1 自动控制权回传机制 `_make_call_agent` 中的自动 handoff back 机制非常巧妙: ```python if add_handoff_back_messages: messages.extend(create_handoff_back_messages(agent.name, supervisor_name)) ``` 这种设计的优势在于: - **隐式交接**:专业智能体无需知道 supervisor 的存在 - **自动转发**:智能体完成任务后,系统自动将结果打包并转交回 supervisor - **消息插入**:在消息历史中自动插入 AIMessage 和 ToolMessage,表明控制权已转移 - **零侵入性**:对智能体代码没有任何侵入,实现了完全的关注点分离 #### 4.3.2 智能的上下文管理策略 `output_mode` 参数提供了对消息历史的精确控制: ```python if output_mode == "last_message": messages = messages[-1:] ``` 这允许开发者灵活选择: - **全量历史模式**(`full_history`):保留智能体输出的完整历史,提供完整上下文 - **最后消息模式**(`last_message`):仅保留最后一条消息,有效节省 token 消耗 这种灵活的上下文压缩策略,在长对话或多轮智能体调用场景中尤为重要,可以有效防止上下文爆炸。 #### 4.3.3 动态工具生成与绑定 系统会自动为每个智能体创建对应的 handoff 工具: ```python handoff_tools = [create_handoff_tool(agent_name=agent.name) for agent in agents] ``` 这些工具允许 supervisor 通过类似 `transfer_to_writer()` 或 `transfer_to_researcher()` 的函数调用来转移控制权,实现了: - **声明式调度**:调度逻辑由 LLM 决定,而非硬编码规则 - **可解释性**:每次转移都有明确的工具调用,便于追踪和调试 - **灵活性**:可以根据当前状态动态决定下一步调用哪个智能体 #### 4.3.4 统一的 Runnable 接口封装 每个智能体都被统一封装为 `RunnableCallable`: ```python builder.add_node(agent.name, _make_call_agent(...)) ``` 这种封装提供了多种优势: - **统一接口**:所有智能体都遵循相同的调用接口 - **状态管理**:状态由 LangGraph 自动管理,无需手动处理 - **异步支持**:同时支持同步和异步调用,适应不同场景 - **自动处理**:输入/输出状态转换自动完成,减少样板代码 #### 4.3.5 灵活的配置选项 系统支持多种配置选项,适应不同需求: - **多种提示格式**:支持字符串、SystemMessage 或可调用函数作为提示 - **结构化输出**:支持 JSON schema、TypedDict 或 Pydantic 类作为输出格式 - **状态模式**:可自定义状态结构,支持复杂的状态追踪和管理 - **并行工具调用控制**:可以针对不同模型配置是否支持并行工具调用 ## 5. 实践案例:笑话生成与研究专家 在 `01_supervisor_test.py` 中,我们实现了一个包含两个专业智能体的系统: ### 5.1 智能体创建 我们使用了两种不同的方式创建智能体: #### 5.1.1 功能型 API(Functional API) 笑话生成器使用功能型 API 创建: ```python @task def generate_joke(messages): """Generate a short joke (no tool calls).""" system_message = { "role": "system", "content": "You are a witty comedian. Write a short joke." } msg = model.invoke([system_message] + messages) return msg @entrypoint() def joke_agent(state): joke = generate_joke(state['messages']).result() messages = add_messages(state["messages"], [joke]) return {"messages": messages} joke_agent.name = "joke_agent" ``` #### 5.1.2 图形 API(Graph API) 研究专家使用图形 API 创建: ```python def web_search(query: str) -> str: """Search the web for information. (Mocked data here)""" return ( "Here are the headcounts for each of the FAANG companies in 2024:\n" # ... 模拟数据 ... 
) research_agent = create_react_agent( model=model, tools=[web_search], name="research_expert", prompt=( "You are a world-class researcher. You have access to a 'web_search(query: str)' tool. " "Do not do any complicated math, just provide factual info from the web_search if needed." ), ) ``` ### 5.2 Supervisor 配置 我们创建了一个 Supervisor 来协调这两个智能体: ```python workflow = create_supervisor( [research_agent, joke_agent], model=model, prompt=( "You are the overall supervisor. You manage two specialized agents:\n" "1) joke_agent: for telling jokes.\n" "2) research_expert: for factual or data-related questions.\n\n" "If the user wants a joke AND some research data in the same query, " "you MUST call joke_agent first, get the joke, then call research_expert for the data. " "After both calls, provide a final combined response. " "Do not call more than one agent in a single LLM message; do it step by step." ), ) ``` ### 5.3 执行流程 当用户请求同时需要笑话和研究数据时,执行流程如下: 1. Supervisor 接收用户请求 2. Supervisor 分析请求,决定先调用 joke_agent 3. joke_agent 生成笑话并返回结果 4. Supervisor 接收笑话,然后调用 research_expert 5. research_expert 查询数据并返回结果 6. Supervisor 整合两个结果,生成最终回复 ## 6. 可视化与调试 我们使用 LangGraph 的可视化功能生成了工作流图表,保存在 `examples/graphs/1_supervisor_test_01.png`,这有助于理解和调试多智能体系统的工作流程。 ## 7. 总结 Supervisor 模式是一种高效组织多智能体系统的方法,它通过中央控制智能体协调专业智能体的工作,实现复杂任务的分解与协作。在我们的实现中,通过精心设计的 handoff 机制实现了智能体之间的控制权转移,确保系统的有序运行。 这种模式的优势在于: 1. **模块化**:每个智能体专注于特定领域,便于开发和维护 2. **可扩展性**:可以方便地添加新的专业智能体 3. **灵活性**:Supervisor 可以根据任务需求动态调用不同的智能体 4. **结果整合**:Supervisor 负责整合各个智能体的结果,提供一致的用户体验 5. **低耦合**:智能体之间通过消息传递交互,减少直接依赖 6. **可追踪性**:每次控制权转移都有明确的工具调用记录,便于调试和监控 7. **资源优化**:通过上下文管理策略,有效控制 token 消耗 8. **开发便捷**:统一的接口和自动化的状态管理,减少样板代码 通过本文的实践案例和深入分析,我们不仅展示了如何使用 LangGraph 和 LangChain 框架实现 Supervisor 模式,更揭示了背后的设计思想和最佳实践,为构建复杂的多智能体系统提供了宝贵参考。这些设计模式和技巧可以帮助开发者构建更加健壮、可维护和高效的智能体系统。 ================================================ FILE: instructions/02.supervisor_pattern_agent.md ================================================ # Supervisor 模式:多智能体协作的核心实现 (Agent 封装模式) ## 1. 引言 在人工智能领域,多智能体系统(Multi-Agent System)是一种将复杂任务分解为多个专业智能体协同完成的架构模式。本文将详细介绍我们在 Mentis 项目中实现的 Supervisor(监督者)模式,这是一种高效组织和协调多个智能体的方法。 ## 2. 多智能体系统的基本概念 多智能体系统由多个具有不同专业能力的智能体组成,每个智能体负责特定的任务领域。在这种系统中,智能体之间需要有效地协作和通信,以完成复杂的任务。 在我们的实现中,主要包含以下角色: - **Supervisor(监督者)**:负责任务分发、协调和结果整合的中央控制智能体 - **Specialized Agents(专业智能体)**:具有特定领域专长的执行智能体 ## 3. Supervisor 模式的工作流程 ### 3.1 基本工作流程 Supervisor 模式的工作流程如下: 1. 用户向系统提交请求 2. Supervisor 接收请求并进行任务分析 3. Supervisor 决定调用哪个专业智能体处理任务 4. 专业智能体执行任务并返回结果 5. Supervisor 接收结果,可能进一步调用其他智能体 6. Supervisor 整合所有结果并返回给用户 ### 3.2 控制权转移机制 Supervisor 模式的核心是控制权的转移机制。在我们的实现中,这通过 `handoff` 工具实现: 1. Supervisor 通过调用特定的 `handoff` 工具将控制权转移给目标智能体 2. 目标智能体完成任务后,通过 `handoff_back_messages` 将控制权返回给 Supervisor 3. 这种机制确保了在任何时刻只有一个智能体在处理任务,避免了冲突 ## 4. 基础架构:BaseAgent 类 在我们的重构中,我们引入了 `BaseAgent` 基类,作为所有智能体的基础。这种设计使得不同类型的智能体可以共享通用功能,同时保持各自的特性。 ### 4.1 BaseAgent 核心实现 ```python class BaseAgent: _PROMPT_TEMPLATE = """ You have access to the following tools: {tools} Use the above tools to answer the question at the end. 
""" def __init__( self, name: str, model: Union[BaseChatModel, LanguageModelLike], tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[Union[str, SystemMessage, Callable]] = None, checkpointer: Optional[Checkpointer] = None, max_context_messages: Optional[int] = None, # 限制最近消息数量 max_context_tokens: Optional[int] = None, # 限制总估计token数 model_name: Optional[str] = "gpt-4o-mini", # 用于未来token估计改进 ): # 初始化基本属性 self.name = name self.model = model self.tools = tools or [] self.prompt = prompt self.checkpointer = checkpointer self.max_context_messages = max_context_messages self.max_context_tokens = max_context_tokens self.model_name = model_name self._workflow = None self._agent = None ``` ### 4.2 上下文管理机制 `BaseAgent` 提供了智能的上下文管理机制,可以根据配置自动截断消息历史: ```python def _inject_context(self, state: Dict[str, Any]) -> Dict[str, Any]: """注入记忆并根据配置截断消息。""" memory = state.get("memory") or [] messages = state.get("messages", []) messages = self._truncate_messages(messages) memory_messages = [SystemMessage(content=chunk) for chunk in memory] state["messages"] = memory_messages + messages return state ``` ### 4.3 通用方法接口 `BaseAgent` 定义了所有智能体共享的核心方法接口: ```python def build(self) -> StateGraph: """构建工作流。""" def compile(self) -> CompiledStateGraph: """编译工作流。""" def invoke(self, state: Dict[str, Any]) -> Dict[str, Any]: """同步调用工作流。""" async def ainvoke(self, state: Dict[str, Any]) -> Dict[str, Any]: """异步调用工作流。""" ``` ## 5. ReactAgent 类实现 `ReactAgent` 是我们实现的基于 ReAct(Reasoning and Acting)模式的智能体,它继承自 `BaseAgent`,专注于推理和工具调用。 ### 5.1 ReactAgent 类设计 ```python class ReactAgent(BaseAgent): """ReAct Agent class for reasoning and acting with tools. This class provides a high-level interface for creating a ReAct agent workflow that can perform multi-step reasoning and tool calling. 
""" def __init__( self, model: LanguageModelLike, tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[str] = None, response_format: Optional[ Union[StructuredResponseSchema, tuple[str, StructuredResponseSchema]] ] = None, state_schema: StateSchemaType = AgentState, config_schema: Type[Any] = None, checkpointer: Optional[Checkpointer] = None, store: Optional[BaseStore] = None, interrupt_before: Optional[List[str]] = None, interrupt_after: Optional[List[str]] = None, debug: bool = False, version: Literal["v1", "v2"] = "v1", name: str = "react_agent", max_context_messages: Optional[int] = None, max_context_tokens: Optional[int] = None, model_name: Optional[str] = "gpt-4o-mini", ): # 调用父类初始化 super().__init__( name=name, model=model, tools=tools or [], prompt=prompt, checkpointer=checkpointer, max_context_messages=max_context_messages, max_context_tokens=max_context_tokens, model_name=model_name ) # 初始化ReactAgent特有属性 self.response_format = response_format self.state_schema = state_schema self.config_schema = config_schema self.store = store self.interrupt_before = interrupt_before self.interrupt_after = interrupt_after self.debug = debug self.version = version self._agent = None ``` ### 5.2 核心方法实现 #### 5.2.1 compile 方法 `compile` 方法负责编译 ReactAgent 工作流: ```python def compile(self) -> CompiledGraph: """构建 ReAct agent 工作流。 Returns: 编译后的 CompiledGraph """ # 如果_agent已经存在,直接返回,避免重复构建 if self._agent is not None: return self._agent _react_agent = create_react_agent( model=self.model, tools=self.tools, prompt=self.prompt, response_format=self.response_format, state_schema=self.state_schema, config_schema=self.config_schema, checkpointer=self.checkpointer, store=self.store, interrupt_before=self.interrupt_before, interrupt_after=self.interrupt_after, debug=self.debug, version=self.version, name=self.name, ) self._agent = CreateReactAgentWrapper(_react_agent, name=self.name, before_invoke=self.invoke, before_ainvoke=self.ainvoke) return self._agent ``` #### 5.2.2 invoke 和 ainvoke 方法 `invoke` 和 `ainvoke` 方法负责调用 ReactAgent 处理用户请求,并提供调试信息: ```python def invoke(self, state: Dict[str, Any]) -> Dict[str, Any]: """同步调用入口 (真正的 Agent 执行逻辑).""" # 打印调试信息 messages = state.get("messages", []) if messages: for i, msg in enumerate(messages, 1): type_str = type(msg).__name__ print(f"第 {i} 条消息 - {type_str} (Name: {msg.name}):") msg.pretty_print() # 上下文注入 state = self._inject_context(state) return state async def ainvoke(self, state: Dict[str, Any]) -> Dict[str, Any]: """异步调用入口.""" # 上下文注入 state = await self._inject_context(state) return state ``` ## 6. SupervisorAgent 类实现 `SupervisorAgent` 类继承自 `BaseAgent`,专注于协调多个智能体的工作。在重构后,它增加了规划功能,可以更有效地管理复杂任务。 ### 6.1 SupervisorAgent 类设计 ```python class SupervisorAgent(BaseAgent): """Supervisor class for managing multiple agents with planning capabilities. This class provides a high-level interface for creating a supervisor workflow that can manage and coordinate multiple agents. It also includes planning capabilities to create and manage a plan for complex tasks using a state-driven approach. The planning functionality is implemented using PlanningStateHandler and PlanningTool, which provide a more structured and flexible way to manage tasks compared to the previous TodolistTool approach. 
""" def __init__( self, agents: List[BaseAgent], model: LanguageModelLike, tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[str] = None, state_schema: StateSchemaType = AgentState, supervisor_name: str = "supervisor", checkpointer: Optional[Checkpointer] = None, output_mode: str = "last_message", # * full_history or last_message * enable_planning: bool = True, # * True or False * ): # 设置规划相关属性 self._enable_planning = enable_planning # 如果启用规划功能,设置状态模式为PlanningAgentState if self._enable_planning and state_schema == AgentState: state_schema = PlanningAgentState # 存储特定于智能体的属性 self.agents = agents self.output_mode = output_mode self.supervisor_name = supervisor_name self.state_schema = state_schema self.checkpointer = checkpointer self.tools = tools or [] self._workflow = None self._agent = None # 生成基础提示词 _final_prompt = self._PLANNING_PROMPT_TEMPLATE + "/n/n" + self._PLANNING_TOOL_TEMPLATE if self._enable_planning else self._PROMPT_TEMPLATE # 如果启用规划功能,添加规划工具 if self._enable_planning: tools = tools or [] tools.append(SimplePlanningTool()) # 初始化BaseAgent父类 super().__init__( name=supervisor_name, model=model, tools=tools, checkpointer=checkpointer, prompt=_final_prompt, ) ``` ### 6.2 核心方法实现 #### 6.2.1 build 方法 `build` 方法负责构建 Supervisor 工作流: ```python def build(self) -> StateGraph: """构建 supervisor 工作流。 Returns: 构建的 StateGraph """ if self._workflow is not None: return self._workflow self._workflow = create_supervisor( agents=self.agents, model=self.model, tools=self.tools, prompt=self.prompt, state_schema=self.state_schema, supervisor_name=self.supervisor_name, output_mode=self.output_mode, ) return self._workflow ``` ## 7. create_supervisor 函数实现 `create_supervisor` 函数是 SupervisorAgent 的核心依赖,它负责创建多智能体协作的工作流。 ```python def create_supervisor( agents: list[Pregel], *, model: LanguageModelLike, tools: list[BaseTool | Callable] | None = None, prompt: Prompt | None = None, response_format: Optional[ Union[StructuredResponseSchema, tuple[str, StructuredResponseSchema]] ] = None, state_schema: StateSchemaType = AgentState, config_schema: Type[Any] | None = None, output_mode: OutputMode = "last_message", add_handoff_back_messages: bool = True, supervisor_name: str = "supervisor", include_agent_name: AgentNameMode | None = None, ) -> StateGraph: # 检查智能体名称唯一性 agent_names = set() for agent in agents: if agent.name is None or agent.name == "LangGraph": raise ValueError( "Please specify a name when you create your agent..." ) if agent.name in agent_names: raise ValueError( f"Agent with name '{agent.name}' already exists. Agent names must be unique." 
) agent_names.add(agent.name) # 为每个智能体创建 handoff 工具 handoff_tools = [create_handoff_tool(agent_name=agent.name) for agent in agents] all_tools = (tools or []) + handoff_tools # 绑定工具到模型 if _supports_disable_parallel_tool_calls(model): model = model.bind_tools(all_tools, parallel_tool_calls=False) else: model = model.bind_tools(all_tools) # 处理智能体名称显示方式 if include_agent_name: model = with_agent_name(model, include_agent_name) # 创建 supervisor 智能体 _react_agent = ReactAgent( name=supervisor_name, model=model, tools=all_tools, prompt=prompt, state_schema=state_schema, response_format=response_format, debug=False, ) supervisor_agent = _react_agent.compile() # 构建状态图 builder = StateGraph(state_schema, config_schema=config_schema) builder.add_node(supervisor_agent, destinations=tuple(agent_names) + (END,)) builder.add_edge(START, supervisor_agent.name) # 添加智能体节点和边 for agent in agents: # 如果智能体是 "ReactAgent" 或类似类型 if hasattr(agent, "get_agent") and callable(agent.get_agent): agent = agent.get_agent() # 获取编译后的子图 builder.add_node( agent.name, _make_call_agent( agent, output_mode, add_handoff_back_messages, supervisor_name, ), ) builder.add_edge(agent.name, supervisor_agent.name) return builder ``` ## 8. 实践案例 ### 8.1 使用 create_supervisor 函数(原始方式) 在 `01_supervisor_test.py` 中,我们使用原始的 `create_supervisor` 函数实现了一个包含两个专业智能体的系统: ```python workflow = create_supervisor( [research_agent, joke_agent], model=model, prompt=( "You are the overall supervisor. You manage two specialized agents:\n" "1) joke_agent: for telling jokes.\n" "2) research_expert: for factual or data-related questions.\n\n" "If the user wants a joke AND some research data in the same query, " "you MUST call joke_agent first, get the joke, then call research_expert for the data. " "After both calls, provide a final combined response. " "Do not call more than one agent in a single LLM message; do it step by step." ), ) # 编译得到一个可调用的"App" app = workflow.compile() ``` ### 8.2 使用 SupervisorAgent 类(封装方式) 在 `02_supervisor_agent_test.py` 中,我们使用封装的 `SupervisorAgent` 类实现了相同的功能,但增加了规划能力: ```python # 创建 SupervisorAgent 实例 supervisor = SupervisorAgent( agents=[research_agent, joke_agent], model=model, prompt=( "You are the overall supervisor. You manage two specialized agents:\n" "1) joke_agent: for telling jokes.\n" "2) research_expert: for factual or data-related questions.\n\n" "If the user wants a joke AND some research data in the same query, " "you MUST call joke_agent first, get the joke, then call research_expert for the data. " "After both calls, provide a final combined response. " "Do not call more than one agent in a single LLM message; do it step by step." ), enable_planning=True, # 启用规划功能 ) # 编译得到一个可调用的"App" app = supervisor.compile() ``` ### 8.3 两种方式的比较 两种实现方式在基本功能上相似,但使用 `SupervisorAgent` 类的方式有以下优势: 1. **更简洁的 API**:封装了复杂的参数和配置,提供了更简洁的接口 2. **更好的封装性**:将相关功能封装在一个类中,便于维护和扩展 3. **更好的可读性**:代码结构更清晰,意图更明确 4. **更好的可重用性**:可以方便地在不同项目中复用 5. **规划功能**:内置了任务规划能力,可以更有效地管理复杂任务 6. **上下文管理**:通过 BaseAgent 继承了智能的上下文管理机制 ## 9. 总结 在重构后的实现中,我们引入了以下关键改进: 1. **BaseAgent 基类**:提供了所有智能体共享的基础功能,如上下文管理、工作流构建等 2. **ReactAgent 重构**:现在继承自 BaseAgent,使用 CreateReactAgentWrapper 增强功能 3. **SupervisorAgent 重构**:现在继承自 BaseAgent,增加了规划功能 4. **统一的接口**:所有智能体类型现在共享相同的核心方法接口 5. 
**智能上下文管理**:可以根据配置自动截断消息历史,优化性能 Supervisor 模式是一种高效组织多智能体系统的方法,它通过中央控制智能体协调专业智能体的工作,实现复杂任务的分解与协作。在我们的重构实现中,通过引入 BaseAgent 基类和增强 SupervisorAgent 的规划能力,使得多智能体系统更加灵活、高效,同时保持了良好的可维护性和可扩展性。 这种模式特别适合以下场景: - 需要多种专业知识协作的复杂任务 - 需要动态决策调用不同专家的场景 - 需要结果整合和质量控制的任务流程 - 需要有计划地执行多步骤任务的场景 未来,我们将继续优化 Supervisor 模式的实现,增强其灵活性和可扩展性,并探索更多的应用场景。 ================================================ FILE: instructions/03.tavily_search_integration.md ================================================ # Tavily搜索工具集成:为多智能体系统提供实时信息能力 ## 1. 引言 在多智能体系统中,获取实时、准确的外部信息是提升系统实用性的关键因素。本文将详细介绍我们在 Mentis 项目中集成 Tavily 搜索工具的实现,这使得我们的智能体系统能够获取最新的网络信息,大幅提升了系统的实用价值。 ## 2. Tavily 搜索工具概述 Tavily 是一个专为 AI 应用设计的搜索 API,它提供了高质量、结构化的网络搜索结果。在我们的实现中,Tavily 工具具有以下特点: - **实时性**:能够获取最新的网络信息 - **结构化输出**:返回格式化的搜索结果,便于智能体处理 - **可配置性**:支持多种参数配置,如搜索深度、结果数量等 - **多媒体支持**:可选择性地包含图片等多媒体内容 ## 3. Tavily 工具的实现 ### 3.1 核心代码分析 在 `tavily_tools.py` 中,我们实现了 `TavilySearchResults` 类,它继承自 LangChain 的 `BaseTool`: ```python class TavilySearchResults(BaseTool): """Tool that queries the Tavily Search API and gets back json.""" name: str = "tavily_search_results_json" description: str = ( "A search engine optimized for comprehensive, accurate, and trusted results. " "Useful for when you need to answer questions about current events. " "Input should be a search query." ) args_schema: Type[BaseModel] = TavilyInput max_results: int = 5 """Max search results to return, default is 5""" search_depth: str = "advanced" """The depth of the search. It can be "basic" or "advanced"""" include_domains: List[str] = [] """A list of domains to specifically include in the search results.""" exclude_domains: List[str] = [] """A list of domains to specifically exclude from the search results.""" include_answer: bool = False """Include a short answer to original query in the search results.""" include_raw_content: bool = False """Include cleaned and parsed HTML of each site search results.""" include_images: bool = False """Include a list of query related images in the response.""" api_wrapper: TavilySearchAPIWrapper = Field(default_factory=TavilySearchAPIWrapper) response_format: Literal["content_and_artifact"] = "content_and_artifact" ``` ### 3.2 搜索执行方法 `TavilySearchResults` 类提供了同步和异步两种搜索方法: ```python def _run( self, query: str, run_manager: Optional[CallbackManagerForToolRun] = None, ) -> Tuple[Union[List[Dict[str, str]], str], Dict]: """Use the tool.""" try: raw_results = self.api_wrapper.raw_results( query, self.max_results, self.search_depth, self.include_domains, self.exclude_domains, self.include_answer, self.include_raw_content, self.include_images, ) except Exception as e: return repr(e), {} return self.api_wrapper.clean_results(raw_results["results"]), raw_results async def _arun( self, query: str, run_manager: Optional[AsyncCallbackManagerForToolRun] = None, ) -> Tuple[Union[List[Dict[str, str]], str], Dict]: """Use the tool asynchronously.""" # 异步实现... ``` ## 4. 在多智能体系统中集成 Tavily 工具 ### 4.1 创建研究型智能体 在我们的多智能体系统中,我们创建了一个专门的研究型智能体,它使用 Tavily 搜索工具获取实时信息: ```python # 创建Tavily搜索工具 tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=False, include_images=False, search_depth="advanced" ) research_agent = create_react_agent( model=model, tools=[tavily_search], name="research_expert", prompt=( "You are a world-class researcher. You have access to the 'tavily_search_results_json' tool " "which can search the web for real-time information. " "When asked a question, use this tool to find accurate and up-to-date information. 
" "Summarize the search results in a clear and concise manner. " "Always cite your sources by including the URLs from the search results." ), ) ``` ### 4.2 与 Supervisor 集成 研究型智能体作为专业智能体,被集成到 Supervisor 模式中: ```python # 创建 SupervisorAgent 实例 supervisor = SupervisorAgent( agents=[research_agent, joke_agent], model=model, prompt=( "You are the overall supervisor. You manage two specialized agents:\n" "1) joke_agent: for telling jokes.\n" "2) research_expert: for factual or data-related questions using real-time web search.\n\n" "If the user wants a joke, call joke_agent.\n" "If the user wants factual information or research data, call research_expert.\n" "If the user wants a joke AND some research data in the same query, " "you MUST call joke_agent first, get the joke, then call research_expert for the data. " "After both calls, provide a final combined response. " "Do not call more than one agent in a single LLM message; do it step by step." ), ) ``` ## 5. 实践案例 ### 5.1 只询问研究数据 当用户只询问研究数据时,Supervisor 会直接调用研究型智能体: ```python # 示例2:只询问研究数据 result2 = app.invoke({"messages": [{"role": "user", "content": "谁是现任美国总统?"}]}) ``` 在这种情况下,研究型智能体会使用 Tavily 搜索工具获取最新信息,并返回结构化的回答,包括引用的来源。 ### 5.2 混合查询 当用户同时需要笑话和研究数据时,Supervisor 会先调用笑话智能体,然后调用研究型智能体: ```python # 示例3:同时询问笑话和研究数据 result3 = app.invoke({"messages": [{"role": "user", "content": "讲个关于人工智能的笑话,然后告诉我什么是大型语言模型"}]}) ``` 这种情况下,Supervisor 会协调两个智能体的工作,并整合它们的结果。 ## 6. 可视化与调试 我们使用 LangGraph 的可视化功能生成了工作流图表,保存在 `examples/graphs/03_tavily_tools_test.png`。这个图表展示了包含 Tavily 搜索工具的多智能体系统的工作流程,有助于理解和调试系统。 ## 7. 总结 Tavily 搜索工具的集成为我们的多智能体系统带来了以下优势: 1. **实时信息获取**:系统能够获取最新的网络信息,不再局限于模型训练数据的时间范围 2. **信息准确性提升**:通过引用可靠的网络来源,提高了系统回答的准确性 3. **功能扩展**:使系统能够回答关于最新事件、数据和信息的问题 4. **灵活配置**:可以根据需要调整搜索参数,优化搜索结果 通过 Tavily 搜索工具的集成,我们的多智能体系统从一个封闭的知识系统转变为一个能够获取实时信息的开放系统,大大提升了系统的实用价值和应用范围。 未来,我们计划进一步优化搜索工具的使用策略,提高搜索效率和结果质量,并探索更多外部工具的集成,使系统能够处理更复杂的任务。 ================================================ FILE: instructions/04.react_agent.md ================================================ # ReactAgent:基于ReAct方法论的多步推理与工具调用框架 ## 1. 引言 ReactAgent是一个基于ReAct方法论的智能体框架,它能够通过多步推理和工具调用来解决复杂问题。本文将详细介绍ReactAgent的核心概念、工作原理、实现方式以及在实际应用中的使用方法。 ## 2. ReactAgent的核心概念 ### 2.1 什么是ReAct方法论 ReAct(Reasoning + Acting)是一种结合推理和行动的AI问题解决方法论,它包含两个核心步骤: 1. **推理(Reasoning)**:让语言模型进行思考,分析问题,并决定下一步行动。 2. **行动(Acting)**:执行具体的工具调用,获取外部信息或执行特定操作。 这两个步骤可以多次循环往复,直到问题被解决。ReAct方法论特别适合处理需要多步骤、多工具协作的复杂问题。 ### 2.2 ReactAgent与LangGraph的关系 ReactAgent是基于LangGraph框架实现的,它利用LangGraph的图结构来编排推理和行动的流程。在LangGraph中,ReactAgent被表示为一个包含多个节点和边的有向图: - **节点(Node)**:包括Agent节点(负责推理)和Tools节点(负责执行工具调用) - **边(Edge)**:定义节点之间的转换条件,例如当Agent生成工具调用时,流程转向Tools节点 ## 3. ReactAgent的实现 ### 3.1 ReactAgent类的设计 在我们的实现中,ReactAgent类继承自LangGraph的Pregel类,提供了一个高级接口来创建和管理ReAct工作流: ```python class ReactAgent(Pregel): """ReAct Agent class for reasoning and acting with tools. This class provides a high-level interface for creating a ReAct agent workflow that can perform multi-step reasoning and tool calling. """ def __init__( self, model: LanguageModelLike, tools: Optional[List[Union[BaseTool, Callable]]] = None, prompt: Optional[str] = None, response_format: Optional[ Union[StructuredResponseSchema, tuple[str, StructuredResponseSchema]] ] = None, state_schema: StateSchemaType = AgentState, config_schema: Type[Any] = None, interrupt_before: Optional[List[str]] = None, interrupt_after: Optional[List[str]] = None, debug: bool = False, version: Literal["v1", "v2"] = "v1", name: str = "react_agent", ): # 初始化代码... ``` ### 3.2 核心方法 ReactAgent类提供了以下核心方法: 1. **build()**: 构建ReAct工作流图 2. 
**compile()**: 编译工作流为可执行应用 3. **invoke()**: 同步执行ReAct工作流 4. **ainvoke()**: 异步执行ReAct工作流 5. **stream()**: 流式执行,可以获取中间状态 6. **get_graph()**: 获取底层图结构,用于可视化或调试 ### 3.3 与create_react_agent的关系 ReactAgent类内部使用了LangGraph提供的`create_react_agent`函数来构建工作流图。这个函数自动处理了: - 创建Agent节点(用于调用语言模型) - 创建Tools节点(用于执行工具调用) - 在节点之间建立连接 - 处理状态管理和流程控制 ## 4. 使用ReactAgent解决复杂问题 ### 4.1 基本使用流程 使用ReactAgent的基本流程如下: 1. **初始化ReactAgent**:提供语言模型和工具 2. **编译工作流**:调用compile()方法 3. **准备初始状态**:通常包含用户的问题 4. **执行或流式执行**:使用invoke()或stream()方法 5. **处理结果**:分析最终状态或中间状态 ### 4.2 集成Tavily搜索工具 在实际应用中,我们经常将ReactAgent与Tavily搜索工具集成,使其能够获取实时网络信息: ```python # 创建Tavily搜索工具 tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=True, include_images=False, search_depth="advanced" ) # 创建ReactAgent实例 react_agent = ReactAgent( model=model, tools=[tavily_search], prompt=( "你是一位专业的研究分析师,擅长分析复杂问题并提供深入见解。\n" "当面对复杂问题时,请遵循以下REACT方法论:\n" "1. 分解问题:将复杂问题分解为更小的子问题\n" "2. 制定计划:确定需要搜索哪些信息,以及搜索的顺序\n" "3. 执行搜索:使用tavily_search_results_json工具执行搜索\n" "4. 分析结果:分析搜索结果,确定是否需要进一步搜索\n" "5. 综合信息:将所有搜索结果综合成一个连贯的回答\n" ), ) # 编译工作流 agent = react_agent.compile() ``` ### 4.3 处理用户输入 以下是处理用户输入的示例代码: ```python # 准备初始状态 initial_state = { "messages": [HumanMessage(content=user_input)] } # 流式执行并获取中间状态 for partial_state in react_agent.stream(initial_state, stream_mode="values"): # 处理中间状态 messages = partial_state.get("messages", []) if messages: latest_message = messages[-1] # 记录或显示最新消息 log_agent_actions({"messages": [latest_message]}) # 处理最终结果 final_state = partial_state # 最后一个状态就是最终状态 ``` ## 5. ReactAgent的优势与应用场景 ### 5.1 优势 - **多步推理**:能够分解复杂问题,逐步解决 - **工具调用**:可以集成各种外部工具,扩展能力边界 - **状态管理**:自动管理对话状态和中间结果 - **可视化**:支持工作流可视化,便于调试和理解 - **流式执行**:可以获取中间状态,实现更好的用户体验 ### 5.2 应用场景 - **研究助手**:帮助用户研究复杂问题,获取最新信息 - **数据分析**:分步骤处理数据分析任务 - **决策支持**:通过多步推理和信息收集辅助决策 - **教育辅导**:分解复杂概念,逐步引导学习 ## 6. 实际案例:研究特斯拉2025年发展预期 以下是使用ReactAgent研究特斯拉2025年发展预期的实际案例: 1. **问题分解**:将问题分解为新车型计划、销量目标、技术创新和市场扩张战略 2. **执行搜索**:针对每个子问题执行Tavily搜索 3. **分析结果**:分析每个搜索的结果,提取关键信息 4. **综合信息**:将所有信息整合为一个全面的分析报告 通过这种方式,ReactAgent能够提供比单次查询更全面、更深入的分析结果。 ## 7. 总结 ReactAgent是一个强大的基于ReAct方法论的智能体框架,它通过多步推理和工具调用来解决复杂问题。在实际应用中,ReactAgent特别适合需要分步骤思考、收集信息和综合分析的任务。通过与Tavily等工具的集成,ReactAgent能够获取实时信息,大幅提升其实用价值。 在未来的开发中,我们将继续优化ReactAgent的性能,增强其推理能力,并集成更多实用工具,使其能够应对更广泛的应用场景。 ================================================ FILE: instructions/05.react_agent_user_input.md ================================================ # ReactAgent与用户交互:构建交互式研究助手 ## 1. 引言 本文将介绍如何使用ReactAgent构建一个能够与用户进行交互的研究助手,该助手能够接收用户输入,使用搜索工具获取信息,并提供深入的分析结果。这种交互式助手特别适合需要实时信息和多轮对话的场景。 ## 2. 交互式研究助手的核心概念 ### 2.1 用户输入处理 交互式研究助手需要能够处理用户的自然语言输入,理解用户的意图,并将其转化为可执行的搜索查询或其他操作。这涉及到: 1. **输入解析**:分析用户输入,提取关键信息和查询意图 2. **查询重构**:将用户的自然语言问题转化为更有效的搜索查询 3. **上下文维护**:在多轮对话中保持对话上下文的连贯性 ### 2.2 搜索工具集成 研究助手的核心功能是能够获取和分析信息,这通常通过集成各种搜索工具来实现: 1. **Tavily搜索**:提供高质量的网络搜索结果,支持深度搜索模式 2. **结果处理**:对搜索结果进行过滤、排序和整合,提取最相关的信息 3. **多次搜索策略**:对复杂问题进行分解,执行多次有针对性的搜索 ## 3. 实现交互式研究助手 ### 3.1 基本架构 交互式研究助手的基本架构包括: ``` 用户输入 → ReactAgent → 搜索工具 → 结果分析 → 回复生成 → 用户 ``` 这个流程可以多次循环,形成多轮对话。 ### 3.2 ReactAgent配置 以下是创建交互式研究助手的核心代码: ```python def create_react_agent_instance(): """创建并返回ReactAgent实例""" react_agent = ReactAgent( model=model, tools=[tavily_search], name="research_assistant", # 提示词强调分解问题、多步思考和综合信息 prompt=( "你是一位专业的研究分析师,擅长分析复杂问题并提供深入见解。\n" "你有一个强大的工具'tavily_search_results_json'可以搜索网络获取实时信息。\n\n" "当面对复杂问题时,请遵循以下REACT方法论:\n" "1. 分解问题:将复杂问题分解为更小的子问题\n" "2. 制定计划:确定需要搜索哪些信息,以及搜索的顺序\n" "3. 执行搜索:使用tavily_search_results_json工具执行搜索\n" "4. 分析结果:分析搜索结果,确定是否需要进一步搜索\n" "5. 
综合信息:将所有搜索结果综合成一个连贯的回答\n\n" "重要提示:\n" "- 不要一次性搜索过于宽泛的问题\n" "- 对于复杂问题,进行多次有针对性的搜索\n" "- 每次搜索后评估结果,决定下一步行动\n" "- 在最终回答中引用来源,包括搜索结果中的URL\n" "- 清晰地展示你的思考过程,包括问题分解和计划制定\n" ), ) return react_agent ``` ### 3.3 Tavily搜索工具配置 ```python tavily_search = TavilySearchResults( max_results=3, include_answer=True, include_raw_content=True, # 包含原始内容,便于分析 include_images=False, search_depth="advanced" # 使用高级搜索深度 ) ``` ### 3.4 用户交互循环 用户交互循环的核心是通过`stream`方法获取中间状态,并实时显示Agent的思考过程: ```python def process_user_query(query): # 创建ReactAgent实例 react_agent = create_react_agent_instance() agent = react_agent.compile() # 准备输入 inputs = { "messages": [HumanMessage(content=query)] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in react_agent.stream(inputs, stream_mode="values"): # 保存最终状态 final_state = partial_state # 获取最新消息并记录 messages = partial_state.get("messages", []) if messages: latest_message = messages[-1] log_agent_actions({"messages": [latest_message]}) # 返回最终回答 return final_state ``` ## 4. 最佳实践与优化策略 ### 4.1 提示词优化 提示词对研究助手的性能至关重要,应包含以下要素: 1. **角色定义**:明确助手的专业身份和能力 2. **方法论指导**:提供结构化的问题解决方法 3. **工具使用指南**:说明如何有效使用搜索工具 4. **输出格式要求**:规定回答的结构和引用方式 ### 4.2 搜索策略优化 为提高搜索效率和结果质量,可采用以下策略: 1. **渐进式搜索**:从一般到具体,逐步缩小搜索范围 2. **多角度查询**:使用不同的关键词和表述方式进行搜索 3. **结果验证**:通过交叉检查多个来源验证信息的准确性 4. **深度参数调整**:根据问题复杂度调整搜索深度参数 ### 4.3 用户体验优化 提升用户体验的关键点包括: 1. **透明的思考过程**:展示Agent的推理过程,增强可信度 2. **实时反馈**:通过流式输出提供即时反馈 3. **引用来源**:清晰标注信息来源,便于用户进一步探索 4. **交互式引导**:在复杂问题上引导用户提供更多上下文或澄清问题 ## 5. 应用场景 交互式研究助手适用于多种场景: 1. **学术研究**:帮助研究人员快速获取和分析相关文献 2. **市场分析**:收集和整合市场趋势、竞争对手信息 3. **新闻摘要**:汇总和分析最新新闻事件 4. **技术调研**:探索新技术、框架或工具的特性和评价 5. **教育辅助**:为学生提供学习资料和解答问题 ## 6. 总结 ReactAgent结合用户交互和搜索工具,可以构建功能强大的研究助手,能够处理复杂查询并提供深入分析。通过优化提示词、搜索策略和用户体验,可以进一步提升助手的性能和实用性。未来的发展方向包括集成更多专业数据源、增强多模态能力,以及提供更个性化的信息服务。 ================================================ FILE: instructions/06.web_extraction_tools.md ================================================ # 网页提取工具:FireCrawl与Jina的集成与应用 ## 1. 引言 网页内容提取是智能体系统中的重要能力,它使智能体能够从互联网获取、分析和处理结构化和非结构化的网页内容。本文将详细介绍如何在Mentis框架中集成和使用FireCrawl和Jina两种强大的网页提取工具,以实现高效的网站结构分析和内容提取。 ## 2. 网页提取工具的核心概念 ### 2.1 网页提取的两个关键步骤 高效的网页内容提取通常包含两个关键步骤: 1. **网站结构分析**:了解网站的组织结构、页面之间的链接关系,以及重要页面的位置。 2. **内容提取**:从特定页面中提取有价值的文本、图像或其他结构化信息。 ### 2.2 FireCrawl与Jina的角色分工 在Mentis框架中,我们使用两种工具来分别处理这两个步骤: 1. **FireCrawl**:专注于网站结构分析,能够爬取网站的页面结构和链接关系。 2. **Jina**:专注于内容提取,能够从特定URL获取干净、结构化的内容。 ## 3. FireCrawlTool的实现与使用 ### 3.1 FireCrawlTool的基本结构 FireCrawlTool是对FireCrawl API的封装,提供了网站爬取和内容分析的能力: ```python class FireCrawlTool(BaseTool): """Tool that uses FireCrawl API to crawl or scrape web content.""" name: str = "firecrawl_tool" description: str = ( "A web crawler and scraper that extracts content from websites. " "Useful for when you need to analyze the content of a specific website or webpage. " "Input should be a URL to crawl or scrape." ) args_schema: Type[BaseModel] = FireCrawlInput api_key: Optional[str] = None api_url: Optional[str] = None mode: str = "crawl" params: Dict[str, Any] = Field(default_factory=dict) ``` ### 3.2 FireCrawlTool的配置选项 FireCrawlTool提供了多种配置选项: 1. **mode**:工作模式,可选值包括: - `crawl`:爬取网站结构和链接 - `scrape`:提取特定页面的内容 - `map`:生成网站地图 2. 
**params**:额外参数,常用的包括: - `max_pages`:限制爬取的最大页面数量 - `max_depth`:限制爬取的最大深度 - `follow_links`:是否跟踪页面中的链接 ### 3.3 使用FireCrawlTool爬取网站结构 以下是使用FireCrawlTool爬取网站结构的示例代码: ```python # 创建FireCrawl工具 - 用于网站结构分析 firecrawl_tool = FireCrawlTool( mode="crawl", # 使用爬取模式 params={ "max_pages": 5, # 限制爬取页面数量 } ) # 在Agent中使用该工具 react_agent = create_react_agent( model=model, tools=[firecrawl_tool], name="web_crawler", prompt="你是一位网站结构分析专家..." ) ``` ## 4. JinaSearch的实现与使用 ### 4.1 JinaSearch的基本功能 JinaSearch是LangChain提供的一个工具,能够从网页中提取干净、可读的内容,去除广告、导航栏等干扰元素: ```python from langchain_community.tools import JinaSearch # 创建Jina Reader工具 - 用于内容提取 jina_reader_tool = JinaSearch() ``` ### 4.2 使用JinaSearch提取网页内容 JinaSearch特别适合在确定了目标页面后,提取其中的核心内容: ```python # 在Agent中结合FireCrawl和Jina react_agent = create_react_agent( model=model, tools=[firecrawl_tool, jina_reader_tool], name="web_extraction_expert", prompt="你是一位网页内容分析专家..." ) ``` ## 5. 网页提取的最佳实践 ### 5.1 两阶段提取策略 为了高效地提取网页内容,建议采用两阶段策略: 1. **第一阶段**:使用FireCrawlTool爬取网站结构,了解网站的组织方式和重要页面。 2. **第二阶段**:根据第一阶段的结果,使用JinaSearch有针对性地提取重要页面的内容。 ### 5.2 提示词优化 为了引导Agent正确使用这两个工具,提示词应该明确指出工具的使用顺序和方法: ```python prompt = ( "你是一位专业的网页内容分析专家,擅长提取和分析网站结构与内容。\n" "你有两个强大的工具:\n" "1. 'firecrawl_tool': 用于爬取网站结构和下级页面\n" "2. 'jina_reader_tool': 用于从特定URL提取结构化内容\n\n" "当面对网站分析任务时,请遵循以下方法论:\n" "1. 先使用firecrawl_tool了解网站结构\n" "2. 再使用jina_reader_tool提取关键页面内容\n" "3. 最后整合信息提供分析结果" ) ``` ### 5.3 处理大型网站的策略 对于大型网站,可以采用以下策略: 1. **限制爬取范围**:设置合理的`max_pages`和`max_depth`参数 2. **分批处理**:先获取网站结构,然后每次只处理1-3个重要页面 3. **内容摘要**:对提取的内容进行摘要,减少token消耗 ## 6. 实际应用案例 ### 6.1 分析LangGraph文档网站 以下是使用FireCrawl和Jina分析LangGraph文档网站的示例: ```python # 定义输入 inputs = { "messages": [ {"role": "user", "content": "爬取LangGraph文档网站的每个章节的内容(https://langchain-ai.github.io/langgraph/how-tos/) "} ] } # 使用stream方法逐步获取中间状态 final_state = None for partial_state in react_agent.stream(inputs, stream_mode="values"): # 处理中间状态... pass ``` ### 6.2 结果分析与处理 Agent会首先使用FireCrawl获取网站结构,然后使用Jina提取重要页面的内容,最后整合信息提供分析结果: 1. **网站结构分析**:识别主要章节和子页面 2. **内容提取**:获取每个章节的详细内容 3. **信息整合**:将内容组织成结构化的文档或摘要 ## 7. 总结 FireCrawl和Jina的结合为智能体提供了强大的网页内容提取能力。通过两阶段提取策略,可以高效地分析网站结构并提取有价值的内容。这种能力使智能体能够从互联网获取实时信息,为用户提供更加全面和准确的回答。 未来的发展方向包括增强对JavaScript渲染页面的支持、提高内容提取的准确性,以及集成更多专业领域的内容分析能力。 ================================================ FILE: instructions/07.web_extraction_with_filesystem.md ================================================ # 网页提取与文件系统集成:构建内容采集与存储系统 ## 1. 引言 在智能体系统中,网页内容提取通常需要与文件系统操作相结合,以便将提取的内容持久化存储。本文将详细介绍如何在Mentis框架中集成网页提取工具和文件系统工具,并使用SupervisorAgent协调多个专业智能体,构建一个完整的内容采集与存储系统。 ## 2. 系统架构设计 ### 2.1 三层架构模式 我们采用三层架构设计,包括: 1. **Supervisor层**:负责协调和管理其他智能体,接收用户指令并分配任务 2. **Research层**:负责网页内容提取,包括网站结构分析和内容提取 3. **FileSystem层**:负责文件操作,包括内容保存、读取和目录管理 ### 2.2 智能体角色分工 系统中的三个智能体各自承担不同的职责: 1. **SupervisorAgent**:总协调者,负责理解用户需求,并将任务分配给适当的专业智能体 2. **Research Agent**:网页内容分析专家,负责使用FireCrawl和Jina工具提取网页内容 3. **FileSystem Agent**:文件系统管理专家,负责将提取的内容保存到本地文件系统 ## 3. 
组件实现 ### 3.1 Research Agent实现 Research Agent负责网页内容提取,使用FireCrawl和Jina工具: ```python # 创建FireCrawl工具 - 用于网站结构分析 firecrawl_tool = FireCrawlTool( mode="crawl", # 使用爬取模式 params={ "max_pages": 5, # 限制爬取页面数量 } ) # 创建Jina Reader工具 - 用于内容提取 jina_reader_tool = JinaSearch() # 创建Research Agent research_agent = create_react_agent( model=model, tools=[firecrawl_tool, jina_reader_tool], name="research_agent", prompt=( "你是一位专业的网页内容分析专家,擅长提取和分析网站结构与内容。\n" "你有两个强大的工具...\n" # 提示词内容 ), ) ``` ### 3.2 FileSystem Agent实现 FileSystem Agent负责文件操作,使用LangChain的FileManagementToolkit: ```python # 设置文件系统工具的根目录 output_dir = os.path.join(os.path.dirname(__file__), "output") os.makedirs(output_dir, exist_ok=True) # 创建文件系统工具集 filesystem_toolkit = FileManagementToolkit( root_dir=output_dir, selected_tools=["write_file", "read_file", "list_directory"] ) # 获取文件系统工具 filesystem_tools = filesystem_toolkit.get_tools() # 创建FileSystem Agent filesystem_agent = create_react_agent( model=model, tools=filesystem_tools, name="filesystem_agent", prompt=( "你是一位专业的文件系统管理专家,负责将网页内容保存到本地文件系统。\n" "你有以下工具可以使用...\n" # 提示词内容 ), ) ``` ### 3.3 SupervisorAgent实现 SupervisorAgent负责协调Research Agent和FileSystem Agent: ```python # 创建Supervisor Agent supervisor = SupervisorAgent( agents=[research_agent, filesystem_agent], model=model, prompt=( "你是一个智能助手的总协调者,负责管理两个专业智能体:\n" "1) research_agent: 网页内容分析专家,可以爬取和分析网站内容\n" "2) filesystem_agent: 文件系统管理专家,可以将内容保存到本地文件系统\n\n" # 提示词内容 ), ) # 创建内存存储器用于保存对话状态 memory_saver = MemorySaver() # 编译得到一个可调用的"App",添加checkpointer实现记忆功能 app = supervisor.compile(checkpointer=memory_saver) ``` ## 4. 工作流程 ### 4.1 基本工作流程 系统的基本工作流程如下: 1. **用户请求**:用户提出网页内容提取和保存的请求 2. **Supervisor分析**:SupervisorAgent分析用户请求,确定需要调用哪个专业智能体 3. **内容提取**:如果需要提取网页内容,SupervisorAgent调用Research Agent 4. **内容保存**:如果需要保存内容,SupervisorAgent将Research Agent的结果传递给FileSystem Agent 5. **结果返回**:SupervisorAgent将最终结果返回给用户 ### 4.2 上下文管理策略 为了有效管理上下文长度,系统采用以下策略: 1. **分批处理**:对于大型网站,采用分批处理策略,每次只处理少量页面 2. **内容摘要**:对于大型内容,进行摘要处理,减少传递的token数量 3. **先保存再处理**:对于多页面内容,采用先保存再处理的策略,减轻上下文负担 ## 5. 提示词设计 ### 5.1 SupervisorAgent提示词 SupervisorAgent的提示词强调任务分配和协调: ``` 你是一个智能助手的总协调者,负责管理两个专业智能体: 1) research_agent: 网页内容分析专家,可以爬取和分析网站内容 2) filesystem_agent: 文件系统管理专家,可以将内容保存到本地文件系统 你的工作流程如下: 1. 分析用户请求,确定是需要网页内容提取还是文件操作,或两者都需要 2. 如果需要网页内容提取,调用research_agent获取网页内容 3. 如果需要将提取的内容保存到文件,调用filesystem_agent进行保存 4. 如果用户同时需要提取内容并保存,先调用research_agent获取内容,再调用filesystem_agent保存内容 重要规则: - 不要在一个消息中同时调用多个智能体,必须一步一步来 - 当调用filesystem_agent保存内容时,必须提供完整的内容和建议的文件名 - 确保在最终回复中告知用户内容已成功提取和/或保存 ``` ### 5.2 Research Agent提示词 Research Agent的提示词强调网页内容提取的方法论: ``` 你是一位专业的网页内容分析专家,擅长提取和分析网站结构与内容。 你有两个强大的工具: 1. 'firecrawl_tool': 用于爬取网站结构和下级页面 2. 'jina_reader_tool': 用于从特定URL提取结构化内容,获取干净可读的内容 当面对网站分析任务时,请遵循以下方法论: 1. 分析任务: 明确需要从网站获取什么信息 2. 网站结构分析: 使用firecrawl_tool爬取网站结构,了解可用页面 3. 内容提取: 根据网站结构,使用jina_reader_tool从关键页面提取内容 4. 信息整合: 将提取的内容整合成有条理的分析结果 ``` ### 5.3 FileSystem Agent提示词 FileSystem Agent的提示词强调文件操作和内容保存: ``` 你是一位专业的文件系统管理专家,负责将网页内容保存到本地文件系统。 你有以下工具可以使用: 1. 'write_file': 用于将内容写入文件 2. 'read_file': 用于读取文件内容 3. 'list_directory': 用于列出目录内容 当接收到保存内容的请求时,请遵循以下方法论: 1. 分析内容: 确定内容的类型和结构 2. 确定文件名: 根据内容类型和来源创建合适的文件名 3. 保存内容: 使用write_file工具将内容保存到文件中 4. 验证保存: 使用read_file或list_directory工具验证内容已正确保存 ``` ## 6. 记忆功能实现 ### 6.1 使用MemorySaver实现记忆 系统使用LangGraph的MemorySaver实现对话状态的持久化: ```python # 创建内存存储器用于保存对话状态 memory_saver = MemorySaver() # 编译得到一个可调用的"App",添加checkpointer实现记忆功能 app = supervisor.compile(checkpointer=memory_saver) ``` ### 6.2 记忆功能的应用场景 记忆功能在以下场景中特别有用: 1. **多轮对话**:在多轮对话中保持上下文连贯性 2. **长时间任务**:对于需要长时间处理的任务,可以保存中间状态 3. 
**断点续传**:支持任务的暂停和恢复 ## 7. 应用案例 ### 7.1 提取并保存LangGraph文档 以下是一个完整的应用案例,提取并保存LangGraph文档: ```python # 用户请求 inputs = { "messages": [ HumanMessage(content="请爬取LangGraph文档网站(https://langchain-ai.github.io/langgraph/how-tos/)的内容,并保存为Markdown文件") ] } # 执行工作流 final_state = None for partial_state in app.stream(inputs, stream_mode="values"): # 处理中间状态... final_state = partial_state # 记录状态 log_agent_actions(partial_state) # 最终结果 print("\n最终结果:") if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) ``` ## 8. 总结 网页提取与文件系统集成是构建完整内容采集系统的关键。通过SupervisorAgent协调Research Agent和FileSystem Agent,我们可以实现网页内容的提取、分析和持久化存储。这种多智能体协作模式不仅提高了系统的模块化程度,也使得每个智能体可以专注于自己的专业领域,从而提高整体系统的效率和质量。 未来的发展方向包括增强对复杂网站的处理能力、支持更多文件格式的存储和处理,以及集成数据库存储以支持更大规模的内容管理。 ================================================ FILE: instructions/08.react_agent_tool_registry.md ================================================ # 工具注册机制与ReactAgent集成:构建可扩展的智能体系统 ## 1. 引言 工具注册机制是构建可扩展智能体系统的关键组件,它允许我们以统一的方式管理和使用各种工具,并将这些工具与ReactAgent集成。本文将详细介绍Mentis框架中的工具注册机制,包括工具注册、分类管理以及与ReactAgent的集成方式。 ## 2. 工具注册机制的核心概念 ### 2.1 工具注册的意义 工具注册机制提供了以下优势: 1. **统一管理**:集中管理所有可用工具,避免重复创建和配置 2. **分类组织**:按功能和用途对工具进行分类,便于查找和使用 3. **动态加载**:支持动态注册和加载工具,提高系统的灵活性 4. **简化集成**:简化工具与Agent的集成过程,只需从注册表中获取工具列表 ### 2.2 工具分类体系 在Mentis框架中,我们使用`ToolCategory`枚举定义了工具的分类体系: ```python class ToolCategory(Enum): SEARCH = "Search" CODE_INTERPRETER = "Code Interpreter" WEB_BROWSING = "Web Browsing" DATABASE = "Database" FILE_SYSTEM = "FileSystem" OTHER = "Other" ``` 这种分类体系使我们能够根据任务需求选择特定类别的工具,提高工具使用的针对性和效率。 ## 3. 工具注册机制的实现 ### 3.1 全局工具注册表 工具注册机制的核心是一个全局工具注册表,它是一个字典,用于存储所有已注册的工具及其分类信息: ```python # 全局工具注册表 _registered_tools = {} ``` ### 3.2 工具注册函数 `register_tool`函数用于将工具注册到全局注册表中: ```python def register_tool(tool: Tool, category: ToolCategory) -> None: """注册一个工具到全局字典中,带有分类信息""" if tool.name in _registered_tools: raise ValueError(f"工具名 {tool.name} 已存在,请确保工具名唯一") _registered_tools[tool.name] = { "tool": tool, "category": category } ``` ### 3.3 工具获取函数 框架提供了多种函数来获取已注册的工具: ```python def get_registered_tools(as_dict: bool = False) -> Union[List[Tool], Dict[str, Dict]]: """返回所有已注册的工具""" if as_dict: return _registered_tools return [info["tool"] for info in _registered_tools.values()] def get_tools_by_category(category: ToolCategory, return_instances: bool = True) -> List[Union[str, Tool]]: """返回指定分类的工具列表""" if return_instances: return [info["tool"] for name, info in _registered_tools.items() if info["category"] == category] return [name for name, info in _registered_tools.items() if info["category"] == category] ``` ## 4. 
简化工具注册的辅助函数

### 4.1 直接注册工具的函数

为了简化工具注册过程,框架提供了`register_direct_tool`函数,它可以根据工具类名自动判断工具类别:

```python
def register_direct_tool(tool_instance: BaseTool, category: ToolCategory = None) -> None:
    """注册直接从langchain_community.tools导入的工具"""
    if not category:
        # 获取工具类名
        tool_class_name = tool_instance.__class__.__name__
        # 根据工具类名自动判断类别
        category = tool_category_mapping.get(tool_class_name, tool_category_mapping["default"])
    # 注册工具
    register_tool(tool_instance, category)
    print(f"已注册工具: {tool_instance.name} (类别: {category.value})")
```

### 4.2 自动注册自定义工具

框架还支持自动扫描和注册自定义工具。在`__init__.py`中,我们使用以下代码自动注册自定义工具:

```python
# 遍历目录中的所有文件,注册自定义工具
for filename in os.listdir(tools_dir):
    # 只处理 .py 文件,且排除 __init__.py 和 registry.py
    if filename.endswith('.py') and filename not in ['__init__.py', 'registry.py']:
        # 提取模块名(去掉 .py 后缀)
        module_name = filename[:-3]
        try:
            # 动态导入模块
            module = importlib.import_module(f'.{module_name}', package='core.tools')
            # 查找模块中的工具类(继承自BaseTool的类)
            for name, obj in inspect.getmembers(module):
                # 检查是否是类且是BaseTool的子类
                if inspect.isclass(obj) and issubclass(obj, BaseTool) and obj != BaseTool:
                    # 检查该类是否已经被实例化并注册
                    tool_name = getattr(obj, 'name', None)
                    if tool_name and tool_name not in [
                        info['tool'].name
                        for info in get_registered_tools(as_dict=True).values()
                    ]:
                        # 确定工具类别
                        category = getattr(module, 'category', ToolCategory.OTHER)
                        # 实例化并注册工具
                        try:
                            tool_instance = obj()
                            register_tool(tool_instance, category)
                            print(f"已注册工具类: {name} (工具名: {tool_instance.name}, 类别: {category.value})")
                        except Exception as e:
                            print(f"实例化工具类 {name} 时出错: {e}")
        except Exception as e:
            print(f"导入 {module_name} 时出错: {e}")
```

这段代码会自动扫描`core/tools`目录中的所有Python文件,查找继承自`BaseTool`的类,并自动实例化和注册这些工具。

## 5. 与ReactAgent的集成

### 5.1 从注册表获取工具列表

在创建ReactAgent实例时,我们可以从注册表中获取工具列表:

```python
# 从注册表中获取工具列表
tools_list = [info["tool"] for info in registered_tools.values()]

# 创建ReactAgent实例
react_agent = ReactAgent(
    model=model,
    tools=tools_list,
    name="fed_research_agent",
    prompt=(
        "你是一位专业的经济研究分析师,擅长分析复杂的经济问题并提供深入见解。\n"
        "你有多个强大的工具可以搜索网络获取实时信息:\n"
        "- jina_search: 用于进行网络搜索获取最新信息\n"
        "- wikipedia_query_run: 用于查询维基百科获取基础知识\n"
        "- firecrawl_tool: 用于抓取和分析特定网页内容\n\n"
        # 提示词内容
    ),
)
```

### 5.2 按类别选择工具

在某些场景下,我们可能只需要特定类别的工具。这时,可以使用`get_tools_by_category`函数:

```python
# 获取所有搜索类工具
search_tools = get_tools_by_category(ToolCategory.SEARCH)

# 创建专注于搜索的ReactAgent
search_agent = ReactAgent(
    model=model,
    tools=search_tools,
    name="search_agent",
    prompt="你是一位专业的信息搜索专家..."
)
```

## 6. 实际应用案例

### 6.1 美联储研究任务

以下是一个完整的应用案例,使用工具注册机制和ReactAgent进行美联储研究:

```python
# 注册搜索工具
jina_search = JinaSearch()
wiki_tool = WikipediaQueryRun(api_wrapper=WikipediaAPIWrapper())

# 使用register_direct_tool函数注册工具
register_direct_tool(jina_search)
register_direct_tool(wiki_tool)
# 注意:FireCrawlTool已经在core/tools/__init__.py中被注册,这里不需要再次注册

# 获取所有已注册的工具(以字典格式)
registered_tools = get_registered_tools(as_dict=True)

# 从注册表中获取工具列表
tools_list = [info["tool"] for info in registered_tools.values()]

# 创建ReactAgent实例
react_agent = ReactAgent(
    model=model,
    tools=tools_list,
    name="fed_research_agent",
    prompt=(
        "你是一位专业的经济研究分析师,擅长分析复杂的经济问题并提供深入见解。\n"
        # 提示词内容
    ),
)

# 编译Agent
agent = react_agent.compile()

# 定义输入
inputs = {
    "messages": [
        HumanMessage(content="请提供美联储(Federal Reserve)的详细介绍,包括其历史、结构、职能,以及它如何通过货币政策影响全球经济。")
    ]
}

# 执行Agent
final_state = None
for partial_state in react_agent.stream(inputs, stream_mode="values"):
    # 处理中间状态...
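    # Illustrative sketch: print the newest message at each step, and keep the
    # latest state so the report-saving code in the next section can read
    # `final_state` (which is initialized to None above).
    messages = partial_state.get("messages", [])
    if messages:
        messages[-1].pretty_print()
    final_state = partial_state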
pass ``` ### 6.2 结果保存 执行完成后,我们可以将结果保存到文件: ```python # 打印最终回答 if final_state and final_state.get("messages"): for message in final_state["messages"]: if isinstance(message, AIMessage) and not message.tool_calls: print(message.content) # 将结果保存到文件 output_dir = os.path.join(os.path.dirname(__file__), "output") os.makedirs(output_dir, exist_ok=True) output_file = os.path.join(output_dir, "fed_research_report.md") with open(output_file, "w", encoding="utf-8") as f: f.write("# 美联储研究报告\n\n") f.write(message.content) print(f"\n研究报告已保存到: {output_file}") ``` ## 7. 最佳实践 ### 7.1 工具命名规范 为了避免工具名冲突,建议遵循以下命名规范: 1. 使用有意义的名称,反映工具的功能 2. 对于同一类别的工具,使用统一的前缀或后缀 3. 避免使用过于通用的名称,如`search`、`get`等 ### 7.2 工具分类策略 合理的工具分类策略可以提高工具使用的效率: 1. 根据工具的主要功能进行分类,而不是实现方式 2. 对于多功能工具,根据其主要功能进行分类 3. 只有在无法确定主要功能时,才将工具归类为`OTHER` ### 7.3 提示词优化 在提示词中明确说明可用工具及其用途,可以提高Agent的工具使用效率: ``` 你是一位专业的经济研究分析师,擅长分析复杂的经济问题并提供深入见解。 你有多个强大的工具可以搜索网络获取实时信息: - jina_search: 用于进行网络搜索获取最新信息 - wikipedia_query_run: 用于查询维基百科获取基础知识 - firecrawl_tool: 用于抓取和分析特定网页内容 当面对复杂问题时,请遵循以下方法论: 1. 分解问题:将复杂问题分解为更小的子问题 2. 制定计划:确定需要搜索哪些信息,以及使用哪些工具 3. 执行搜索:使用适当的工具执行搜索 4. 分析结果:分析搜索结果,确定是否需要进一步搜索 5. 综合信息:将所有搜索结果综合成一个连贯的回答 ``` ## 8. 总结 工具注册机制为Mentis框架提供了强大的可扩展性,使得智能体系统能够轻松集成各种工具,并根据任务需求灵活选择合适的工具组合。通过分类管理和自动注册,工具注册机制简化了工具的管理和使用流程,提高了开发效率。 结合ReactAgent,工具注册机制使得智能体能够访问丰富的外部功能,从而处理更复杂的任务。未来的发展方向包括支持更多类型的工具、增强工具的自动发现和选择能力,以及提供更细粒度的工具权限控制。 ================================================ FILE: instructions/09.e2b_sandbox_integration.md ================================================ # E2B沙箱环境与智能代理集成指南 ## 1. 引言 E2B沙箱环境是一个强大的代码执行工具,它提供了安全、隔离的环境来运行Python代码和Shell命令。将E2B沙箱与智能代理(如ReactAgent)集成,可以显著增强代理的能力,使其能够执行代码、处理数据、创建可视化,甚至与文件系统交互。本文将详细介绍E2B沙箱的核心概念、工作原理、实现方式以及在智能代理系统中的应用。 ## 2. E2B沙箱环境的核心概念 ### 2.1 什么是E2B沙箱 E2B(Execution Environment for Bots)是一个专为AI代理设计的代码执行环境,它提供以下核心功能: 1. **安全隔离**:在隔离的容器中执行代码,防止恶意代码影响宿主系统 2. **多语言支持**:主要支持Python,同时可通过Shell命令执行其他语言代码 3. **文件系统操作**:允许创建、读取、写入和管理文件 4. **包管理**:支持安装和使用第三方Python库 5. **持久化**:可以在会话之间保持状态和文件 ### 2.2 E2B沙箱与代码解释器的关系 E2B沙箱是一种特殊的代码解释器实现,它不仅能执行代码,还提供了完整的操作系统环境(基于Debian)。这使得它比简单的代码解释器功能更强大,能够: - 执行系统命令 - 管理文件和目录 - 安装和使用各种软件包 - 运行网络服务 - 处理复杂的数据分析和可视化任务 ## 3. E2B沙箱的实现 ### 3.1 E2BCodeInterpreterTool类的设计 在我们的实现中,`E2BCodeInterpreterTool`类继承自LangChain的`BaseTool`,提供了与E2B沙箱交互的接口: ```python class E2BCodeInterpreterTool(BaseTool): """使用E2B SDK执行Python代码的工具 该工具创建一个安全的沙箱环境,用于执行Python代码,并返回执行结果、 标准输出、标准错误和任何错误信息。 """ name: str = "e2b_code_interpreter" description: str = ( "在安全的 Debian 基础沙箱环境中执行 Python 代码或 shell 命令,并返回结果。" "适用于数据分析、可视化、复杂计算以及系统操作。" "输入应为有效的 Python 代码字符串,或以 '!' 开头的 shell 命令。" "常见 Python 库(如 numpy、pandas 和 matplotlib)已预装,若需其他库,可通过 pip 安装。" "沙箱环境充分利用 Debian 系统的强大功能,支持广泛的操作。" ) ``` ### 3.2 核心方法 `E2BCodeInterpreterTool`类提供了以下核心方法: 1. **_initialize_sandbox()**: 初始化沙箱环境 2. **_run()**: 在沙箱中执行代码并返回结果 3. **close()**: 关闭沙箱并释放资源 4. **format_to_tool_message()**: 将执行结果格式化为工具消息 ### 3.3 沙箱初始化与资源管理 沙箱初始化过程包括: 1. 检查是否安装了`e2b_code_interpreter`包 2. 验证是否设置了`E2B_API_KEY`环境变量 3. 创建`Sandbox`实例 4. 设置沙箱状态标志 资源管理方面,工具提供了`close()`方法来释放沙箱资源: ```python def close(self): """关闭沙箱,释放资源""" if hasattr(self, "sandbox") and self._is_available and self.sandbox is not None: try: print("正在关闭E2B沙箱并释放资源...") self.sandbox.kill() print("E2B沙箱已成功关闭") except Exception as e: print(f"关闭E2B沙箱时出错: {str(e)}") ``` ## 4. 将E2B沙箱与ReactAgent集成 ### 4.1 基本集成流程 将E2B沙箱与ReactAgent集成的基本流程如下: 1. **注册E2B工具**:将`E2BCodeInterpreterTool`注册到工具注册表中 2. **创建ReactAgent**:使用包含E2B工具的工具列表初始化ReactAgent 3. **设计提示词**:编写强调代码执行能力的提示词 4. 
**执行工作流**:让Agent使用E2B工具执行代码并处理结果 ### 4.2 代码示例 以下是一个基本的集成示例: ```python # 导入必要的库 from core.agents.react_agent import ReactAgent from core.tools.registry import get_tools_by_category, ToolCategory from langchain_openai import ChatOpenAI # 获取代码解释器工具 tools_list = get_tools_by_category(ToolCategory.CODE_INTERPRETER) # 创建ReactAgent实例 react_agent = ReactAgent( model=ChatOpenAI(model="gpt-4o-mini"), tools=tools_list, prompt=( "你是一位专业的数据分析师,可以使用Python代码解决问题。\n" "你有强大的代码执行工具可以使用:\n" "- e2b_code_interpreter: 用于执行Python代码和shell命令\n" ), ) # 编译Agent agent = react_agent.compile() # 执行任务 result = agent.invoke({"messages": [HumanMessage(content="分析以下数据并创建可视化...")]}) ``` ## 5. E2B沙箱的高级功能 ### 5.1 文件系统操作 E2B沙箱提供了完整的文件系统操作能力,可以: - 创建和管理目录结构 - 读写文本和二进制文件 - 列出目录内容 - 移动和删除文件 示例代码: ```python # 在沙箱中创建目录和文件 code = """ # 创建目录 import os os.makedirs('test_dir/subdir', exist_ok=True) # 创建并写入文件 with open('test_dir/example.txt', 'w') as f: f.write('Hello from E2B sandbox!') # 列出目录内容 print(os.listdir('test_dir')) # 读取文件内容 with open('test_dir/example.txt', 'r') as f: content = f.read() print(f'文件内容: {content}') """ # 执行代码 result = e2b_tool.invoke({"code": code}) ``` ### 5.2 包管理 E2B沙箱允许安装和使用第三方Python库: ```python # 安装并使用第三方库 code = """ # 安装pandas库 !pip install pandas matplotlib # 使用pandas进行数据分析 import pandas as pd import matplotlib.pyplot as plt # 创建示例数据 data = {'Category': ['A', 'B', 'C', 'D'], 'Values': [10, 25, 15, 30]} df = pd.DataFrame(data) # 打印数据 print(df) # 创建可视化 plt.figure(figsize=(8, 4)) plt.bar(df['Category'], df['Values']) plt.title('Sample Bar Chart') plt.savefig('chart.png') print('图表已保存为chart.png') """ # 执行代码 result = e2b_tool.invoke({"code": code}) ``` ### 5.3 从沙箱下载文件 可以将沙箱中生成的文件下载到本地系统: ```python def download_file_from_sandbox(sandbox, sandbox_path, local_path): """从沙箱下载文件到本地""" try: # 从沙箱读取文件内容 content = sandbox.files.read(sandbox_path) # 确保目标目录存在 os.makedirs(os.path.dirname(local_path), exist_ok=True) # 写入本地文件 with open(local_path, 'w', encoding='utf-8') as file: file.write(content) print(f"文件已从沙箱下载到本地: {local_path}") return True except Exception as e: print(f"从沙箱下载文件时出错: {str(e)}") return False ``` ## 6. 实际应用案例 ### 6.1 数据分析与可视化 E2B沙箱特别适合数据分析和可视化任务,可以: - 加载和处理各种格式的数据(CSV、JSON、Excel等) - 使用pandas进行数据清洗和转换 - 使用matplotlib、seaborn等创建可视化 - 生成分析报告 ### 6.2 文件处理与转换 E2B沙箱可以处理各种文件格式的转换和处理: - 文本文件处理(如日志分析) - 图像处理和转换 - 数据格式转换(如CSV到JSON) - 文档生成(如生成HTML或PDF报告) ### 6.3 Web爬虫与API调用 E2B沙箱可以执行网络相关任务: - 使用requests或BeautifulSoup进行网页爬取 - 调用各种API并处理响应 - 下载和处理网络资源 ## 7. 最佳实践与注意事项 ### 7.1 安全考虑 虽然E2B沙箱提供了隔离环境,但在使用时仍需注意: - 不要在沙箱中处理敏感数据 - 避免执行未经验证的用户输入代码 - 限制沙箱的网络访问权限 - 定期关闭和重新创建沙箱实例 ### 7.2 资源管理 E2B沙箱会消耗系统资源,因此: - 在不需要时关闭沙箱(使用`close()`方法) - 避免在单个沙箱中运行过多或过大的任务 - 监控沙箱的内存和CPU使用情况 ### 7.3 错误处理 在与E2B沙箱交互时,应当实施健壮的错误处理: - 捕获并处理代码执行异常 - 验证沙箱初始化是否成功 - 提供有意义的错误消息给用户 - 实现重试机制处理临时故障 ## 8. 总结 E2B沙箱为智能代理提供了强大的代码执行能力,使其能够处理各种复杂任务。通过将E2B沙箱与ReactAgent集成,我们可以创建能够执行代码、处理数据、创建可视化,甚至与文件系统交互的智能系统。 正确使用E2B沙箱需要理解其核心概念、实现方式和最佳实践。通过本文的指导,开发者应能够有效地将E2B沙箱集成到自己的智能代理系统中,并充分利用其强大功能。 ## 9. 
参考资源 - [E2B官方文档](https://e2b.dev/docs) - [E2B Code Interpreter SDK](https://github.com/e2b-dev/code-interpreter) - [LangChain工具集成指南](https://python.langchain.com/docs/integrations/tools) - [ReactAgent文档](https://python.langchain.com/docs/modules/agents/agent_types/react) ================================================ FILE: log_analyzer.py ================================================ import re import sys import argparse from collections import defaultdict import json def parse_log_file(file_path): """Parse the execution log file and extract agent interactions.""" with open(file_path, 'r', encoding='utf-8') as f: content = f.read() # Extract different sections of the log sections = content.split("================================ Human Message =================================") if len(sections) > 1: main_content = sections[1] # Skip header else: main_content = content # Extract messages messages = [] # Pattern for AI messages ai_pattern = r"================================== Ai Message ==================================\nName: (\w+)\n\n(.*?)(?=(==================================|$))" ai_matches = re.finditer(ai_pattern, main_content, re.DOTALL) for match in ai_matches: agent_name = match.group(1) message_content = match.group(2).strip() # Check if message has tool calls tool_calls = [] tool_call_pattern = r"Tool Calls:\n(.*?)(?=\n==================================|$)" tool_call_match = re.search(tool_call_pattern, message_content, re.DOTALL) if tool_call_match: # Extract tool calls tool_calls_text = tool_call_match.group(1) tool_call_entries = re.findall(r" (\w+) \(([^)]+)\)", tool_calls_text) tool_calls = [{"name": name, "id": call_id} for name, call_id in tool_call_entries] # Remove tool calls from the message content message_content = re.sub(r"Tool Calls:.*?(?=\n==================================|$)", "", message_content, flags=re.DOTALL).strip() messages.append({ "role": "agent", "agent": agent_name, "content": message_content, "tool_calls": tool_calls }) # Pattern for Tool messages tool_pattern = r"================================= Tool Message =================================\nName: (\w+)\n\n(.*?)(?=(==================================|$))" tool_matches = re.finditer(tool_pattern, main_content, re.DOTALL) for match in tool_matches: tool_name = match.group(1) tool_content = match.group(2).strip() messages.append({ "role": "tool", "tool": tool_name, "content": tool_content }) # Sort messages by their position in the log messages.sort(key=lambda x: main_content.find(x["content"])) return messages def analyze_agent_interactions(messages): """Analyze the interactions between agents.""" interactions = [] current_sender = None tool_call_map = {} for i, msg in enumerate(messages): if msg["role"] == "agent": current_sender = msg["agent"] # Check if this agent is using tool calls for tool_call in msg.get("tool_calls", []): tool_name = tool_call["name"] tool_id = tool_call["id"] tool_call_map[tool_id] = { "sender": current_sender, "tool": tool_name } interactions.append({ "step": i, "from": current_sender, "to": f"SYSTEM ({tool_name})", "action": f"Called tool {tool_name}", "content": f"Tool call ID: {tool_id}" }) elif msg["role"] == "tool": # Find which agent invoked this tool for prev_msg in reversed(messages[:i]): if prev_msg["role"] == "agent" and any(tc["name"] == msg["tool"] for tc in prev_msg.get("tool_calls", [])): sender = prev_msg["agent"] break else: sender = "SYSTEM" interactions.append({ "step": i, "from": f"SYSTEM ({msg['tool']})", "to": sender, "action": f"Tool response", 
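                # route the tool's output back to the agent matched above
                # (falls back to "SYSTEM" when no caller was found)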
"content": msg["content"] }) return interactions def visualize_interactions(interactions): """Visualize the interactions between agents.""" print("\n" + "="*100) print(" "*40 + "AGENT INTERACTIONS SUMMARY") print("="*100 + "\n") for idx, interaction in enumerate(interactions): print(f"[{idx+1}] {interaction['from']} → {interaction['to']}") print(f" Action: {interaction['action']}") content = interaction['content'] if len(content) > 100: content = content[:97] + "..." print(f" Content: {content}\n") def visualize_conversation_flow(messages): """Visualize the conversation flow between agents.""" print("\n" + "="*100) print(" "*40 + "CONVERSATION FLOW") print("="*100 + "\n") for idx, message in enumerate(messages): if message["role"] == "agent": agent_name = message["agent"] print(f"[{idx+1}] Agent: {agent_name}") content = message["content"] if len(content) > 150: content = content[:147] + "..." print(f" Content: {content}") if message.get("tool_calls"): tools = ", ".join([tc["name"] for tc in message["tool_calls"]]) print(f" Tools Called: {tools}") else: print(f"[{idx+1}] Tool: {message['tool']}") content = message["content"] if len(content) > 100: content = content[:97] + "..." print(f" Response: {content}") print() def main(): parser = argparse.ArgumentParser(description='Analyze Mentis execution logs.') parser.add_argument('log_file', help='Path to the log file') parser.add_argument('--format', choices=['interactions', 'flow', 'all'], default='all', help='Output format: interactions, flow, or all') args = parser.parse_args() try: messages = parse_log_file(args.log_file) interactions = analyze_agent_interactions(messages) if args.format in ['interactions', 'all']: visualize_interactions(interactions) if args.format in ['flow', 'all']: visualize_conversation_flow(messages) except Exception as e: print(f"Error: {e}") sys.exit(1) if __name__ == "__main__": main() ================================================ FILE: pyproject.toml ================================================ [build-system] requires = ["setuptools>=42", "wheel"] build-backend = "setuptools.build_meta" readme = "README.md" requires-python = ">=3.11" [project] name = "mentis" version = "0.1.0" description = "A Multi-Agents project based on langgraph" requires-python = ">=3.11" dependencies = [ "dotenv>=0.9.9", "langchain-community>=0.3.19", "langchain-core>=0.3.45", "langchain-openai>=0.3.8", "langgraph>=0.3.11", "pydantic>=2.10.6", "typing-extensions>=4.12.2", "python-dotenv>=1.0.0", "firecrawl-py", "wikipedia>=1.4.0", "serpapi>=0.1.5", "google-search-results>=2.4.2", "duckduckgo-search>=7.5.2", "arxiv>=2.1.3", "rizaio>=0.9.0", "e2b-code-interpreter>=1.1.0", "fastapi>=0.115.11", "uvicorn>=0.34.0", "sse-starlette>=2.2.1", "exa-py>=1.9.1", "tavily-python>=0.5.1", "replicate>=1.0.4", "langchain-mcp-adapters>=0.0.7", "mcp>=1.6.0", "playwright>=1.51.0", "pillow>=11.2.1", "yfinance>=0.2.55", ] [tool.setuptools] packages = ["core"] ================================================ FILE: requirements.txt ================================================ # This file was autogenerated by uv via the following command: # uv pip compile pyproject.toml -o requirements.txt aiohappyeyeballs==2.6.1 # via aiohttp aiohttp==3.11.14 # via langchain-community aiosignal==1.3.2 # via aiohttp annotated-types==0.7.0 # via pydantic anyio==4.9.0 # via # httpx # openai # rizaio arxiv==2.1.3 # via mentis (pyproject.toml) attrs==25.3.0 # via # aiohttp # e2b # e2b-code-interpreter beautifulsoup4==4.13.3 # via wikipedia certifi==2025.1.31 # via # httpcore 
# httpx # requests charset-normalizer==3.4.1 # via requests click==8.1.8 # via duckduckgo-search dataclasses-json==0.6.7 # via langchain-community distro==1.9.0 # via # openai # rizaio dotenv==0.9.9 # via mentis (pyproject.toml) duckduckgo-search==7.5.2 # via mentis (pyproject.toml) e2b==1.1.0 # via e2b-code-interpreter e2b-code-interpreter==1.1.0 # via mentis (pyproject.toml) feedparser==6.0.11 # via arxiv firecrawl-py==1.14.1 # via mentis (pyproject.toml) frozenlist==1.5.0 # via # aiohttp # aiosignal google-search-results==2.4.2 # via mentis (pyproject.toml) greenlet==3.1.1 # via sqlalchemy h11==0.14.0 # via httpcore httpcore==1.0.7 # via # e2b # httpx httpx==0.28.1 # via # e2b # e2b-code-interpreter # langgraph-sdk # langsmith # openai # rizaio httpx-sse==0.4.0 # via langchain-community idna==3.10 # via # anyio # httpx # requests # yarl jiter==0.9.0 # via openai jsonpatch==1.33 # via langchain-core jsonpointer==3.0.0 # via jsonpatch langchain==0.3.20 # via langchain-community langchain-community==0.3.19 # via mentis (pyproject.toml) langchain-core==0.3.45 # via # mentis (pyproject.toml) # langchain # langchain-community # langchain-openai # langchain-text-splitters # langgraph # langgraph-checkpoint # langgraph-prebuilt langchain-openai==0.3.9 # via mentis (pyproject.toml) langchain-text-splitters==0.3.6 # via langchain langgraph==0.3.11 # via mentis (pyproject.toml) langgraph-checkpoint==2.0.20 # via # langgraph # langgraph-prebuilt langgraph-prebuilt==0.1.3 # via langgraph langgraph-sdk==0.1.57 # via langgraph langsmith==0.3.15 # via # langchain # langchain-community # langchain-core lxml==5.3.1 # via duckduckgo-search marshmallow==3.26.1 # via dataclasses-json msgpack==1.1.0 # via langgraph-checkpoint multidict==6.2.0 # via # aiohttp # yarl mypy-extensions==1.0.0 # via typing-inspect nest-asyncio==1.6.0 # via firecrawl-py numpy==2.2.4 # via langchain-community openai==1.66.3 # via langchain-openai orjson==3.10.15 # via # langgraph-sdk # langsmith packaging==24.2 # via # e2b # langchain-core # langsmith # marshmallow primp==0.14.0 # via duckduckgo-search propcache==0.3.0 # via # aiohttp # yarl protobuf==5.29.3 # via e2b pydantic==2.10.6 # via # mentis (pyproject.toml) # firecrawl-py # langchain # langchain-core # langsmith # openai # pydantic-settings # rizaio pydantic-core==2.27.2 # via pydantic pydantic-settings==2.8.1 # via langchain-community python-dateutil==2.9.0.post0 # via e2b python-dotenv==1.0.1 # via # mentis (pyproject.toml) # dotenv # firecrawl-py # pydantic-settings pyyaml==6.0.2 # via # langchain # langchain-community # langchain-core regex==2024.11.6 # via tiktoken requests==2.32.3 # via # arxiv # firecrawl-py # google-search-results # langchain # langchain-community # langsmith # requests-toolbelt # serpapi # tiktoken # wikipedia requests-toolbelt==1.0.0 # via langsmith rizaio==0.9.0 # via mentis (pyproject.toml) serpapi==0.1.5 # via mentis (pyproject.toml) sgmllib3k==1.0.0 # via feedparser six==1.17.0 # via python-dateutil sniffio==1.3.1 # via # anyio # openai # rizaio soupsieve==2.6 # via beautifulsoup4 sqlalchemy==2.0.39 # via # langchain # langchain-community tenacity==9.0.0 # via # langchain-community # langchain-core tiktoken==0.9.0 # via langchain-openai tqdm==4.67.1 # via openai typing-extensions==4.12.2 # via # mentis (pyproject.toml) # anyio # beautifulsoup4 # e2b # langchain-core # openai # pydantic # pydantic-core # rizaio # sqlalchemy # typing-inspect typing-inspect==0.9.0 # via dataclasses-json urllib3==2.3.0 # via requests websockets==15.0.1 # via 
firecrawl-py wikipedia==1.4.0 # via mentis (pyproject.toml) yarl==1.18.3 # via aiohttp zstandard==0.23.0 # via langsmith ================================================ FILE: setup.py ================================================ from setuptools import setup setup() ================================================ FILE: super_agents/__init__.py ================================================ ================================================ FILE: super_agents/browser_use/README.md ================================================ n# Browser Agent (基于 LangGraph) - super_agents/browser_use ## 概述 本项目实现了一个基于 LangGraph 框架的 Web 浏览和交互 Agent。其核心目标是让一个大型语言模型 (LLM) 能够像人一样理解任务指令,自主地控制浏览器(通过 Playwright)来访问网页、分析内容、与页面元素交互(点击、输入、滚动等),并最终完成用户指定的任务,例如信息提取、表单填写、在线搜索等。 该 Agent 采用了多模态感知的设计思路,结合了传统的 DOM/Accessibility Tree 分析和可选的视觉语言模型 (VLM) 分析,以期在复杂网页上获得更鲁棒的理解和定位能力。 ## 核心技术栈 * **流程编排:** LangGraph (LangChain 的状态图编排库) * **浏览器自动化:** Playwright (异步 Python 版本) * **模型调用:** LangChain ChatModels (`langchain-openai`, `langchain-community` 等) * **语言模型 (LLM/VLM):** * **规划/决策 LLM:** 可配置,支持 OpenAI, Groq, xAI (Grok), 及其他 OpenAI 兼容 API (通过 `llm.py` 和 `.env` 配置)。 * **视觉分析 VLM:** 可选,通过 OpenRouter 调用支持 Vision 的模型 (如 Qwen-VL, GPT-4o, Claude 3.5 Sonnet 等) (通过 `detector.py` 和 `.env` 配置)。 * **依赖管理:** `uv` (或 `pip`) * **配置:** `.env` 文件 ## 项目架构 项目主要文件和目录结构如下: ``` super_agents/ └── browser_use/ # Agent 根目录 ├── agent/ # LangGraph 核心实现 │ ├── __init__.py │ ├── graph.py # 定义 LangGraph 图结构、节点连接、条件边 │ ├── nodes.py # 定义图中各节点 (Node) 的具体执行逻辑 (AgentNodes 类) │ ├── state.py # 定义 Agent 在图中流转的状态 (AgentState) │ ├── schemas.py # 定义数据模型 (如动作指令 Action Schema, VLM 输出 Schema) │ └── prompts.py # 管理发送给规划 LLM 和 VLM 的 Prompt 模板 │ ├── browser/ # 浏览器交互底层实现 (基于原始项目代码) │ ├── __init__.py │ ├── browser.py # 核心 Browser 类,封装 Playwright 操作、感知方法 (get_content, update_state) │ ├── detector.py # 视觉检测器类,实现 VLM 调用逻辑 │ ├── models.py # 定义浏览器状态、元素等 Pydantic 模型 │ ├── utils.py # 浏览器相关的工具函数 │ └── findVisibleInteractiveElements.js # 用于 DOM 元素检测的 JS 脚本 │ ├── llm/ # LLM 相关实现 │ ├── __init__.py │ └── llm.py # 定义 ChatOpenRouter (VLM 调用), initialize_llms (规划 LLM 初始化), generate_structured_output │ ├── main.py # Agent 的主入口脚本 ├── requirements.txt # Python 依赖列表 ├── README.md # 本文件 └── .env # 环境变量配置文件 (需要手动创建) ``` ## 核心概念与设计 ### 1. LangGraph 状态机 Agent 的核心控制流由 LangGraph 管理。它被实现为一个状态机 (`StateGraph`): * **状态 (State):** `agent/state.py` 中的 `AgentState` (TypedDict) 定义了在节点间传递的数据,包含当前任务、浏览器内容/状态、LLM 解析出的动作、历史记录、错误信息等。 * **节点 (Nodes):** `agent/nodes.py` 中的 `AgentNodes` 类定义了主要的处理步骤,作为图的节点: * `get_browser_state`: 调用 `Browser` 类的感知方法 (当前是 `get_content`) 获取页面信息。 * `plan_action`: 将感知信息和任务包装成 Prompt,调用**规划 LLM** (通过 `llm.py` 的 `generate_structured_output`) 获取结构化的下一步动作 JSON。 * `execute_action`: 解析 `plan_action` 返回的动作 JSON,并调用 `Browser` 类中相应的交互方法 (如 `Maps_to`, `click`, `type`, `scroll`, `wait`) 执行操作。 * **边 (Edges):** `agent/graph.py` 定义了节点间的固定跳转(如 `get_browser_state` -> `plan_action`)和条件跳转(如 `execute_action` 后根据 `should_end` 函数判断是结束 `END` 还是回到 `get_browser_state`)。 ### 2. 
感知 (Perception) Agent 通过 `browser.py` 中的 `Browser.get_content()` 方法(被 `get_browser_state` 节点调用)来理解当前网页状态。该方法整合了多种信息源,旨在为 LLM 提供丰富且相对简洁的页面表示: * **简化 DOM:** 通过注入并执行 `SIMPLIFY_PAGE_SCRIPT` JavaScript,移除无关标签(脚本、样式等),提取关键交互元素及其属性,并为这些元素添加 `x-pw-id` 唯一标识。结果以伪 HTML 字符串形式返回。 * **可访问性树 (AX Tree):** (当前实现中暂时禁用/存在错误) 理论上通过 `page.accessibility.snapshot()` 获取页面的语义结构信息(角色、名称等),以 JSON 字符串形式返回。 * **视觉元素 (VLM):** (可选,需配置) * 如果 `.env` 文件中配置了 VLM (`OPENROUTER_API_KEY`, `VLM_API_MODEL`),`get_content` 会调用 `Detector` 实例。 * `Detector` (在 `browser/detector.py` 中) 使用 LangChain 的 `ChatOpenRouter` (在 `llm.py` 中定义) 调用配置的 VLM API。 * 通过精心设计的 Prompt (`VLM_PROMPT_TEMPLATE`) 请求 VLM 返回页面交互元素的**描述、类型和边界框百分比坐标** (JSON 格式)。 * `Detector` 解析 VLM 返回的 JSON,创建 `InteractiveElement` 对象列表(目前坐标是占位符)。 * `get_content` 将这些视觉元素信息格式化为**文本摘要** (包含 VLM 分配的 ID 和边界框信息)。 * **合并与截断:** `get_content` 将 URL、简化 DOM、AX Tree (如果成功)、视觉元素摘要合并为一个长的文本字符串,并在超过 `max_length` 时进行截断,最后返回给 `plan_action` 节点。 ### 3. 规划 (Planning) * `plan_action` 节点接收 `get_content` 返回的**混合文本字符串**。 * `agent/prompts.py` 中的 `create_agent_prompt` 函数将任务描述、历史记录、错误信息(如果有)和这段混合文本整合成一个 Prompt。 * 该 Prompt 被发送给**规划 LLM**(通过 `llm.py` 中的 `generate_structured_output` 函数,该函数使用 LangChain 的 `.with_structured_output()` 功能)。 * LLM 被要求分析输入信息,决定下一步动作,并**严格按照 `agent/schemas.py` 中定义的 `LLMResponse` Pydantic 模型返回一个包含具体动作指令的 JSON**。Prompt 中包含了对生成**健壮 CSS 选择器**(优先使用稳定 ID、aria-label、文本内容,结合 `x-pw-id`)的明确指导。 ### 4. 行动 (Action Execution) * `execute_action` 节点接收规划 LLM 返回的结构化动作 JSON (存储在 `state['parsed_action']`)。 * 它解析出动作类型 (`type`) 和参数 (`selector`, `url`, `text`, `direction` 等)。 * 根据动作类型,调用 `browser/browser.py` 中 `Browser` 类对应的**简单交互方法**: * `Maps_to(url)` * `click(selector)` * `type(selector, text)` * `scroll(direction)` * `wait(milliseconds)` * 这些方法内部使用 Playwright 的 `page.goto`, `page.locator(...).click`, `page.locator(...).fill`, `page.evaluate(...)` 等函数执行实际的浏览器操作。 * 如果动作是 `finish` 或 `error`,图流程会根据 `graph.py` 中的 `should_end` 函数判断并终止。 ## 安装与配置 1. **环境:** 推荐使用 Python 3.10+。 2. **依赖安装:** * 克隆项目。 * 进入 `super_agents/browser_use/` 目录。 * 创建并激活虚拟环境 (使用 uv): ```bash uv venv source .venv/bin/activate # Linux/macOS # 或者 .venv\Scripts\activate # Windows ``` * 安装依赖项 (使用 uv): ```bash uv sync ``` 3. **Playwright 浏览器:** 运行 `playwright install` (至少需要 `playwright install chromium`) 来下载浏览器驱动。 4. **环境变量 (`.env` 文件):** * 在 `super_agents/browser_use/` 目录下创建一个名为 `.env` 的文件。 * 参考我们之前讨论的 `.env` 示例,**至少需要配置**: * **规划 LLM:** 选择一个 Provider (如 `openai`), 设置 `LLM_PROVIDER`, `LLM_MODEL_NAME`, 以及对应的 API Key (如 `OPENAI_API_KEY`)。 * **VLM (可选):** 如果要启用视觉分析,设置 `OPENROUTER_API_KEY` 和 `VLM_API_MODEL` (设置为 OpenRouter 上支持视觉的模型 ID,如 `openai/gpt-4.1`等)。 * 确保 `.env` 文件被正确加载(`main.py` 和 `llm.py` 中包含 `load_dotenv()`)。 ## 如何运行 1. 确保已完成安装和配置。 2. 激活虚拟环境。 3. 从 `super_agents/` 目录(即 `browser_use` 的**上级**目录)运行 `main.py`: ```bash # 基本运行 python -m browser_use.main "您的任务描述" # 示例:访问 Hacker News 并获取导航栏信息 python -m browser_use.main "访问 news.ycombinator.com,返回页面导航栏信息" # 示例:使用其他命令行参数(如果有定义,如下面的最大步骤数) python -m browser_use.main "您的任务描述" --max-steps 30 ``` ## 当前状态、局限性与未来工作 * **核心流程:** Agent 的基本 LangGraph 流程(感知-规划-行动循环)、浏览器操作(导航、点击、输入、滚动、等待)、规划 LLM 调用、可选的 VLM 调用**已经跑通**,能够完成一些多步骤的 Web 任务。 * **视觉集成 (部分):** VLM 调用流程已集成到 `Detector` 类并通过 `get_content` 触发(需配置 API Key 和 Model)。VLM 能够返回 JSON 格式的检测结果,并且可以被成功解析为内部数据结构 (`InteractiveElement`)。 * **局限性 & 待完善:** 1. **VLM 坐标处理:** VLM 返回的是百分比坐标,但在解析时 (`_parse_vlm_detections`) 目前使用的是**占位符像素坐标**。需要获取截图的实际尺寸,实现准确的百分比到像素的转换,才能真正利用视觉信息进行定位。 2. 
## Current Status, Limitations & Future Work

* **Core flow:** the agent's basic LangGraph loop (perceive-plan-act), browser operations (navigate, click, type, scroll, wait), planning-LLM calls, and optional VLM calls are **working end to end**, and the agent can complete some multi-step web tasks.
* **Vision integration (partial):** the VLM call path is integrated into the `Detector` class and triggered via `get_content` (requires an API key and model config). The VLM returns JSON detections that parse successfully into the internal data structure (`InteractiveElement`).
* **Limitations & TODO:**
    1. **VLM coordinate handling:** the VLM returns percentage coordinates, but parsing (`_parse_vlm_detections`) currently substitutes **placeholder pixel coordinates**. Accurate percentage-to-pixel conversion using the real screenshot dimensions is needed before visual information can actually be used for grounding.
    2. **Action execution:** `execute_action` still **relies entirely on the CSS selectors generated by the planning LLM**. Clicking/typing by VLM element ID or coordinates is not implemented yet, which limits the practical value of the vision capability, especially on complex pages where CSS selectors are unreliable.
    3. **Perception completeness:**
        * **Content truncation:** `get_content` output is truncated at `max_length`, which hurts tasks that need the whole page (e.g. "extract the full text"). Either raise `max_length` or implement smarter content extraction/scrolling.
        * **Missing AX tree:** the accessibility-tree code is currently commented out or broken, so important semantic information is missing. The `page.accessibility.snapshot()` call needs fixing.
    4. **Scrolling strategy:** scrolling currently relies on prompting the LLM. A more robust mechanism may be needed for long pages, e.g. the agent deciding internally whether to scroll, or exposing scroll-position information to the LLM.
    5. **Pydantic V1 warnings:** calling the planning LLM's `with_structured_output` still emits Pydantic V1 warnings; keep the LangChain libraries and Pydantic up to date.
    6. **Error handling:** error handling is fairly simple (e.g. VLM parse failures are skipped, execution errors terminate the graph); more sophisticated retry, fallback, or human-in-the-loop mechanisms could be added.
    7. **VLM stability:** whether the VLM reliably returns the required JSON format and bounding boxes depends heavily on the chosen model and prompt, and may need further tuning.
* **Future work:**
    * Fix AX-tree retrieval.
    * Implement accurate VLM percentage-to-pixel coordinate conversion.
    * Extend `execute_action` and the `Browser` class to support coordinate-based interaction.
    * Tune prompts so the LLM can output VLM element IDs, or fall back to coordinates when CSS selectors fail.
    * Implement smarter scrolling for long pages and full-content extraction.
    * Keep dependencies up to date to resolve the Pydantic warnings.
    * Strengthen error handling and recovery.

================================================
FILE: super_agents/browser_use/__init__.py
================================================

================================================
FILE: super_agents/browser_use/agent/__init__.py
================================================
# super_agents/browser_use/agent/__init__.py
"""
Browser agent module that handles browser automation using LLM guidance.
"""

================================================
FILE: super_agents/browser_use/agent/graph.py
================================================
# super_agents/browser_use/agent/graph.py
import logging
from typing import Dict, Any

from langchain_core.runnables.base import RunnableSerializable
from langgraph.graph import StateGraph, END

from .state import AgentState
from .nodes import AgentNodes
from ..browser.browser import Browser

logger = logging.getLogger(__name__)

NODE_GET_BROWSER_STATE = "get_browser_state"
NODE_PLAN_ACTION = "plan_action"
NODE_EXECUTE_ACTION = "execute_action"


# --- UPDATED Conditional Edge Logic ---
def should_end(state: AgentState) -> bool:
    """Determines if the graph should end."""
    action = state.get("parsed_action", {})
    action_type = action.get("type")
    error_occurred = state.get("error") is not None  # Check if execute_action reported an error

    # End if the LLM planned action is 'finish' or 'error'
    if action_type == "finish":
        logger.info("Graph execution: 'finish' action planned. Ending.")
        return True
    if action_type == "error":
        # Log the error message from the action payload
        logger.error(f"Graph execution: 'error' action planned by LLM: {action.get('message', 'Unknown error')}. Ending.")
        return True

    # End if the execute_action node reported an error in the state
    # Note: Depending on desired behavior, you might want to retry instead of ending on execution errors
    # if error_occurred:
    #     logger.error(f"Graph execution: Error occurred during execution: {state['error']}. Ending.")
    #     return True  # Uncomment this line if ANY execution error should terminate the graph

    return False  # Continue otherwise


def create_graph_app(browser: Browser, llm: RunnableSerializable):
    """
    Creates the LangGraph application using class-based nodes.
""" agent_nodes = AgentNodes(browser=browser, llm=llm) workflow = StateGraph(AgentState) workflow.add_node(NODE_GET_BROWSER_STATE, agent_nodes.get_browser_state) workflow.add_node(NODE_PLAN_ACTION, agent_nodes.plan_action) workflow.add_node(NODE_EXECUTE_ACTION, agent_nodes.execute_action) workflow.set_entry_point(NODE_GET_BROWSER_STATE) workflow.add_edge(NODE_GET_BROWSER_STATE, NODE_PLAN_ACTION) workflow.add_edge(NODE_PLAN_ACTION, NODE_EXECUTE_ACTION) # After executing action, decide whether to end or loop back workflow.add_conditional_edges( NODE_EXECUTE_ACTION, # Function to decide the next step based on the state *after* execution lambda state: END if should_end(state) else NODE_GET_BROWSER_STATE, { END: END, NODE_GET_BROWSER_STATE: NODE_GET_BROWSER_STATE } ) logger.info("Compiling LangGraph workflow...") app = workflow.compile() logger.info("LangGraph workflow compiled successfully.") return app ================================================ FILE: super_agents/browser_use/agent/nodes.py ================================================ # super_agents/browser_use/agent/nodes.py import asyncio import logging from typing import Dict, Any, Optional # --- LangChain Core Import for Type Hint --- from langchain_core.runnables.base import RunnableSerializable # <--- Import this from .state import AgentState from .schemas import ( BaseAction, LLMResponse ) from .prompts import create_agent_prompt # --- CORRECTED LLM IMPORT --- # Import only the necessary functions/classes that actually exist in llm.py from ..llm import generate_structured_output # Import the correct Browser from the browser subdirectory from ..browser.browser import Browser logger = logging.getLogger(__name__) # --- Class to hold nodes and dependencies --- class AgentNodes: """Encapsulates agent nodes and their dependencies (browser, llm).""" # --- CORRECTED TYPE HINT for llm --- def __init__(self, browser: Browser, llm: RunnableSerializable): # <--- Use RunnableSerializable if not isinstance(llm, RunnableSerializable): logger.warning(f"LLM instance provided to AgentNodes is not of type RunnableSerializable (actual type: {type(llm)}).") self.browser = browser self.llm = llm logger.info("AgentNodes initialized with browser and llm instances.") # --- Node method implementations remain the same --- async def get_browser_state(self, state: AgentState) -> Dict[str, Any]: """Node method to get the current state of the browser page.""" logger.info("Node: get_browser_state") try: content = await self.browser.get_content() return {"browser_content": content, "error": None} except Exception as e: logger.error(f"Error getting browser state: {e}", exc_info=True) return {"error": f"Failed to get browser state: {e}"} async def plan_action(self, state: AgentState) -> Dict[str, Any]: """Node method to decide the next action using the LLM's structured output.""" logger.info("Node: plan_action") if state.get("error"): logger.warning(f"Planning action with existing error: {state['error']}") prompt = create_agent_prompt( task=state["task"], current_browser_content=state["browser_content"], history=state.get("history", []), error_message=state.get("error") ) system_message = "You are an AI agent controlling a web browser. Respond with the single next action formatted as JSON matching the required schema." 
try: llm_response: Optional[LLMResponse] = await generate_structured_output( model=self.llm, # Pass the llm instance schema=LLMResponse, prompt=prompt, system_message=system_message ) if llm_response and isinstance(llm_response, LLMResponse): parsed_action_model: BaseAction = llm_response.action parsed_action_dict = parsed_action_model.dict() logger.info(f"LLM proposed action: {parsed_action_dict.get('type', 'unknown')}") return {"parsed_action": parsed_action_dict, "error": None} else: logger.error("Failed to get valid structured output from LLM.") error_action_dict = {"type": "error", "message": "Failed to get valid structured output from LLM."} return {"parsed_action": error_action_dict, "error": "LLM did not return valid structured output."} except Exception as e: logger.error(f"Error during structured action planning: {e}", exc_info=True) error_action_dict = {"type": "error", "message": f"LLM planning exception: {e}"} return {"parsed_action": error_action_dict, "error": f"LLM planning exception: {e}"} async def execute_action(self, state: AgentState) -> Dict[str, Any]: """Node method to execute the action dictionary from the state.""" logger.info("Node: execute_action") action_dict = state.get("parsed_action") history = state.get("history", []) if not action_dict or not isinstance(action_dict, dict) or "type" not in action_dict: error_msg = "No valid action dictionary provided to execute." logger.error(error_msg) return {"error": error_msg} action_type = action_dict.get("type") action_repr = f"Action: {action_type}, Details: { {k:v for k,v in action_dict.items() if k != 'type'} }" logger.info(f"Executing {action_repr}") new_history = history + [action_repr] try: if action_type == "navigate": await self.browser.navigate_to(action_dict["url"]) # Check if method name/args match Browser class elif action_type == "click": await self.browser.click(action_dict["selector"]) # Check Browser class for click method/args elif action_type == "type": await self.browser.type(action_dict["selector"], action_dict["text"]) # Check Browser class for type method/args elif action_type == "scroll": await self.browser.scroll(action_dict["direction"]) # Check Browser class for scroll method/args elif action_type == "wait": await self.browser.wait(action_dict["milliseconds"]) # Check Browser class for wait method/args elif action_type == "get_content": logger.info("Action 'get_content' requested (will be handled by next cycle)") pass elif action_type == "finish": logger.info(f"Action 'finish' received. 
Result: {action_dict.get('result')}")
                pass
            elif action_type == "error":
                error_msg = action_dict.get("message", "LLM signaled an error.")
                logger.error(f"Executing 'error' action from LLM: {error_msg}")
                return {"error": error_msg, "history": new_history}
            else:
                error_msg = f"Attempted to execute unknown/unhandled action type: {action_type}"
                logger.error(error_msg)
                return {"error": error_msg, "history": new_history}

            return {"error": None, "history": new_history}
        except Exception as e:
            logger.error(f"Error executing action '{action_type}': {e}", exc_info=True)
            return {"error": f"Failed to execute action '{action_type}': {e}", "history": new_history}

================================================
FILE: super_agents/browser_use/agent/prompts.py
================================================
from typing import List, Optional

def create_agent_prompt(
    task: str,
    current_browser_content: str,  # This string now potentially contains URL, DOM, AX Tree, and Visual Elements
    history: List[str],
    error_message: Optional[str] = None
) -> str:
    """
    Generates the prompt to be sent to the LLM based on the current state.
    Includes sections for Simplified DOM, Accessibility Tree, and Visual Elements.
    """
    prompt_parts = []
    prompt_parts.append("You are an AI agent controlling a web browser to complete a task.")
    prompt_parts.append(f"Your current task is: {task}")

    if error_message:
        prompt_parts.append(f"\nAn error occurred in the previous step: {error_message}")
        prompt_parts.append("Please analyze the error and the current browser state, then decide the next best action.")

    prompt_parts.append("\n\n# Current Browser Perception:")
    # The browser_content string now contains multiple sections, as generated by get_content
    prompt_parts.append(current_browser_content)

    if history:
        prompt_parts.append("\n\n# History of Previous Actions:")
        for i, item in enumerate(history[-5:], 1):
            prompt_parts.append(f"{i}. {item}")

    # --- Instructions with guidance on using all perception data ---
    instructions = """
# Instructions:
Analyze the **Current Browser Perception** section above, which includes:
1. **Page URL:** The current web address.
2. **Simplified DOM:** A structural view of the page with interactive elements marked with `x-pw-id` attributes.
3. **Accessibility Tree:** Semantic information about elements (roles, names).
4. **Visual Elements:** Elements detected visually via Computer Vision (CV), including their bounding boxes `[L:left, T:top, R:right, B:bottom]` and IDs (e.g., `cv-0`, `cv-1`).

Based on the task and ALL available perception information, decide the single next action to take.
Your response MUST be a JSON object with a single top-level key named "action".
The value of the "action" key MUST be an object matching one of the following action schemas:
- Navigate: {{"type": "navigate", "url": "<url>"}}
- Click: {{"type": "click", "selector": "<css selector>", "description": "<why>"}}
- Type: {{"type": "type", "selector": "<css selector>", "text": "<text to type>", "description": "<why>"}}
- Scroll: {{"type": "scroll", "direction": "<up|down|left|right>"}}
- Finish: {{"type": "finish", "result": "<final answer>"}}
- Error: {{"type": "error", "message": "<error description>"}} (Use if you detect an unrecoverable error or loop)
- GetContent: {{"type": "get_content", "description": "<reason>"}}

**Important Task Handling Guidance:**
1. **Identify elements** using the DOM, AX Tree (if available), and Visual Elements. Use robust selectors as previously guided.
2.
**If the task requires reading or extracting content that might extend beyond the current view (e.g., '摘录全文', 'find all items', 'read the article'), and you haven't finished scrolling, your next action should likely be to SCROLL DOWN.** Use: `{{"action": {{"type": "scroll", "direction": "down"}}}}` 3. Only use `get_content` if you believe scrolling will not help or if you need to re-analyze after a non-scroll action. 4. Once you believe you have scrolled enough and have all necessary information visible in the content provided, proceed with the extraction or final action. 5. If the task is complete, use the 'finish' action. Example Response: ```json {{ "action": {{ "type": "click", "selector": "a[x-pw-id='pw-16']:has-text('new')", "description": "Click the 'new' link, corresponds to visual element cv-3" }} }} {{ "action": {{ "type": "scroll", "direction": "down" }} }} ``` Provide ONLY the JSON object containing the 'action' key in a ```json ... ``` block. Think step-by-step. Correlate information from the DOM, AX Tree, and Visual Elements if possible. Choose the most precise and stable selector. If the task is complete, use the 'finish' action. """ prompt_parts.append(instructions) # --- End Instructions --- final_prompt = "\n".join(prompt_parts) return final_prompt ================================================ FILE: super_agents/browser_use/agent/schemas.py ================================================ # super_agents/browser_use/agent/schemas.py from typing import Literal, Optional, Union, List, Dict, Any, Type # Use Pydantic V2+ if installed, otherwise V1 syntax try: from pydantic.v1 import BaseModel, Field except ImportError: from pydantic import BaseModel, Field # Fallback to V2 # --- Action Type --- ActionTypeLiteral = Literal[ "navigate", "click", "type", "scroll", "wait", "get_content", "finish", "error" ] # --- Pydantic Schemas for Actions --- # Using Pydantic allows for better validation and compatibility # with LangChain's structured output features. 
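# Example (illustrative, not part of the original file) of the JSON shape the
# planning LLM is asked to emit, which parses into the LLMResponse model below:
#   {"action": {"type": "click", "selector": "a[x-pw-id='pw-16']",
#               "description": "Open the 'new' link"}}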
class BaseAction(BaseModel): """Base schema for all actions, containing the type.""" type: ActionTypeLiteral = Field(..., description="The type of action to perform.") class NavigateAction(BaseAction): type: Literal["navigate"] = "navigate" url: str = Field(..., description="The URL to navigate to.") class ClickAction(BaseAction): type: Literal["click"] = "click" selector: str = Field(..., description="CSS selector for the element to click.") description: Optional[str] = Field(None, description="Optional description of the element being clicked.") class TypeAction(BaseAction): type: Literal["type"] = "type" selector: str = Field(..., description="CSS selector for the input field.") text: str = Field(..., description="The text to type into the field.") description: Optional[str] = Field(None, description="Optional description of the element being typed into.") class ScrollAction(BaseAction): type: Literal["scroll"] = "scroll" direction: Literal["up", "down", "left", "right"] = Field(..., description="The direction to scroll the page.") # selector: Optional[str] = Field(None, description="Optional CSS selector of element to scroll within.") # Add if needed class WaitAction(BaseAction): type: Literal["wait"] = "wait" milliseconds: int = Field(..., description="Duration to wait in milliseconds.") class GetContentAction(BaseAction): type: Literal["get_content"] = "get_content" # No extra fields needed, just signifies intent to refresh state description: Optional[str] = Field("Requesting updated browser content", description="Reason for requesting content.") class FinishAction(BaseAction): type: Literal["finish"] = "finish" result: str = Field(..., description="The final answer or summary of the completed task.") class ErrorAction(BaseAction): type: Literal["error"] = "error" message: str = Field(..., description="Description of the error encountered or signaled by the LLM.") # --- Union for Parsing --- # LangChain's with_structured_output often works best when targeting a single Pydantic model # that uses discriminated unions (if available in your Pydantic version) or by prompting # the LLM clearly to only output ONE type of action JSON matching the base structure. # For simplicity here, we define the *expected output structure* the LLM should generate. # The parsing function might need refinement based on how the LLM structures the output. # Define the overall structure the LLM should output, which includes one of the actions. # This structure helps `with_structured_output`. class LLMResponse(BaseModel): action: Union[ NavigateAction, ClickAction, TypeAction, ScrollAction, WaitAction, GetContentAction, FinishAction, ErrorAction ] = Field(..., description="The specific action determined by the LLM.") # --- Parsing Function (Placeholder/Example) --- # The `generate_structured_output` function in llm.py now handles the parsing # directly into the Pydantic schema (LLMResponse). # So, we might not need a separate manual parsing function here if using that. # If you need manual parsing from raw text (less reliable): # def parse_llm_response_manual(response: str) -> Optional[BaseAction]: # # ... (complex logic using regex or JSON parsing as in previous example) # # This would return one of the action models (NavigateAction, ClickAction, etc.) 
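# Usage sketch (illustrative, not part of the original file): binding this schema
# through LangChain's structured-output support, as generate_structured_output in
# llm.py does internally:
#
#   structured_llm = llm.with_structured_output(LLMResponse)
#   response = await structured_llm.ainvoke("Go to https://example.com")
#   response.action.type  # -> "navigate"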
#     pass

================================================
FILE: super_agents/browser_use/agent/state.py
================================================
# super_agents/browser_use/agent/state.py
from typing import Dict, List, Optional, Any, TypedDict

# Define the state structure using TypedDict for type hinting
class AgentState(TypedDict, total=False):
    """
    TypedDict representing the state of the browser agent during execution.

    Attributes:
        task: The user task description
        browser_content: The current HTML content of the browser
        parsed_action: The last action parsed from LLM response
        history: List of previous actions taken
        error: Any error message from the last operation
    """
    task: str
    browser_content: str
    parsed_action: Dict[str, Any]
    history: List[str]
    error: Optional[str]

================================================
FILE: super_agents/browser_use/agent/tools.py
================================================

================================================
FILE: super_agents/browser_use/agent.py
================================================
# super_agents/browser_use/agent.py
"""
Agent API for browser-based task execution.
Provides a simplified interface similar to the original implementation.
"""
import asyncio
import logging
from typing import Any, Dict, Optional

from .agent.graph import create_graph_app
from .agent.state import AgentState
from .browser.browser import Browser, BrowserConfig  # BrowserConfig is defined in browser.py; there is no browser/config.py
from .llm import initialize_llms

logger = logging.getLogger(__name__)

class Agent:
    """
    Agent class that provides a simple interface for browser automation with LLM.
    This implementation is similar to the original API but uses the current
    browser automation stack with LangGraph.
    """
    def __init__(
        self,
        llm=None,
        browser_config: Optional[BrowserConfig] = None,
        max_steps: int = 50
    ):
        """
        Initialize the Agent with optional LLM and browser configuration.

        Args:
            llm: LLM instance to use (if None, will initialize from environment)
            browser_config: Browser configuration options
            max_steps: Maximum number of steps the agent can take
        """
        self.browser_config = browser_config or BrowserConfig()
        self.llm = llm
        self.max_steps = max_steps
        self.browser = None
        self._app = None

    async def _initialize(self):
        """Initialize the browser and LLM if not already initialized."""
        # Initialize LLM if not provided
        if self.llm is None:
            logger.info("Initializing LLM from environment variables")
            self.llm, _ = initialize_llms()
            if self.llm is None:
                raise ValueError("Failed to initialize LLM. Check API keys and .env settings.")

        # Initialize browser
        self.browser = Browser(config=self.browser_config)
        await self.browser.initialize()

        # Initialize LangGraph app
        self._app = create_graph_app(browser=self.browser, llm=self.llm)

    async def run(self, prompt: str) -> Dict[str, Any]:
        """
        Run the agent with the given prompt/task.
Args: prompt: The task description or prompt for the agent Returns: Dictionary containing the execution result """ # Ensure initialization if self.browser is None or self._app is None: await self._initialize() # Define the initial state initial_state = AgentState( task=prompt, browser_content="", parsed_action={}, history=[], error=None ) # Run the graph logger.info(f"Starting agent execution for task: {prompt}") try: final_state = await self._app.ainvoke( initial_state, config={"recursion_limit": self.max_steps} ) # Process result if final_state.get("error"): logger.error(f"Agent finished with error: {final_state['error']}") return {"result": f"Error: {final_state['error']}", "success": False} elif final_state.get("parsed_action", {}).get("type") == "finish": result = final_state["parsed_action"].get("result", "Task finished, but no result extracted.") logger.info(f"Agent finished successfully. Result: {result}") return {"result": result, "success": True} else: logger.warning("Agent finished without a 'finish' action or error.") return { "result": "Agent stopped without producing a final answer.", "success": False, "state": final_state } except Exception as e: logger.error(f"Agent execution failed: {e}", exc_info=True) return {"result": f"Error during execution: {str(e)}", "success": False} finally: # Clean up resources if self.browser: await self.browser.close() self.browser = None self._app = None def __del__(self): """Ensure resources are cleaned up.""" if self.browser: asyncio.create_task(self.browser.close()) # Provider classes for compatibility with original API class OpenAIProvider: """OpenAI provider compatible with the interface""" def __init__(self, model="gpt-4o-mini", api_key=None, temperature=0.1): """ Initialize OpenAI provider. Args: model: Model name to use api_key: OpenAI API key (if None, will use from environment) temperature: Temperature for generation """ self.model = model self.api_key = api_key self.temperature = temperature # These parameters will be used by initialize_llms() internally import os if api_key: os.environ["OPENAI_API_KEY"] = api_key os.environ["LLM_PROVIDER"] = "openai" os.environ["LLM_MODEL_NAME"] = model os.environ["LLM_TEMPERATURE"] = str(temperature) class AnthropicProvider: """Anthropic provider compatible with the interface""" def __init__(self, model="claude-3-opus-20240229", api_key=None, temperature=0.1, enable_thinking=False, thinking_token_budget=None): """ Initialize Anthropic provider. 
Args: model: Model name to use api_key: Anthropic API key (if None, will use from environment) temperature: Temperature for generation enable_thinking: Enable thinking step (not fully supported in current implementation) thinking_token_budget: Tokens for thinking (not fully supported) """ self.model = model self.api_key = api_key self.temperature = temperature self.enable_thinking = enable_thinking self.thinking_token_budget = thinking_token_budget # These parameters will be used by initialize_llms() internally import os if api_key: os.environ["ANTHROPIC_API_KEY"] = api_key os.environ["LLM_PROVIDER"] = "anthropic" os.environ["LLM_MODEL_NAME"] = model os.environ["LLM_TEMPERATURE"] = str(temperature) # Add convenience imports to __init__.py # This will allow: from super_agents.browser_use import Agent, OpenAIProvider, BrowserConfig ================================================ FILE: super_agents/browser_use/browser/browser.py ================================================ # super_agents/browser_use/browser/browser.py """ Streamlined Playwright browser implementation with integrated perception capabilities. Includes DOM/AX Tree/Visual analysis and basic interaction methods. """ import asyncio import json import logging import functools import base64 import os from dataclasses import dataclass, field # from importlib import resources # Not used from typing import Any, Optional, TypedDict, List, Dict # Added List, Dict # --- Local Imports (Ensure these files exist in the same directory) --- try: from .observe_helper import observe except ImportError: def observe(name, ignore_input=False, ignore_output=False): def decorator(func): return func return decorator logging.basicConfig(level=logging.WARNING) # Setup basic logging if needed logger_observe = logging.getLogger(__name__) logger_observe.warning("observe_helper not found, using dummy decorator.") try: from .detector import Detector from .models import ( BrowserError, BrowserState, InteractiveElementsData, TabInfo, InteractiveElement, ) from .utils import ( combine_and_filter_elements, put_highlight_elements_on_screenshot, ) except ImportError as e: logging.basicConfig(level=logging.ERROR) logger_import = logging.getLogger(__name__) logger_import.error(f"Failed to import local browser dependencies (detector, models, utils): {e}. 
Browser class may not function correctly.", exc_info=True) # Define dummy classes to allow file loading, but functionality will be broken class Detector: enabled=False class BrowserError(Exception): pass class BrowserState: pass class InteractiveElementsData: elements=[]; viewport={} class TabInfo: pass class InteractiveElement: pass def combine_and_filter_elements(a, b): return [] def put_highlight_elements_on_screenshot(a, b): return None # --- End Local Imports --- # --- Playwright Imports --- from playwright.async_api import ( Browser as PlaywrightBrowser, BrowserContext as PlaywrightBrowserContext, Page, Playwright, StorageState, async_playwright, Error as PlaywrightError ) # --- Tenacity Import --- from tenacity import ( retry, retry_if_exception_type, stop_after_attempt, wait_exponential, ) logger = logging.getLogger(__name__) # Ensure basic logging is configured if not done elsewhere if not logger.hasHandlers(): logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s') # --- Load JavaScript Files --- INTERACTIVE_ELEMENTS_JS_CODE = "" SIMPLIFY_PAGE_SCRIPT = "" try: current_dir = os.path.dirname(os.path.abspath(__file__)) # JS for DOM-based interactive elements used in get_interactive_elements_data js_file_path_interactive = os.path.join(current_dir, 'findVisibleInteractiveElements.js') with open(js_file_path_interactive, 'r', encoding='utf-8') as js_file: INTERACTIVE_ELEMENTS_JS_CODE = js_file.read() # JS for DOM simplification used in get_content # (Re-paste the script here for completeness) SIMPLIFY_PAGE_SCRIPT = """ (() => { const MAX_ELEMENTS = 250; const MAX_TEXT_LENGTH = 200; const INTERACTIVE_TAGS = ['a', 'button', 'input', 'textarea', 'select', 'option', 'details', 'summary', 'label']; const EXCLUDED_TAGS = ['script', 'style', 'noscript', 'svg', 'link', 'meta', 'head', 'embed', 'object', 'path', 'canvas', 'iframe', 'video', 'audio']; let elementCount = 0; let uniqueIdCounter = 0; function isVisible(el) { if (!el || !el.checkVisibility) return false; return el.checkVisibility({checkOpacity: true, checkVisibilityCSS: true}); } function truncateText(text, maxLength = MAX_TEXT_LENGTH) { if (typeof text !== 'string') return text; return text.length > maxLength ? text.substring(0, maxLength) + '...' 
: text;
        }

        function getElementData(el) {
            const data = { tag: el.tagName.toLowerCase(), attributes: {}, text: '', children: [], pw_id: `pw-${uniqueIdCounter++}` };
            try { if (document.body.contains(el)) el.setAttribute('x-pw-id', data.pw_id); } catch(e){}
            const attrsToKeep = ['id', 'class', 'role', 'aria-label', 'aria-labelledby', 'aria-describedby', 'aria-hidden', 'aria-invalid', 'aria-required', 'placeholder', 'title', 'alt', 'for', 'name', 'type', 'href', 'value', 'selected', 'checked', 'disabled', 'readonly', 'open'];
            for (const attr of attrsToKeep) {
                if (el.hasAttribute(attr)) {
                    let value = el.getAttribute(attr);
                    if (attr === 'class' && value) value = value.split(' ').filter(c => c && c.length > 1 && c.length < 30 && !/^[0-9]+$/.test(c)).slice(0, 5).join(' ');
                    if (value !== null && value !== '') data.attributes[attr] = truncateText(String(value), 80);
                }
            }
            if (['button', 'a', 'label', 'summary'].includes(data.tag) && !data.attributes['aria-label'] && el.textContent) data.attributes['aria-label'] = truncateText(el.textContent.trim(), 80);
            try {
                if (el.tagName.toLowerCase() === 'input' && !data.attributes.value && el.value) data.attributes.value = truncateText(el.value);
                else if (el.tagName.toLowerCase() === 'textarea' && !data.attributes.value && el.value) data.attributes.value = truncateText(el.value);
                else if (el.tagName.toLowerCase() === 'select' && el.options && el.selectedIndex !== -1 && !data.attributes.value) data.attributes.value = truncateText(el.options[el.selectedIndex].text);
            } catch (e) {}
            try {
                const directText = Array.from(el.childNodes).filter(node => node.nodeType === Node.TEXT_NODE && node.textContent.trim().length > 0).map(node => node.textContent.trim()).join(' ').replace(/\s+/g, ' ');
                if (directText) data.text = truncateText(directText);
            } catch (e) {}
            return data;
        }

        function simplifyNode(node) {
            if (elementCount >= MAX_ELEMENTS) return null;
            if (node.nodeType !== Node.ELEMENT_NODE || EXCLUDED_TAGS.includes(node.tagName.toLowerCase())) {
                if (node.nodeType === Node.TEXT_NODE && node.textContent.trim().length === 0) return null;
                return null;
            }
            elementCount++;
            const elementData = getElementData(node);
            if (node.hasChildNodes()) {
                Array.from(node.childNodes).forEach(child => {
                    if (INTERACTIVE_TAGS.includes(node.tagName.toLowerCase()) && child.nodeType === Node.ELEMENT_NODE) return;
                    const simplifiedChild = simplifyNode(child);
                    if (simplifiedChild) elementData.children.push(simplifiedChild);
                });
            }
            const isInteractive = INTERACTIVE_TAGS.includes(elementData.tag);
            const hasMeaningfulAttrs = Object.keys(elementData.attributes).some(k => k !== 'x-pw-id');
            if (!isInteractive && !hasMeaningfulAttrs && elementData.children.length === 0 && !elementData.text) {
                try { if (document.body.contains(node)) node.removeAttribute('x-pw-id'); } catch(e){}
                return null;
            }
            return elementData;
        }
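        // (Illustrative comment, not part of the original script.) The pseudo-HTML
        // emitted at the end of this IIFE looks like:
        //   <a x-pw-id="pw-16" href="newest" aria-label="new">new</a>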
        if (!document.body) return "<body> element not found.";
        const simplifiedBody = simplifyNode(document.body);

        function convertToPseudoHTML(node) {
            if (!node) return '';
            let attrs = `x-pw-id="${node.pw_id}"`;
            for (const [key, value] of Object.entries(node.attributes)) attrs += ` ${key}="${String(value).replace(/"/g, '&quot;')}"`;
            let childrenHTML = node.children.map(convertToPseudoHTML).join('');
            let textContent = node.text ? String(node.text).replace(/</g, '&lt;').replace(/>/g, '&gt;') : '';
            if (['input', 'img', 'br', 'hr'].includes(node.tag)) return `<${node.tag} ${attrs} />`;
            else return `<${node.tag} ${attrs}>${textContent}${childrenHTML}</${node.tag}>`;
        }
        return convertToPseudoHTML(simplifiedBody);
    })()
    """
except FileNotFoundError:
    logger.error(f"JavaScript file 'findVisibleInteractiveElements.js' not found in {current_dir}. Interactive element detection (JS based) will fail.")
    INTERACTIVE_ELEMENTS_JS_CODE = "() => ({ viewport: { width: window.innerWidth, height: window.innerHeight }, elements: [] });"  # Provide fallback
except Exception as e:
    logger.error(f"Error loading JavaScript file(s): {e}", exc_info=True)
    INTERACTIVE_ELEMENTS_JS_CODE = "() => ({ viewport: { width: window.innerWidth, height: window.innerHeight }, elements: [] });"
    SIMPLIFY_PAGE_SCRIPT = "() => 'Error loading simplification script.';"

# --- TypedDict for Viewport Size ---
class ViewportSize(TypedDict):
    width: int
    height: int

# --- BrowserConfig Dataclass (Corrected: No CV Endpoints) ---
@dataclass
class BrowserConfig:
    """
    Configuration for the Browser.
    """
    cdp_url: Optional[str] = None
    viewport_size: ViewportSize = field(default_factory=lambda: {"width": 1200, "height": 900})
    storage_state: Optional[StorageState] = None
    # CV/Sheets Endpoints Removed

# --- Main Browser Class ---
class Browser:
    """
    Unified Browser responsible for interacting with the browser via Playwright.
    Includes methods for navigation, simple actions, perception (DOM, AX Tree, optional VLM),
    and state management. Initializes its own VLM detector based on environment variables.
    """
    def __init__(self, config: BrowserConfig = BrowserConfig(), close_context: bool = True):
        """
        Initializes the Browser instance.
        """
        logger.debug('Initializing browser')
        self.config = config
        self.close_context = close_context

        # Playwright attributes
        self.playwright: Optional[Playwright] = None
        self.playwright_browser: Optional[PlaywrightBrowser] = None
        self.context: Optional[PlaywrightBrowserContext] = None

        # Page and state management
        self.current_page: Optional[Page] = None
        self._state: Optional[BrowserState] = None  # This holds the rich state from update_state
        self._cdp_session = None

        # Initialize Detector internally
        try:
            self.detector: Optional[Detector] = Detector()
            if not self.detector.enabled:
                self.detector = None
                logger.warning("Detector initialized but disabled due to missing config/errors.")
            else:
                logger.info("Detector initialized successfully.")
        except NameError:
            logger.error("Detector class not found (likely due to import errors).
Vision disabled.") self.detector = None except Exception as e: logger.error(f"Unexpected error initializing Detector: {e}", exc_info=True) self.detector = None # REMOVED self._init_state() call as method doesn't exist / state init is implicit # --- Context Management Methods --- async def __aenter__(self): await self.initialize() return self async def __aexit__(self, exc_type, exc_val, exc_tb): if self.close_context: await self.close() # --- Public Initialization and Closing --- async def initialize(self): """Initializes browser, context, page if not already done.""" if self.current_page and self.context and self.playwright_browser and self.playwright: logger.debug("Browser already initialized.") return self logger.info("Initializing browser instance via initialize()") # Changed level await self._init_browser() return self async def close(self): """Closes the browser and cleans up Playwright resources.""" if not self.playwright: return logger.info('Closing browser...') try: self._cdp_session = None if self.context: try: await self.context.close() except Exception as e: logger.warning(f'Failed to close context: {e}') if self.playwright_browser and not self.config.cdp_url: try: await self.playwright_browser.close() except Exception as e: logger.warning(f'Failed to close browser: {e}') if self.playwright: try: await self.playwright.stop() except Exception as e: logger.warning(f'Failed to stop Playwright: {e}') except Exception as e: logger.error(f'Error during browser cleanup: {e}', exc_info=True) finally: # Ensure attributes are cleared self.context = None; self.current_page = None; self._state = None self.playwright_browser = None; self.playwright = None; self._cdp_session = None logger.info("Browser closed.") # --- Internal Initialization Helper --- async def _init_browser(self): """Internal method to initialize Playwright components.""" if self.current_page and self.context: return # Avoid re-init if basics exist logger.debug('Running internal browser context initialization _init_browser()') try: if self.playwright is None: self.playwright = await async_playwright().start() if self.playwright_browser is None: if self.config.cdp_url: logger.info(f'Connecting to remote browser via CDP {self.config.cdp_url}') self.playwright_browser = await self.playwright.chromium.connect_over_cdp(self.config.cdp_url, timeout=5000) else: logger.info(f'Launching new browser instance (headless=False assumed)') # Note: Headless mode might need to be configurable via BrowserConfig again if needed self.playwright_browser = await self.playwright.chromium.launch( headless=False, args=[ # Common args for stability/anti-detection '--no-sandbox', '--disable-setuid-sandbox', '--disable-infobars', '--disable-blink-features=AutomationControlled', '--disable-dev-shm-usage', '--disable-gpu', '--window-size=1200,900', # Use configured size later # '--disable-web-security', # Use with caution # '--disable-site-isolation-trials', # '--disable-features=IsolateOrigins,site-per-process', ] ) if self.context is None: existing_contexts = self.playwright_browser.contexts if existing_contexts and not self.config.cdp_url: # Reuse only if we launched it? Be careful. 
self.context = existing_contexts[0] logger.info("Reusing existing browser context.") else: logger.info("Creating new browser context.") self.context = await self.playwright_browser.new_context( viewport=self.config.viewport_size, user_agent='Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/108.0.0.0 Safari/537.36', java_script_enabled=True, bypass_csp=True, ignore_https_errors=True, storage_state=self.config.storage_state if self.config.storage_state else None ) await self._apply_anti_detection_scripts() # Apply only to new contexts self.context.on('page', self._on_page_change) # Attach listener if self.current_page is None: if len(self.context.pages) > 0: self.current_page = self.context.pages[-1] # Default to last open page logger.info(f"Using existing page: {self.current_page.url}") else: self.current_page = await self.context.new_page() logger.info("Created new page.") # Ensure viewport is applied regardless try: await self.current_page.set_viewport_size(self.config.viewport_size) except Exception as vp_err: logger.warning(f"Failed to set viewport: {vp_err}") if not self.current_page: raise BrowserError("Failed to get or create a page.") await self.get_cdp_session() # Initialize CDP session for current page except PlaywrightError as pe: logger.error(f"Playwright Error during browser init: {pe}", exc_info=True) await self.close(); raise BrowserError(f"Playwright initialization failed: {pe}") from pe except Exception as e: logger.error(f"Unexpected error during browser init: {e}", exc_info=True) await self.close(); raise BrowserError(f"Unexpected browser initialization failed: {e}") from e # --- Method Implementations (Ensure ALL referenced methods are defined) --- async def _apply_anti_detection_scripts(self): """Apply scripts to avoid detection as automation""" if self.context is None: return # Should not happen if called from _init_browser correctly try: await self.context.add_init_script( """ Object.defineProperty(navigator, 'webdriver', { get: () => undefined }); Object.defineProperty(navigator, 'languages', { get: () => ['en-US', 'en'] }); Object.defineProperty(navigator, 'plugins', { get: () => [] }); // Empty is safer // ... other scripts from previous version ... const originalQuery = window.navigator.permissions.query; window.navigator.permissions.query = (parameters) => ( parameters.name === 'notifications' ? Promise.resolve({ state: Notification.permission }) : originalQuery(parameters) ); """ ) logger.debug("Applied anti-detection init script.") except Exception as e: logger.error(f"Failed to add anti-detection init script: {e}", exc_info=True) async def _on_page_change(self, page: Page): """Handle page creation/popup events.""" # Don't automatically switch current page, just log logger.info(f'Page event detected. 
New/Popup URL: {page.url}') self._cdp_session = None # Invalidate CDP session as context changed async def get_current_page(self) -> Page: """Get the current page, ensuring browser is initialized.""" if self.current_page is None or self.current_page.is_closed(): logger.warning("Current page is None or closed, re-initializing.") await self._init_browser() if self.current_page is None: raise BrowserError("Unable to get a valid page.") return self.current_page # Inside Browser class in browser.py async def get_cdp_session(self): """Get or create a CDP session for the *current* page.""" page = await self.get_current_page() session_invalid = True # Assume invalid if self._cdp_session: # More robust check: try a simple CDP command to see if session is active try: # Example: Get cookies via CDP (relatively harmless check) await self._cdp_session.send("Network.getAllCookies") # Check if session page matches current page (using internal attr is risky) if hasattr(self._cdp_session, '_client') and hasattr(self._cdp_session._client, '_page') and self._cdp_session._client._page == page: session_invalid = False # Session seems alive and for the correct page else: logger.debug("CDP session page mismatch or internals unclear, recreating.") except Exception as session_check_err: logger.debug(f"Existing CDP session check failed ({session_check_err}), recreating.") session_invalid = True if session_invalid: try: if self.context is None: await self._init_browser() logger.debug(f"Attempting to create new CDP session for page: {page.url}") self._cdp_session = await self.context.new_cdp_session(page) logger.debug(f"Created new CDP session successfully.") except Exception as e: logger.error(f"Failed to create CDP session: {e}", exc_info=True) self._cdp_session = None raise BrowserError(f"Failed to create CDP session: {e}") from e return self._cdp_session @observe(name='browser.fast_screenshot', ignore_output=True) async def fast_screenshot(self) -> str: """Returns a base64 encoded screenshot using CDP.""" cdp_session = await self.get_cdp_session() try: screenshot_data = await cdp_session.send("Page.captureScreenshot", {"format": "png", "fromSurface": False, "captureBeyondViewport": False}) return screenshot_data["data"] except Exception as e: logger.error(f"Failed to capture screenshot via CDP: {e}") # Fallback to playwright's screenshot? Or raise error? page = await self.get_current_page() try: logger.warning("CDP screenshot failed, falling back to Playwright screenshot.") buffer = await page.screenshot() return base64.b64encode(buffer).decode() except Exception as pw_e: logger.error(f"Fallback Playwright screenshot also failed: {pw_e}") raise BrowserError(f"Failed to take screenshot: {e}") from e # --- Simple Action Methods --- @observe(name='browser.navigate_to') async def navigate_to(self, url: str): page = await self.get_current_page() logger.info(f"Navigating to: {url}") try: await page.goto(url, wait_until='domcontentloaded', timeout=60000) logger.info(f"Navigation successful. 
Current URL: {page.url}") except PlaywrightError as e: raise BrowserError(f"Navigation failed: {e}") from e except Exception as e: raise BrowserError(f"Navigation failed unexpectedly: {e}") from e @observe(name='browser.click') async def click(self, selector: str): page = await self.get_current_page() logger.info(f"Attempting to click element: '{selector}'") try: element = page.locator(selector).first await element.wait_for(state="visible", timeout=15000) await element.scroll_into_view_if_needed(timeout=10000) await element.click(timeout=15000, delay=50) logger.info(f"Successfully clicked element: '{selector}'") except PlaywrightError as e: raise BrowserError(f"Click action failed: {e}") from e except Exception as e: raise BrowserError(f"Click action failed unexpectedly: {e}") from e @observe(name='browser.type') async def type(self, selector: str, text: str): page = await self.get_current_page() log_text = '***' if 'password' in selector.lower() else text logger.info(f"Attempting to type into element: '{selector}', Text: '{log_text}'") try: element = page.locator(selector).first await element.wait_for(state="visible", timeout=15000) await element.scroll_into_view_if_needed(timeout=10000) await element.fill(text, timeout=15000) logger.info(f"Successfully typed into element: '{selector}'") except PlaywrightError as e: raise BrowserError(f"Type action failed: {e}") from e except Exception as e: raise BrowserError(f"Type action failed unexpectedly: {e}") from e @observe(name='browser.scroll') async def scroll(self, direction: str): page = await self.get_current_page() logger.info(f"Scrolling page {direction}") try: if direction == "down": await page.evaluate("window.scrollBy(0, window.innerHeight)") elif direction == "up": await page.evaluate("window.scrollBy(0, -window.innerHeight)") elif direction == "left": await page.evaluate("window.scrollBy(-window.innerWidth, 0)") elif direction == "right": await page.evaluate("window.scrollBy(window.innerWidth, 0)") else: logger.warning(f"Unknown scroll direction: {direction}"); return await asyncio.sleep(0.3) logger.info(f"Scrolled page {direction}") except PlaywrightError as e: raise BrowserError(f"Scroll action failed: {e}") from e except Exception as e: raise BrowserError(f"Scroll action failed unexpectedly: {e}") from e async def wait(self, milliseconds: int): logger.info(f"Waiting for {milliseconds} ms") if milliseconds <= 0: return await asyncio.sleep(milliseconds / 1000.0) logger.info("Wait finished") # --- Perception & State Methods --- async def get_content(self, max_length: int = 120000) -> str: """Gets comprehensive text representation: URL, DOM, AX Tree, VLM Elements.""" page = await self.get_current_page() logger.info("Getting comprehensive page content with vision...") combined_content = "" error_messages = [] current_url = "Unknown" screenshot_b64 = None try: current_url = page.url combined_content += f"# Page URL:\n{current_url}\n\n" try: screenshot_b64 = await self.fast_screenshot() logger.debug(f"Screenshot captured (size: {len(screenshot_b64) if screenshot_b64 else 0})") except Exception as ss_err: error_messages.append(f"Screenshot Error: {ss_err}"); logger.error("Screenshot error", exc_info=False); combined_content += "# Screenshot Error\n" try: if SIMPLIFY_PAGE_SCRIPT: simplified_dom = await page.evaluate(SIMPLIFY_PAGE_SCRIPT) if simplified_dom: combined_content += f"# Simplified DOM:\n```html\n{simplified_dom}\n```\n\n"; logger.debug(f"DOM length: {len(simplified_dom)}") else: combined_content += "# Simplified 
DOM:\n(Empty)\n\n"; logger.warning("JS simplification empty.") else: combined_content += "# Simplified DOM:\n(JS Script Error)\n\n"; logger.error("SIMPLIFY_PAGE_SCRIPT empty.") except Exception as js_err: error_messages.append(f"JS Error: {js_err}"); logger.error("JS Simp. Error", exc_info=False); combined_content += f"# Simplified DOM Error: {js_err}\n" try: ax_tree = await page.accessibility.snapshot(interesting_only=False) # No root arg if ax_tree: try: ax_tree_str = json.dumps(ax_tree, separators=(',', ':')) # Compact ax_max_len = 2000 if len(ax_tree_str) > ax_max_len: ax_tree_str = ax_tree_str[:ax_max_len] + "...(AX Tree truncated)" combined_content += f"# Accessibility Tree (JSON, Partial):\n```json\n{ax_tree_str}\n```\n\n"; logger.debug(f"AX Tree length: {len(ax_tree_str)}") except Exception as json_err: error_messages.append(f"AX JSON Error: {json_err}"); logger.error("AX JSON Error", exc_info=False); combined_content += "# AX Tree Error (JSON)\n" else: combined_content += "# Accessibility Tree:\n(Empty)\n\n"; logger.warning("AX snapshot empty.") except Exception as ax_err: error_messages.append(f"AX Tree Error: {ax_err}"); logger.error("AX Tree Error", exc_info=False); combined_content += f"# Accessibility Tree Error: {ax_err}\n" if self.detector and screenshot_b64: logger.info("Attempting visual detection via Detector...") try: detect_sheets = 'docs.google.com/spreadsheets/d' in current_url visual_elements = await self.detector.detect_from_image(screenshot_b64, detect_sheets) if visual_elements: formatted = [f"- ID: {el.browser_agent_id}, Box: [L:{el.rect.get('left',0)}, T:{el.rect.get('top',0)}, R:{el.rect.get('right',0)}, B:{el.rect.get('bottom',0)}] (Tag: {el.tag_name})" for el in visual_elements[:20]] combined_content += f"# Visual Elements (Detected via CV, Max 20):\n{chr(10).join(formatted)}\n\n"; logger.info(f"Added {len(formatted)} visual elements.") # Use chr(10) for newline else: combined_content += "# Visual Elements:\n(None detected or VLM error)\n\n"; logger.info("No visual elements detected.") except Exception as cv_err: error_messages.append(f"CV Error: {cv_err}"); logger.error("CV Detector Error", exc_info=True); combined_content += f"# Visual Elements Error: {cv_err}\n" else: if not self.detector: logger.info("CV Detector not available.") if not screenshot_b64: logger.info("Screenshot missing.") combined_content += "# Visual Elements:\n(Not Run)\n\n" if len(combined_content) > max_length: logger.warning(f"Combined content ({len(combined_content)}) exceeds limit ({max_length}). Truncating.") reserve = len("\n\n# Content Retrieval Errors:\n- ") + sum(len(str(e)) + 4 for e in error_messages) + 50 trunc_len = max(0, max_length - reserve); combined_content = combined_content[:trunc_len].rstrip() + "\n\n... 
(Content truncated)" if error_messages: combined_content += "\n\n# Content Retrieval Errors:\n- " + "\n- ".join(map(str, error_messages)) logger.info(f"Finished getting content (final length: {len(combined_content)})") return combined_content except Exception as e: logger.error(f"General error in get_content: {e}", exc_info=True); return f"# Page URL:\n{current_url}\n# Error:\nFailed to get content: {e}" # --- Other Methods from Original Code --- async def get_cookies(self) -> list[dict[str, Any]]: """Get cookies from the current browser context.""" if self.context: try: return await self.context.cookies() except Exception as e: logger.error(f"Failed to get cookies: {e}"); return [] return [] async def get_storage_state(self) -> dict[str, Any]: """Get storage state (currently only cookies) from the browser.""" # Playwright's get_storage_state includes local/session storage too, # but might require more careful handling or filtering if large. # Sticking to cookies for simplicity based on original user code structure. if self.context: try: # cookies = await self.context.cookies() # Redundant if get_cookies exists # return {'cookies': cookies} # Or use the full state function if available and needed state = await self.context.storage_state() return state except Exception as e: logger.error(f"Failed to get storage state: {e}") return {} return {} async def get_tabs_info(self) -> list[TabInfo]: """Get information about all open tabs in the current context.""" tabs_info = [] if not self.context: return [] try: # Ensure pages list is accessed correctly pages = self.context.pages for i, page in enumerate(pages): if not page.is_closed(): # Check if page is open try: url = page.url title = await page.title() # Ensure TabInfo model is available tabs_info.append(TabInfo(page_id=i, url=url, title=title)) except Exception as page_err: logger.warning(f"Failed to get info for tab {i}: {page_err}") # Add placeholder if needed? tabs_info.append(TabInfo(page_id=i, url="Error", title="Error retrieving info")) except Exception as e: logger.error(f"Failed to get tabs info: {e}") return tabs_info async def switch_to_tab(self, page_id: int) -> None: """Switch focus to a specific tab by its index.""" if self.context is None: await self._init_browser() pages = self.context.pages if not 0 <= page_id < len(pages): raise BrowserError(f'Invalid page_id: {page_id}. Available pages: {len(pages)}') if pages[page_id].is_closed(): raise BrowserError(f'Page with page_id {page_id} is closed.') logger.info(f"Switching to tab (page_id): {page_id}") self.current_page = pages[page_id] try: await self.current_page.bring_to_front() # Wait briefly for potential state changes after switch await self.current_page.wait_for_load_state('domcontentloaded', timeout=5000) except Exception as e: logger.warning(f"Error during tab switch finalization for page {page_id}: {e}") # Continue anyway, page is switched internally async def create_new_tab(self, url: str | None = None) -> None: """Create a new tab, optionally navigating to a URL, and switch to it.""" if self.context is None: await self._init_browser() logger.info(f"Creating new tab. Navigate to: {url if url else 'about:blank'}") try: new_page = await self.context.new_page() self.current_page = new_page # Switch focus to the new page if url: await self.navigate_to(url) # Reuse navigate method else: await new_page.wait_for_load_state('domcontentloaded') # Wait for about:blank load logger.info(f"Switched to new tab. 
URL: {self.current_page.url}") except Exception as e: logger.error(f"Failed to create new tab: {e}") raise BrowserError(f"Failed to create new tab: {e}") from e async def close_current_tab(self): """Close the currently focused tab.""" if self.current_page is None: logger.warning("No current page to close."); return if len(self.context.pages) <= 1: logger.warning("Cannot close the last remaining tab."); return # Prevent closing last tab? Or allow context close? logger.info(f"Closing current tab: {self.current_page.url}") page_to_close = self.current_page # Find index to switch to after closing (e.g., previous or first) pages = self.context.pages current_index = pages.index(page_to_close) if page_to_close in pages else -1 switch_to_index = 0 if current_index != 0 else 1 # Switch to first unless closing first if switch_to_index >= len(pages): switch_to_index = 0 # Fallback try: await page_to_close.close() logger.info("Tab closed.") # Need to wait briefly for context.pages to update sometimes await asyncio.sleep(0.1) # Switch to another tab if possible if self.context and self.context.pages: new_current_page = self.context.pages[min(switch_to_index, len(self.context.pages)-1)] self.current_page = new_current_page await self.current_page.bring_to_front() logger.info(f"Switched to tab index {min(switch_to_index, len(self.context.pages)-1)} after closing.") else: self.current_page = None # No pages left logger.info("Closed the last tab.") except Exception as e: logger.error(f"Error closing tab or switching: {e}") # Attempt to recover current page if possible if self.context and self.context.pages: self.current_page = self.context.pages[0] else: self.current_page = None async def refresh_page(self): """Refresh the current page.""" page = await self.get_current_page() logger.info(f"Refreshing page: {page.url}") try: await page.reload(wait_until='domcontentloaded') logger.info("Page refreshed.") except Exception as e: logger.error(f"Failed to refresh page: {e}") raise BrowserError(f"Failed to refresh page: {e}") from e async def go_forward(self): """Navigate forward in the current page's history.""" page = await self.get_current_page() logger.info(f"Going forward in history for: {page.url}") try: await page.go_forward(wait_until='domcontentloaded', timeout=10000) # Added timeout logger.info(f"Navigated forward. New URL: {page.url}") except Exception as e: # Often fails if no forward history exists, log as warning logger.warning(f'Failed to go forward (might be end of history): {e}') # raise BrowserError(f"Failed to go forward: {e}") from e # Option: re-raise if needed # --- State Update Methods (using CV potentially) --- def get_state(self) -> Optional[BrowserState]: """Get the last updated internal browser state.""" # Returns the state cached from the last update_state call logger.debug(f"Returning cached browser state (URL: {self._state.url if self._state else 'None'})") return self._state @observe(name='browser.update_state', ignore_output=True) async def update_state(self) -> BrowserState: """Update the internal browser state by re-evaluating the page (incl. 
CV if enabled)."""
        logger.info("Updating browser state...")
        try:
            self._state = await self._update_state()
            logger.info("Browser state updated successfully.")
            if not self._state:
                raise BrowserError("State update returned None unexpectedly.")  # Should not happen if _update_state raises
            return self._state
        except Exception as e:
            logger.error(f"Failed to update browser state: {e}", exc_info=True)
            # Decide whether to return old state or raise error
            # Raising error seems more appropriate if update fails
            raise BrowserError(f"Failed to update state: {e}") from e

    @observe(name='browser._update_state', ignore_output=True)
    async def _update_state(self) -> BrowserState:
        """Internal method to get comprehensive state with retry logic."""
        @retry(
            stop=stop_after_attempt(3),
            wait=wait_exponential(multiplier=0.5, min=0.5, max=2),
            retry=retry_if_exception_type(Exception),  # Retry on any exception during state fetch
            reraise=True  # Re-raise the exception after retries fail
        )
        async def get_stable_state():
            page = await self.get_current_page()  # Ensures page exists
            url = page.url
            detect_sheets = 'docs.google.com/spreadsheets/d' in url
            screenshot_b64 = await self.fast_screenshot()  # Get screenshot
            interactive_elements_data: Optional[InteractiveElementsData] = None

            # Get combined elements using CV if detector is enabled
            if self.detector and screenshot_b64:
                logger.debug("Getting interactive elements with CV...")
                interactive_elements_data = await self.get_interactive_elements_with_cv(screenshot_b64, detect_sheets)
            # Fallback to browser-only if detector disabled or screenshot failed
            elif INTERACTIVE_ELEMENTS_JS_CODE:  # Ensure JS code loaded
                logger.debug("Getting interactive elements with browser JS only...")
                interactive_elements_data = await self.get_interactive_elements_data()
            else:
                logger.error("Cannot get interactive elements: Detector disabled/failed and JS code missing.")
                interactive_elements_data = InteractiveElementsData(viewport={"width": 0, "height": 0}, elements=[])  # Return empty state

            # Check if interactive_elements_data is valid before proceeding
            if interactive_elements_data is None or not hasattr(interactive_elements_data, 'elements'):
                raise BrowserError("Failed to retrieve valid interactive elements data.")

            # Process elements into dictionary for state
            interactive_elements = {element.browser_agent_id: element for element in interactive_elements_data.elements}

            # Generate highlighted screenshot
            screenshot_with_highlights = None
            if screenshot_b64 and 'put_highlight_elements_on_screenshot' in globals():
                try:
                    screenshot_with_highlights = put_highlight_elements_on_screenshot(
                        list(interactive_elements.values()),  # Pass list of elements
                        screenshot_b64
                    )
                except Exception as high_err:
                    logger.warning(f"Failed to generate highlighted screenshot: {high_err}")

            # Get tab info
            tabs = await self.get_tabs_info()

            # Ensure BrowserState model is available (check globals() only: the name is a
            # module-level import, so a locals() check inside this function always fails)
            if 'BrowserState' not in globals():
                raise ImportError("BrowserState model is not defined or imported.")

            # Create and return the state object
            return BrowserState(
                url=url,
                tabs=tabs,
                screenshot_with_highlights=screenshot_with_highlights,
                screenshot=screenshot_b64,
                viewport=interactive_elements_data.viewport,  # Use viewport from data
                interactive_elements=interactive_elements,
            )

        # Execute the retry logic
        try:
            new_state = await get_stable_state()
            self._state = new_state  # Cache the new state
            return new_state
        except Exception as e:
            logger.error(f'Failed to update state after multiple attempts: {e}', exc_info=True)
            # Don't return potentially stale state; let the error propagate
            raise BrowserError(f"Failed to update state definitively: {e}") from e
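    # (Illustrative note, not part of the original file.) The equivalent standalone
    # tenacity pattern used by get_stable_state() above:
    #
    #   @retry(stop=stop_after_attempt(3),
    #          wait=wait_exponential(multiplier=0.5, min=0.5, max=2),
    #          reraise=True)
    #   async def fetch():
    #       ...  # any awaitable perception step; retried up to 3 times with backoff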
    @observe(name='browser.get_interactive_elements')
    async def get_interactive_elements_data(self) -> InteractiveElementsData:
        """Gets interactive elements using only in-browser JavaScript."""
        page = await self.get_current_page()
        if not INTERACTIVE_ELEMENTS_JS_CODE:
            logger.error("INTERACTIVE_ELEMENTS_JS_CODE is empty. Cannot get elements.")
            # Return a default empty structure
            vp = await page.viewport_size() or {"width": 0, "height": 0}
            return InteractiveElementsData(viewport=vp, elements=[])
        try:
            result = await page.evaluate(INTERACTIVE_ELEMENTS_JS_CODE)
            # Validate the basic structure of the result
            if not isinstance(result, dict) or 'viewport' not in result or 'elements' not in result:
                logger.error(f"JS evaluation returned unexpected structure: {type(result)}")
                vp = await page.viewport_size() or {"width": 0, "height": 0}
                return InteractiveElementsData(viewport=vp, elements=[])
            # Parse using the Pydantic model if it was imported successfully.
            # (Checking globals() alone: a module-level import never appears in
            # this function's locals().)
            if 'InteractiveElementsData' in globals():
                return InteractiveElementsData(**result)
            # Fallback if the model is missing (this indicates a setup error)
            logger.error("InteractiveElementsData model missing, returning raw dict.")
            return result  # type: ignore
        except Exception as e:
            logger.error(f"Error evaluating INTERACTIVE_ELEMENTS_JS_CODE: {e}", exc_info=True)
            vp = await page.viewport_size() or {"width": 0, "height": 0}
            return InteractiveElementsData(viewport=vp, elements=[])
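    # Design note (sketch only, using the same names as the surrounding code):
    # the method below starts the in-browser JS scan and the VLM detection as
    # separate tasks so the slow VLM call overlaps with the DOM scan instead of
    # running after it. An equivalent formulation with asyncio.gather would be:
    #
    #   browser_elements_data, cv_elements = await asyncio.gather(
    #       self.get_interactive_elements_data(),
    #       self.detector.detect_from_image(current_screenshot_b64, detect_sheets),
    #   )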
    @observe(name='browser.get_interactive_elements_with_cv')
    async def get_interactive_elements_with_cv(
        self,
        screenshot_b64: Optional[str] = None,
        detect_sheets: bool = False,
    ) -> InteractiveElementsData:
        """Combines browser JS element detection with VLM detection."""
        if self.detector is None:
            logger.warning("CV detector not available. Falling back to browser-only detection.")
            return await self.get_interactive_elements_data()

        # Ensure a screenshot exists
        current_screenshot_b64 = screenshot_b64 or await self.fast_screenshot()
        if not current_screenshot_b64:
            logger.error("Screenshot unavailable for CV detection.")
            return await self.get_interactive_elements_data()  # Fallback

        logger.debug("Getting combined browser + CV elements...")
        try:
            # Run browser JS detection and VLM detection concurrently
            browser_elements_data_task = asyncio.create_task(self.get_interactive_elements_data())
            cv_elements_task = asyncio.create_task(
                self.detector.detect_from_image(current_screenshot_b64, detect_sheets)
            )
            browser_elements_data = await browser_elements_data_task
            cv_elements = await cv_elements_task

            # Ensure results are valid before combining
            if not browser_elements_data or not hasattr(browser_elements_data, 'elements'):
                logger.warning("Browser element data invalid or missing for combine step.")
                browser_elements = []
                page = await self.get_current_page()
                viewport = await page.viewport_size() or {"width": 0, "height": 0}
            else:
                browser_elements = browser_elements_data.elements
                viewport = browser_elements_data.viewport  # Use the viewport from browser data

            if not isinstance(cv_elements, list):
                logger.warning("CV elements result is not a list.")
                cv_elements = []

            # Combine the two result sets using the utility function
            if 'combine_and_filter_elements' in globals():
                combined_elements = combine_and_filter_elements(browser_elements, cv_elements)
                logger.info(
                    f"Combined browser ({len(browser_elements)}) and CV ({len(cv_elements)}) "
                    f"elements into {len(combined_elements)}."
                )
            else:
                logger.error("combine_and_filter_elements utility function not found. Returning only browser elements.")
                combined_elements = browser_elements  # Fallback

            # Return the combined data in the expected structure
            if 'InteractiveElementsData' in globals():
                return InteractiveElementsData(viewport=viewport, elements=combined_elements)
            # This fallback is problematic: downstream code expects the model structure
            logger.error("InteractiveElementsData model missing, returning raw combined list.")
            return {"viewport": viewport, "elements": combined_elements}  # type: ignore
        except Exception as e:
            logger.error(f"Error during combined CV+Browser element detection: {e}", exc_info=True)
            # Fall back gracefully to browser-only detection if possible
            try:
                return await self.get_interactive_elements_data()
            except Exception:
                # Final fallback: an empty element set
                return InteractiveElementsData(viewport={"width": 0, "height": 0}, elements=[])


================================================
FILE: super_agents/browser_use/browser/detector.py
================================================
# super_agents/browser_use/browser/detector.py
import os
import json
import logging
import base64
from typing import List, Optional, Dict, Any

# LangChain Core imports
from langchain_core.messages import HumanMessage, SystemMessage
from langchain_core.runnables.base import RunnableSerializable

# Pydantic for the VLM output schema
try:
    from pydantic.v1 import BaseModel
except ImportError:
    from pydantic import BaseModel

from tenacity import (
    retry,
    retry_if_exception_type,
    stop_after_attempt,
    wait_exponential,
)

# Module logger, defined up front so the import fallbacks below can use it
# without a NameError. A basic config is applied in the fallback branches only,
# in case the main app has not configured logging yet.
logger = logging.getLogger(__name__)

# Local imports (ensure they exist)
try:
    from .observe_helper import observe
except ImportError:
    def observe(name, ignore_input=False, ignore_output=False):
        def decorator(func):
            return func
        return decorator

    logging.basicConfig(level=logging.WARNING)
    logger.warning("observe_helper not found, using dummy decorator.")

try:
    from .models import InteractiveElement

    # Expected VLM output schema. It could instead be imported from
    # agent.schemas; it is defined here for clarity in this step.
    class VLMJsonOutput(BaseModel):
        detected_elements: List[Dict[str, Any]] = []
except ImportError:
    class InteractiveElement:
        pass

    class VLMJsonOutput(BaseModel):
        detected_elements: List = []

    logging.basicConfig(level=logging.WARNING)
    logger.error("Failed to import InteractiveElement or define VLMJsonOutput! Detector parsing will fail.")

# Import the ChatOpenRouter class from the updated llm.py.
# Adjust the path if llm.py lives elsewhere relative to detector.py.
try:
    from ..llm import ChatOpenRouter  # Assumes llm.py is one level up
except ImportError:
    logger.error("Failed to import ChatOpenRouter from ..llm. Ensure llm.py is in the parent directory.")

    # Dummy class so the module still loads; detection will not work with it
    class ChatOpenRouter:
        pass

# --- VLM Configuration (read by the detector's __init__ via ChatOpenRouter) ---
VLM_API_MODEL = os.getenv("VLM_API_MODEL", "openai/gpt-4o")  # Desired VLM model, from .env

# --- VLM Prompt Template ---
VLM_PROMPT_TEMPLATE = """
Analyze the provided screenshot of a webpage. Your task is to identify all significant interactive elements visible on the screen.

Interactive elements include: buttons, links (<a> tags), text input fields (<input type="text">, <input type="search">, etc.), password fields (<input type="password">), text areas (