Repository: HKUDS/DeepCode
Branch: main
Commit: b5c741ab572a
Files: 255
Total size: 2.0 MB

Directory structure:
gitextract_3wtguj4a/

├── .dockerignore
├── .gitattributes
├── .github/
│   ├── ISSUE_TEMPLATE/
│   │   ├── bug_report.yml
│   │   ├── config.yml
│   │   ├── feature_request.yml
│   │   └── question.yml
│   ├── dependabot.yml
│   ├── pull_request_template.md
│   └── workflows/
│       ├── linting.yaml
│       └── pypi-publish.yml
├── .gitignore
├── .pre-commit-config.yaml
├── CHANGELOG.md
├── LICENSE
├── MANIFEST.in
├── README.md
├── README_ZH.md
├── __init__.py
├── cli/
│   ├── __init__.py
│   ├── cli_app.py
│   ├── cli_interface.py
│   ├── cli_launcher.py
│   ├── main_cli.py
│   └── workflows/
│       ├── __init__.py
│       └── cli_workflow_adapter.py
├── config/
│   ├── mcp_tool_definitions.py
│   └── mcp_tool_definitions_index.py
├── deepcode.py
├── deepcode_docker/
│   ├── .dockerignore
│   ├── Dockerfile
│   ├── docker-compose.yml
│   ├── docker-entrypoint.sh
│   └── run_docker.sh
├── mcp_agent.config.yaml
├── mcp_agent.secrets.yaml.example
├── nanobot/
│   ├── .dockerignore
│   ├── .gitignore
│   ├── COMMUNICATION.md
│   ├── Dockerfile
│   ├── LICENSE
│   ├── README.md
│   ├── SECURITY.md
│   ├── bridge/
│   │   ├── package.json
│   │   ├── src/
│   │   │   ├── index.ts
│   │   │   ├── server.ts
│   │   │   ├── types.d.ts
│   │   │   └── whatsapp.ts
│   │   └── tsconfig.json
│   ├── core_agent_lines.sh
│   ├── nanobot/
│   │   ├── __init__.py
│   │   ├── __main__.py
│   │   ├── agent/
│   │   │   ├── __init__.py
│   │   │   ├── context.py
│   │   │   ├── loop.py
│   │   │   ├── memory.py
│   │   │   ├── skills.py
│   │   │   ├── subagent.py
│   │   │   └── tools/
│   │   │       ├── __init__.py
│   │   │       ├── base.py
│   │   │       ├── cron.py
│   │   │       ├── deepcode.py
│   │   │       ├── filesystem.py
│   │   │       ├── message.py
│   │   │       ├── registry.py
│   │   │       ├── shell.py
│   │   │       ├── spawn.py
│   │   │       └── web.py
│   │   ├── bus/
│   │   │   ├── __init__.py
│   │   │   ├── events.py
│   │   │   └── queue.py
│   │   ├── channels/
│   │   │   ├── __init__.py
│   │   │   ├── base.py
│   │   │   ├── dingtalk.py
│   │   │   ├── discord.py
│   │   │   ├── email.py
│   │   │   ├── feishu.py
│   │   │   ├── manager.py
│   │   │   ├── qq.py
│   │   │   ├── slack.py
│   │   │   ├── telegram.py
│   │   │   └── whatsapp.py
│   │   ├── cli/
│   │   │   ├── __init__.py
│   │   │   └── commands.py
│   │   ├── config/
│   │   │   ├── __init__.py
│   │   │   ├── loader.py
│   │   │   └── schema.py
│   │   ├── cron/
│   │   │   ├── __init__.py
│   │   │   ├── service.py
│   │   │   └── types.py
│   │   ├── heartbeat/
│   │   │   ├── __init__.py
│   │   │   └── service.py
│   │   ├── providers/
│   │   │   ├── __init__.py
│   │   │   ├── base.py
│   │   │   ├── litellm_provider.py
│   │   │   ├── registry.py
│   │   │   └── transcription.py
│   │   ├── session/
│   │   │   ├── __init__.py
│   │   │   └── manager.py
│   │   ├── skills/
│   │   │   ├── README.md
│   │   │   ├── cron/
│   │   │   │   └── SKILL.md
│   │   │   ├── deepcode/
│   │   │   │   └── SKILL.md
│   │   │   ├── github/
│   │   │   │   └── SKILL.md
│   │   │   ├── skill-creator/
│   │   │   │   └── SKILL.md
│   │   │   ├── summarize/
│   │   │   │   └── SKILL.md
│   │   │   ├── tmux/
│   │   │   │   ├── SKILL.md
│   │   │   │   └── scripts/
│   │   │   │       ├── find-sessions.sh
│   │   │   │       └── wait-for-text.sh
│   │   │   └── weather/
│   │   │       └── SKILL.md
│   │   └── utils/
│   │       ├── __init__.py
│   │       └── helpers.py
│   ├── pyproject.toml
│   ├── run_nanobot.sh
│   └── workspace/
│       ├── AGENTS.md
│       ├── HEARTBEAT.md
│       ├── SOUL.md
│       ├── TOOLS.md
│       ├── USER.md
│       └── memory/
│           └── MEMORY.md
├── nanobot_config.json.example
├── new_ui/
│   ├── README.md
│   ├── backend/
│   │   ├── __init__.py
│   │   ├── api/
│   │   │   ├── __init__.py
│   │   │   ├── routes/
│   │   │   │   ├── __init__.py
│   │   │   │   ├── config.py
│   │   │   │   ├── files.py
│   │   │   │   ├── requirements.py
│   │   │   │   └── workflows.py
│   │   │   └── websockets/
│   │   │       ├── __init__.py
│   │   │       ├── code_stream_ws.py
│   │   │       ├── logs_ws.py
│   │   │       └── workflow_ws.py
│   │   ├── app_utils/
│   │   │   └── __init__.py
│   │   ├── main.py
│   │   ├── models/
│   │   │   ├── __init__.py
│   │   │   ├── requests.py
│   │   │   └── responses.py
│   │   ├── services/
│   │   │   ├── __init__.py
│   │   │   ├── requirement_service.py
│   │   │   ├── session_service.py
│   │   │   └── workflow_service.py
│   │   └── settings.py
│   ├── frontend/
│   │   ├── index.html
│   │   ├── package.json
│   │   ├── postcss.config.js
│   │   ├── src/
│   │   │   ├── App.tsx
│   │   │   ├── components/
│   │   │   │   ├── common/
│   │   │   │   │   ├── Button.tsx
│   │   │   │   │   ├── Card.tsx
│   │   │   │   │   ├── ConfirmDialog.tsx
│   │   │   │   │   ├── GuardedLink.tsx
│   │   │   │   │   ├── TaskRecoveryBanner.tsx
│   │   │   │   │   ├── Toaster.tsx
│   │   │   │   │   └── index.ts
│   │   │   │   ├── input/
│   │   │   │   │   ├── ChatInput.tsx
│   │   │   │   │   ├── FileUploader.tsx
│   │   │   │   │   ├── UrlInput.tsx
│   │   │   │   │   └── index.ts
│   │   │   │   ├── interaction/
│   │   │   │   │   ├── InlineChatInteraction.tsx
│   │   │   │   │   ├── InteractionPanel.tsx
│   │   │   │   │   └── index.ts
│   │   │   │   ├── layout/
│   │   │   │   │   ├── Header.tsx
│   │   │   │   │   ├── Layout.tsx
│   │   │   │   │   ├── Sidebar.tsx
│   │   │   │   │   └── index.ts
│   │   │   │   ├── results/
│   │   │   │   │   ├── CodePreview.tsx
│   │   │   │   │   ├── FileTree.tsx
│   │   │   │   │   └── index.ts
│   │   │   │   ├── streaming/
│   │   │   │   │   ├── ActivityLogViewer.tsx
│   │   │   │   │   ├── CodeStreamViewer.tsx
│   │   │   │   │   ├── LogViewer.tsx
│   │   │   │   │   ├── ProgressTracker.tsx
│   │   │   │   │   └── index.ts
│   │   │   │   └── workflow/
│   │   │   │       ├── WorkflowCanvas.tsx
│   │   │   │       ├── WorkflowNode.tsx
│   │   │   │       └── index.ts
│   │   │   ├── hooks/
│   │   │   │   ├── index.ts
│   │   │   │   ├── useAdaptiveLayout.ts
│   │   │   │   ├── useNavigationGuard.ts
│   │   │   │   ├── useStreaming.ts
│   │   │   │   ├── useTaskRecovery.ts
│   │   │   │   └── useWebSocket.ts
│   │   │   ├── index.css
│   │   │   ├── main.tsx
│   │   │   ├── pages/
│   │   │   │   ├── ChatPlanningPage.tsx
│   │   │   │   ├── HomePage.tsx
│   │   │   │   ├── PaperToCodePage.tsx
│   │   │   │   ├── SettingsPage.tsx
│   │   │   │   ├── WorkflowEditorPage.tsx
│   │   │   │   └── index.ts
│   │   │   ├── services/
│   │   │   │   └── api.ts
│   │   │   ├── stores/
│   │   │   │   ├── index.ts
│   │   │   │   ├── sessionStore.ts
│   │   │   │   └── workflowStore.ts
│   │   │   └── types/
│   │   │       ├── api.ts
│   │   │       ├── common.ts
│   │   │       ├── index.ts
│   │   │       └── workflow.ts
│   │   ├── tailwind.config.js
│   │   ├── tsconfig.json
│   │   ├── tsconfig.node.json
│   │   └── vite.config.ts
│   └── scripts/
│       ├── build.sh
│       └── start_dev.sh
├── prompts/
│   └── code_prompts.py
├── requirements.txt
├── run.bat
├── run.sh
├── schema/
│   └── mcp-agent.config.schema.json
├── setup.py
├── tools/
│   ├── __init__.py
│   ├── bocha_search_server.py
│   ├── code_implementation_server.py
│   ├── code_indexer.py
│   ├── code_reference_indexer.py
│   ├── command_executor.py
│   ├── document_segmentation_server.py
│   ├── git_command.py
│   ├── indexer_config.yaml
│   ├── pdf_converter.py
│   ├── pdf_downloader.py
│   └── pdf_utils.py
├── ui/
│   ├── __init__.py
│   ├── app.py
│   ├── components.py
│   ├── handlers.py
│   ├── layout.py
│   ├── sidebar_feed.py
│   ├── streamlit_app.py
│   └── styles.py
├── utils/
│   ├── __init__.py
│   ├── cli_interface.py
│   ├── cross_platform_file_handler.py
│   ├── dialogue_logger.py
│   ├── file_processor.py
│   ├── llm_utils.py
│   ├── loop_detector.py
│   ├── model_limits.py
│   └── simple_llm_logger.py
└── workflows/
    ├── __init__.py
    ├── agent_orchestration_engine.py
    ├── agents/
    │   ├── __init__.py
    │   ├── code_implementation_agent.py
    │   ├── document_segmentation_agent.py
    │   ├── memory_agent_concise.py
    │   ├── memory_agent_concise_index.py
    │   ├── memory_agent_concise_multi.py
    │   └── requirement_analysis_agent.py
    ├── code_implementation_workflow.py
    ├── code_implementation_workflow_index.py
    ├── codebase_index_workflow.py
    └── plugins/
        ├── USAGE.md
        ├── __init__.py
        ├── base.py
        ├── integration.py
        ├── plan_review.py
        └── requirement_analysis.py

================================================
FILE CONTENTS
================================================

================================================
FILE: .dockerignore
================================================
# Git
.git
.gitignore

# Node
new_ui/frontend/node_modules
new_ui/frontend/dist

# Python
__pycache__
*.pyc
*.pyo
*.egg-info
.eggs
dist
build

# Virtual environments
.venv
venv
env

# IDE
.vscode
.idea
.cursor
*.swp
*.swo

# Runtime data
deepcode_lab
uploads
logs
*.log

# Docker
deepcode_docker/Dockerfile
deepcode_docker/docker-compose.yml
deepcode_docker/.dockerignore
deepcode_docker/run_docker.sh

# Documentation
assets
*.md
LICENSE


================================================
FILE: .gitattributes
================================================
# Force LF line endings for shell scripts (prevents CRLF issues in Docker)
*.sh text eol=lf
docker-entrypoint.sh text eol=lf


================================================
FILE: .github/ISSUE_TEMPLATE/bug_report.yml
================================================
name: Bug Report
description: File a bug report
title: "[Bug]:"
labels: ["bug", "triage"]

body:
  - type: checkboxes
    id: existingcheck
    attributes:
      label: Do you need to file an issue?
      description: Please help us manage our time by avoiding duplicates and common bugs with the steps below.
      options:
        - label: I have searched the existing issues and this bug is not already filed.
        - label: I believe this is a legitimate bug, not just a question or feature request.
  - type: textarea
    id: description
    attributes:
      label: Describe the bug
      description: A clear and concise description of what the bug is.
      placeholder: What went wrong?
  - type: textarea
    id: reproduce
    attributes:
      label: Steps to reproduce
      description: Steps to reproduce the behavior.
      placeholder: How can we replicate the issue?
  - type: textarea
    id: expected_behavior
    attributes:
      label: Expected Behavior
      description: A clear and concise description of what you expected to happen.
      placeholder: What should have happened?
  - type: textarea
    id: configused
    attributes:
      label: DeepCode Config Used
      description: The DeepCode configuration used for the run.
      placeholder: The settings content or DeepCode configuration
      value: |
        # Paste your config here
  - type: textarea
    id: screenshotslogs
    attributes:
      label: Logs and screenshots
      description: If applicable, add screenshots and logs to help explain your problem.
      placeholder: Add logs and screenshots here
  - type: textarea
    id: additional_information
    attributes:
      label: Additional Information
      description: |
        - DeepCode Version: e.g., v0.1.1
        - Operating System: e.g., Windows 10, Ubuntu 20.04
        - Python Version: e.g., 3.8
        - Related Issues: e.g., #1
        - Any other relevant information.
      value: |
        - DeepCode Version:
        - Operating System:
        - Python Version:
        - Related Issues:


================================================
FILE: .github/ISSUE_TEMPLATE/config.yml
================================================
blank_issues_enabled: false


================================================
FILE: .github/ISSUE_TEMPLATE/feature_request.yml
================================================
name: Feature Request
description: File a feature request
labels: ["enhancement"]
title: "[Feature Request]:"

body:
  - type: checkboxes
    id: existingcheck
    attributes:
      label: Do you need to file a feature request?
      description: Please help us manage our time by avoiding duplicates and common feature requests with the steps below.
      options:
        - label: I have searched the existing feature requests and this feature request is not already filed.
        - label: I believe this is a legitimate feature request, not just a question or bug.
  - type: textarea
    id: feature_request_description
    attributes:
      label: Feature Request Description
      description: A clear and concise description of the feature request you would like.
      placeholder: What does this feature request add or improve?
  - type: textarea
    id: additional_context
    attributes:
      label: Additional Context
      description: Add any other context or screenshots about the feature request here.
      placeholder: Any additional information


================================================
FILE: .github/ISSUE_TEMPLATE/question.yml
================================================
name: Question
description: Ask a general question
labels: ["question"]
title: "[Question]:"

body:
  - type: checkboxes
    id: existingcheck
    attributes:
      label: Do you need to ask a question?
      description: Please help us manage our time by avoiding duplicates and common questions with the steps below.
      options:
        - label: I have searched the existing questions and discussions and this question has not already been answered.
        - label: I believe this is a legitimate question, not just a bug or feature request.
  - type: textarea
    id: question
    attributes:
      label: Your Question
      description: A clear and concise description of your question.
      placeholder: What is your question?
  - type: textarea
    id: context
    attributes:
      label: Additional Context
      description: Provide any additional context or details that might help us understand your question better.
      placeholder: Add any relevant information here


================================================
FILE: .github/dependabot.yml
================================================
# To get started with Dependabot version updates, you'll need to specify which
# package ecosystems to update and where the package manifests are located.
# Please see the documentation for all configuration options:
# https://docs.github.com/code-security/dependabot/dependabot-version-updates/configuration-options-for-the-dependabot.yml-file

version: 2
updates:
  - package-ecosystem: "pip" # See documentation for possible values
    directory: "/" # Location of package manifests
    schedule:
      interval: "weekly"


================================================
FILE: .github/pull_request_template.md
================================================
<!--
Thanks for contributing to DeepCode!

Please ensure your pull request is ready for review before submitting.

About this template

This template helps contributors provide a clear and concise description of their changes. Feel free to adjust it as needed.
-->

## Description

[Briefly describe the changes made in this pull request.]

## Related Issues

[Reference any related issues or tasks addressed by this pull request.]

## Changes Made

[List the specific changes made in this pull request.]

## Checklist

- [ ] Changes tested locally
- [ ] Code reviewed
- [ ] Documentation updated (if necessary)
- [ ] Unit tests added (if applicable)

## Additional Notes

[Add any additional notes or context for the reviewer(s).]


================================================
FILE: .github/workflows/linting.yaml
================================================
name: Linting and Formatting

on:
    push:
        branches:
            - main
    pull_request:
        branches:
            - main

jobs:
    lint-and-format:
        runs-on: ubuntu-latest

        steps:
            - name: Checkout code
              uses: actions/checkout@v2

            - name: Set up Python
              uses: actions/setup-python@v2
              with:
                python-version: '3.x'

            - name: Install dependencies
              run: |
                python -m pip install --upgrade pip
                pip install pre-commit

            - name: Run pre-commit
              run: pre-commit run --all-files --show-diff-on-failure


================================================
FILE: .github/workflows/pypi-publish.yml
================================================
name: Upload DeepCode Package

on:
  release:
    types: [published]

permissions:
  contents: read

jobs:
  release-build:
    runs-on: ubuntu-latest

    steps:
      - uses: actions/checkout@v4

      - uses: actions/setup-python@v5
        with:
          python-version: "3.x"

      - name: Build release distributions
        run: |
          python -m pip install build
          python -m build

      - name: Upload distributions
        uses: actions/upload-artifact@v4
        with:
          name: release-dists
          path: dist/

  pypi-publish:
    runs-on: ubuntu-latest
    needs:
      - release-build
    permissions:
      id-token: write

    environment:
      name: pypi

    steps:
      - name: Retrieve release distributions
        uses: actions/download-artifact@v4
        with:
          name: release-dists
          path: dist/

      - name: Publish release distributions to PyPI
        uses: pypa/gh-action-pypi-publish@release/v1
        with:
          packages-dir: dist/


================================================
FILE: .gitignore
================================================
# Python-related files
__pycache__/
*.py[cod]
*.egg-info/
.eggs/
*.tgz
*.tar.gz
*.ini

# Virtual Environment
.venv/
env/
venv/
*.env*
.env_example


# Build / Distribution
dist/
build/
site/

# Logs / Reports
*.log
*.log.*
*.logfire
*.coverage/
log/
logs/

# Node
node_modules/

# Caches
.cache/
.mypy_cache/
.pytest_cache/
.ruff_cache/
.gradio/
.history/
temp/

# IDE / Editor Files
.idea/
.vscode/
.vscode/settings.json

# Framework-specific files
local_neo4jWorkDir/
neo4jWorkDir/

# Data & Storage
inputs/
rag_storage/
examples/input/
examples/output/
deepcode-mcp/agent_folders

# Miscellaneous
.DS_Store
TODO.md
ignore_this.txt
*.ignore.*

# unit-test files
test_*
run_indexer_with_filtering.py

# Cline files
memory-bank/

# project files
deepcode_lab/

# secrets (use .env or environment variables instead)
mcp_agent.secrets.yaml
nanobot_config.json


================================================
FILE: .pre-commit-config.yaml
================================================
repos:
  - repo: https://github.com/pre-commit/pre-commit-hooks
    rev: v5.0.0
    hooks:
      - id: trailing-whitespace
      - id: end-of-file-fixer
      - id: requirements-txt-fixer


  - repo: https://github.com/astral-sh/ruff-pre-commit
    rev: v0.6.4
    hooks:
      - id: ruff-format
      - id: ruff
        args: [--fix, --ignore=E402]

  - repo: https://github.com/mgedmin/check-manifest
    rev: "0.49"
    hooks:
      - id: check-manifest
        stages: [manual]


================================================
FILE: CHANGELOG.md
================================================
# Changelog

All notable changes to DeepCode will be documented in this file.

## [1.0.6-jm] - 2025-10-19

### Added
- **Dynamic Model Limit Detection**: New `utils/model_limits.py` module that automatically detects and adapts to any LLM model's token limits and pricing
- **Loop Detection System**: `utils/loop_detector.py` prevents infinite loops by detecting repeated tool calls, timeouts, and progress stalls
- **Progress Tracking**: 8-phase progress tracking (5% → 100%) with file-level progress indicators in both UI and terminal
- **Abort Mechanism**: "Stop Processing" button in UI with global abort flag for clean process termination
- **Cache Cleanup Scripts**: `start_clean.bat` and `start_clean.ps1` to clear Python cache before starting
- **Enhanced Error Display**: Real-time error messages in both UI and terminal with timestamps
- **File Progress Tracking**: Shows files completed/total with estimated time remaining

### Fixed
- **Critical: False Error Detection**: Fixed overly aggressive error detection that was marking successful operations as failures, causing premature abort and empty file generation
- **Critical: Empty File Generation**: Files now contain actual code instead of being empty (2-byte files)
- **Unique Folder Naming**: Each project run now creates `paper_{timestamp}` folders instead of reusing `pdf_output`
- **PDF Save Location**: PDFs now save to `deepcode_lab/papers/` instead of system temp directory
- **Duplicate Folder Prevention**: Added session state caching to prevent duplicate folder creation on UI reruns
- **Token Limit Compliance**: Fixed `max_tokens` to respect model limits dynamically (e.g., gpt-4o-mini's 16,384 token limit)
- **Empty Plan Detection**: System now fails early with clear error messages when initial plan is empty or invalid
- **Process Hanging**: Fixed infinite loops and hanging on errors - process now exits cleanly
- **Token Cost Tracking**: Restored accurate token usage and cost display (was showing $0.0000)
- **PDF to Markdown Conversion**: Fixed automatic conversion and file location handling
- **Document Segmentation**: Properly uses configured 50K character threshold from `mcp_agent.config.yaml`
- **Error Propagation**: Abort mechanism now properly stops process after 10 consecutive real errors

### Changed
- **Model-Aware Token Management**: Token limits now adapt automatically based on configured model instead of hardcoded values
- **Cost Calculation**: Dynamic pricing based on actual model rates (OpenAI, Anthropic)
- **Retry Logic**: Token limits for retries now respect model maximum (87.5% → 95% → 98% of max)
- **Segmentation Workflow**: Better integration with code implementation phase
- **Error Handling**: Enhanced error propagation - errors no longer reported as "success"
- **UI Display**: Shows project folder name after PDF conversion for better visibility
- **Terminal Logging**: Added timestamps to all progress messages

### Technical Improvements
- Added document-segmentation server to code implementation workflow for better token management
- Improved error handling in agent orchestration engine with proper cleanup
- Enhanced subprocess handling on Windows (hide console windows, prevent hanging)
- Better LibreOffice detection on Windows using direct path checking
- Fixed input data format consistency (JSON with `paper_path` key)
- Added comprehensive logging throughout the pipeline
- Improved resource cleanup on errors and process termination

### Documentation
- Translated Chinese comments to English in core workflow files
- Added inline documentation for new utility modules
- Created startup scripts with clear usage instructions

### Breaking Changes
- None - all changes are backward compatible

### Known Issues
- Terminal may show trailing "Calling Tool..." line after completion (cosmetic display artifact - process completes successfully)
- Some Chinese comments remain in non-critical files (cli, tools) - translation in progress
- tiktoken package optional warning (doesn't affect functionality)

### Success Metrics
- ✅ Complete end-to-end workflow: DOCX upload → PDF conversion → Markdown → Segmentation → Planning → Code generation
- ✅ Files generated with actual code content (15+ files with proper implementation)
- ✅ Single folder per project run (no duplicates)
- ✅ Dynamic token management working across different models
- ✅ Accurate cost tracking per model
- ✅ Clean process termination with proper error handling

---

## [1.0.5] - Previous Release

See previous releases for earlier changes.


================================================
FILE: LICENSE
================================================
MIT License

Copyright (c) 2025 ✨Data Intelligence Lab@HKU✨

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: MANIFEST.in
================================================
include README.md
include LICENSE
include requirements.txt
include __init__.py
include *.png
include *.yaml
recursive-include config *.yaml
recursive-include prompts *
recursive-include schema *
recursive-include ui *.py
recursive-include cli *.py
recursive-include utils *.py
recursive-include tools *.py
recursive-include workflows *.py
global-exclude *.pyc
global-exclude .git*
global-exclude .history*
global-exclude .ruff_cache*
global-exclude __pycache__*


================================================
FILE: README.md
================================================
<div align="center">

<table style="border: none; margin: 0 auto; padding: 0; border-collapse: collapse;">
<tr>
<td align="center" style="vertical-align: middle; padding: 10px; border: none; width: 250px;">
  <img src="assets/logo.png" alt="DeepCode Logo" width="200" style="margin: 0; padding: 0; display: block;"/>
</td>
<td align="left" style="vertical-align: middle; padding: 10px 0 10px 30px; border: none;">
  <pre style="font-family: 'Courier New', monospace; font-size: 16px; color: #0EA5E9; margin: 0; padding: 0; text-shadow: 0 0 10px #0EA5E9, 0 0 20px rgba(14,165,233,0.5); line-height: 1.2; transform: skew(-1deg, 0deg); display: block;">    ██████╗ ███████╗███████╗██████╗  ██████╗ ██████╗ ██████╗ ███████╗
    ██╔══██╗██╔════╝██╔════╝██╔══██╗██╔════╝██╔═══██╗██╔══██╗██╔════╝
    ██║  ██║█████╗  █████╗  ██████╔╝██║     ██║   ██║██║  ██║█████╗
    ██║  ██║██╔══╝  ██╔══╝  ██╔═══╝ ██║     ██║   ██║██║  ██║██╔══╝
    ██████╔╝███████╗███████╗██║     ╚██████╗╚██████╔╝██████╔╝███████╗
    ╚═════╝ ╚══════╝╚══════╝╚═╝      ╚═════╝ ╚═════╝ ╚═════╝ ╚══════╝</pre>
</td>
</tr>
</table>

<div align="center">
<a href="https://trendshift.io/repositories/14665" target="_blank"><img src="https://trendshift.io/api/badge/repositories/14665" alt="HKUDS%2FDeepCode | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
</div>

<!-- <img src="https://readme-typing-svg.herokuapp.com?font=Russo+One&size=28&duration=2000&pause=800&color=06B6D4&background=00000000&center=true&vCenter=true&width=800&height=50&lines=%E2%9A%A1+OPEN+AGENTIC+CODING+%E2%9A%A1" alt="DeepCode Tech Subtitle" style="margin-top: 5px; filter: drop-shadow(0 0 12px #06B6D4) drop-shadow(0 0 24px rgba(6,182,212,0.4));"/> -->

# <img src="https://github.com/Zongwei9888/Experiment_Images/raw/43c585dca3d21b8e4b6390d835cdd34dc4b4b23d/DeepCode_images/title_logo.svg" alt="DeepCode Logo" width="32" height="32" style="vertical-align: middle; margin-right: 8px;"/> DeepCode: Open Agentic Coding

### *Advancing Code Generation with Multi-Agent Systems*

<!-- <p align="center">
  <img src="https://img.shields.io/badge/Version-1.0.0-00d4ff?style=for-the-badge&logo=rocket&logoColor=white" alt="Version">

  <img src="https://img.shields.io/badge/License-MIT-4ecdc4?style=for-the-badge&logo=opensourceinitiative&logoColor=white" alt="License">
  <img src="https://img.shields.io/badge/AI-Multi--Agent-9b59b6?style=for-the-badge&logo=brain&logoColor=white" alt="AI">
  <img src="https://img.shields.io/badge/HKU-Data_Intelligence_Lab-f39c12?style=for-the-badge&logo=university&logoColor=white" alt="HKU">
</p> -->
<p>
  <a href="https://github.com/HKUDS/DeepCode/stargazers"><img src='https://img.shields.io/github/stars/HKUDS/DeepCode?color=00d9ff&style=for-the-badge&logo=star&logoColor=white&labelColor=1a1a2e' /></a>
  <a href='https://arxiv.org/abs/2512.07921'><img src="https://img.shields.io/badge/Paper-arXiv-orange?style=for-the-badge&logo=arxiv&logoColor=white&labelColor=1a1a2e"></a>
  <img src="https://img.shields.io/badge/🐍Python-3.13-4ecdc4?style=for-the-badge&logo=python&logoColor=white&labelColor=1a1a2e">
  <!-- <a href="https://pypi.org/project/deepcode-hku/"><img src="https://img.shields.io/pypi/v/deepcode-hku.svg?style=for-the-badge&logo=pypi&logoColor=white&labelColor=1a1a2e&color=ff6b6b"></a> -->
</p>
<p>
  <a href="https://discord.gg/yF2MmDJyGJ"><img src="https://img.shields.io/badge/💬Discord-Community-7289da?style=for-the-badge&logo=discord&logoColor=white&labelColor=1a1a2e"></a>
  <a href="https://github.com/HKUDS/DeepCode/issues/11"><img src="https://img.shields.io/badge/💬WeChat-Group-07c160?style=for-the-badge&logo=wechat&logoColor=white&labelColor=1a1a2e"></a>
</p>
<div align="center">
  <div style="width: 100%; height: 2px; margin: 20px 0; background: linear-gradient(90deg, transparent, #00d9ff, transparent);"></div>
</div>

<div align="center">
  <a href="#-quick-start" style="text-decoration: none;">
    <img src="https://img.shields.io/badge/Quick%20Start-Get%20Started%20Now-00d9ff?style=for-the-badge&logo=rocket&logoColor=white&labelColor=1a1a2e">
  </a>
</div>

<div align="center" style="margin-top: 10px;">
  <a href="README.md">
    <img src="https://img.shields.io/badge/English-00d4ff?style=for-the-badge&logo=readme&logoColor=white&labelColor=1a1a2e" alt="English">
  </a>
  <a href="README_ZH.md">
    <img src="https://img.shields.io/badge/中文-00d4ff?style=for-the-badge&logo=readme&logoColor=white&labelColor=1a1a2e" alt="中文">
  </a>
</div>

### 🖥️ **Interface Showcase**

<table align="center" width="100%" style="border: none; border-collapse: collapse; margin: 30px 0;">
<tr>
<td width="50%" align="center" style="vertical-align: top; padding: 20px;">

#### 🖥️ **CLI Interface**
**Terminal-Based Development**

<div align="center">

  <img src="https://github.com/Zongwei9888/Experiment_Images/raw/8882a7313c504ca97ead6e7b36c51aa761b6a4f3/DeepCode_images/CLI.gif" alt="CLI Interface Demo" width="100%" style="border-radius: 10px; box-shadow: 0 8px 20px rgba(45,55,72,0.3); margin: 15px 0;"/>

  <div style="background: linear-gradient(135deg, #2D3748 0%, #4A5568 100%); border-radius: 12px; padding: 15px; margin: 15px 0; color: white;">
    <strong>🚀 Advanced Terminal Experience</strong><br/>
    <small>⚡ Fast command-line workflow<br/>🔧 Developer-friendly interface<br/>📊 Real-time progress tracking</small>
  </div>

  *Professional terminal interface for advanced users and CI/CD integration*
</div>

</td>
<td width="50%" align="center" style="vertical-align: top; padding: 20px;">

#### 🌐 **Web Interface**
**Visual Interactive Experience**

<div align="center">

  <img src="https://github.com/Zongwei9888/Experiment_Images/raw/8882a7313c504ca97ead6e7b36c51aa761b6a4f3/DeepCode_images/UI.gif" alt="Web Interface Demo" width="100%" style="border-radius: 10px; box-shadow: 0 8px 20px rgba(14,165,233,0.3); margin: 15px 0;"/>

  <div style="background: linear-gradient(135deg, #0EA5E9 0%, #00D4FF 100%); border-radius: 12px; padding: 15px; margin: 15px 0; color: white;">
    <strong>🎨 Modern Web Dashboard</strong><br/>
    <small>🖱️ Intuitive drag-and-drop<br/>📱 Responsive design<br/>🎯 Visual progress tracking</small>
  </div>

  *Beautiful web interface with streamlined workflow for all skill levels*
</div>

</td>
</tr>
</table>

---

<div align="center">

### 🎬 **Introduction Video**

<div style="margin: 20px 0;">
  <a href="https://youtu.be/PRgmP8pOI08" target="_blank">
    <img src="https://img.youtube.com/vi/PRgmP8pOI08/maxresdefault.jpg"
         alt="DeepCode Introduction Video"
         width="75%"
         style="border-radius: 12px; box-shadow: 0 8px 25px rgba(0,0,0,0.15); transition: transform 0.3s ease;"/>
  </a>
</div>

*🎯 **Watch our complete introduction** - See how DeepCode transforms research papers and natural language into production-ready code*

<p>
  <a href="https://youtu.be/PRgmP8pOI08" target="_blank">
    <img src="https://img.shields.io/badge/▶️_Watch_Video-FF0000?style=for-the-badge&logo=youtube&logoColor=white" alt="Watch Video"/>
  </a>
</p>

</div>

---


> *"Where AI Agents Transform Ideas into Production-Ready Code"*

</div>

---

## 📑 Table of Contents

- [📰 News](#-news)
- [🚀 Key Features](#-key-features)
- [🏗️ Architecture](#️-architecture)
- [📊 Experimental Results](#-experimental-results)
- [🚀 Quick Start](#-quick-start)
- [🤖 nanobot Integration (Feishu Chatbot)](#-nanobot-integration-feishu-chatbot)
- [💡 Examples](#-examples)
  - [🎬 Live Demonstrations](#-live-demonstrations)
- [⭐ Star History](#-star-history)
- [📄 License](#-license)


---

## 📰 News

🎉 **[2026-02] nanobot ✖️ DeepCode. Just chat naturally with openclaw/nanobot to handle your coding tasks:**

<div align="center">
<table><tr>
<td align="center"><a href="https://github.com/HKUDS/DeepCode"><img src="./assets/logo.png" alt="DeepCode" height="60"/></a></td>
<td align="center"><h2>✦</h2></td>
<td align="center"><a href="https://github.com/HKUDS/nanobot"><img src="./assets/nanobot.png" alt="nanobot" height="60"/></a></td>
</tr></table>
</div>

- [nanobot](https://github.com/HKUDS/nanobot) now powers your agentic coding & engineering! 🤖💻
- Step away from your laptop — make vibe coding even more vibe! Code directly from your phone! 📱✨
- One-command deploy: `./nanobot/run_nanobot.sh` → **[Setup Guide →](#-nanobot-integration-feishu-chatbot)**

<div align="center">
<table width="100%"><tr>
<td width="50%" align="center">
  <img src="./assets/IMG_8098.jpeg" alt="Feishu Chat Example 1" width="95%" style="border-radius: 10px; box-shadow: 0 4px 15px rgba(0,0,0,0.2);"/>
</td>
<td width="50%" align="center">
  <img src="./assets/IMG_8099.jpeg" alt="Feishu Chat Example 2" width="95%" style="border-radius: 10px; box-shadow: 0 4px 15px rgba(0,0,0,0.2);"/>
</td>
</tr></table>
<sub><em>Feishu Bot in Action — Natural language → Full code generation with setup instructions</em></sub>
</div>

---

🎉 **[2026-02] New Web UI Experience Upgrade!**

- 🔄 **User-in-Loop Interaction**: Supports real-time user interaction during workflows - the AI asks clarifying questions directly in the chat
- 💬 **Inline Interaction Design**: Interaction prompts appear naturally within the chat flow for a seamless experience
- 🚀 **One-Click Launch**: Simply run `deepcode` to start the new UI (cross-platform: Windows/macOS/Linux)
- 🔧 **Improved Process Management**: Enhanced service start/stop mechanism with automatic port cleanup
- 📡 **WebSocket Real-time Communication**: Fixed message loss issues, ensuring proper interaction state synchronization

<div align="center">
  <img src="./assets/NewUI.png" alt="DeepCode New UI" width="85%" style="border-radius: 12px; box-shadow: 0 4px 20px rgba(0,0,0,0.15);" />
  <br/>
  <sub><em>DeepCode New Web UI - Modern React-based Interface</em></sub>
</div>

---

🎉 **[2025-10-28] DeepCode Achieves SOTA on PaperBench!**

DeepCode sets new benchmarks on OpenAI's PaperBench Code-Dev across all categories:

- 🏆 **Surpasses Human Experts**: **75.9%** (DeepCode) vs Top Machine Learning PhDs 72.4% (+3.5%).
- 🥇 **Outperforms SOTA Commercial Code Agents**: **84.8%** (DeepCode) vs best Commercial Code Agent 58.7% (+26.1%) (among Cursor, Claude Code, and Codex).
- 🔬 **Advances Scientific Coding**: **73.5%** (DeepCode) vs PaperCoder 51.1% (+22.4%).
- 🚀 **Beats LLM Agents**: **73.5%** (DeepCode) vs best LLM frameworks 43.3% (+30.2%).

---

## 🚀 Key Features

<br/>

<table align="center" width="100%" style="border: none; table-layout: fixed;">
<tr>
<td width="30%" align="center" style="vertical-align: top; padding: 20px;">

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<h3 style="margin: 0; padding: 0;">🚀 <strong>Paper2Code</strong></h3>
</div>

<div align="center" style="margin: 15px 0;">
  <img src="https://img.shields.io/badge/ALGORITHM-IMPLEMENTATION-ff6b6b?style=for-the-badge&logo=algorithm&logoColor=white" alt="Algorithm Badge" />
</div>

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<p align="center"><strong>Automated Implementation of Complex Algorithms</strong></p>
</div>

<div style="height: 60px; display: flex; align-items: center; justify-content: center;">
<p align="center">Effortlessly converts complex algorithms from research papers into <strong>high-quality</strong>, <strong>production-ready</strong> code, accelerating algorithm reproduction.</p>
</div>


</td>
<td width="30%" align="center" style="vertical-align: top; padding: 20px;">

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<h3 style="margin: 0; padding: 0;">🎨 <strong>Text2Web</strong></h3>
</div>

<div align="center" style="margin: 15px 0;">
  <img src="https://img.shields.io/badge/FRONTEND-DEVELOPMENT-4ecdc4?style=for-the-badge&logo=react&logoColor=white" alt="Frontend Badge" />
</div>

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<p align="center"><strong>Automated Front-End Web Development</strong></p>
</div>

<div style="height: 60px; display: flex; align-items: center; justify-content: center;">
<p align="center">Translates plain textual descriptions into <strong>fully functional</strong>, <strong>visually appealing</strong> front-end web code for rapid interface creation.</p>
</div>


</td>
<td width="30%" align="center" style="vertical-align: top; padding: 20px;">

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<h3 style="margin: 0; padding: 0;">⚙️ <strong>Text2Backend</strong></h3>
</div>

<div align="center" style="margin: 15px 0;">
  <img src="https://img.shields.io/badge/BACKEND-DEVELOPMENT-9b59b6?style=for-the-badge&logo=server&logoColor=white" alt="Backend Badge" />
</div>

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<p align="center"><strong>Automated Back-End Development</strong></p>
</div>

<div style="height: 60px; display: flex; align-items: center; justify-content: center;">
<p align="center">Generates <strong>efficient</strong>, <strong>scalable</strong>, and <strong>feature-rich</strong> back-end code from simple text inputs, streamlining server-side development.</p>
</div>


</td>
</tr>
</table>

<br/>

---

## 📊 Experimental Results

<div align="center">
    <img src='./assets/result_main02.jpg' /><br>
</div>
<br/>

We evaluate **DeepCode** on the [*PaperBench*](https://openai.com/index/paperbench/) benchmark (released by OpenAI), a rigorous testbed requiring AI agents to independently reproduce 20 ICML 2024 papers from scratch. The benchmark comprises 8,316 gradable components assessed using SimpleJudge with hierarchical weighting.

Our experiments compare DeepCode against four baseline categories: **(1) Human Experts**, **(2) State-of-the-Art Commercial Code Agents**, **(3) Scientific Code Agents**, and **(4) LLM-Based Agents**.

### ① 🧠 Human Expert Performance (Top Machine Learning PhD)

**DeepCode: 75.9% vs. Top Machine Learning PhD: 72.4% (+3.5%)**

DeepCode achieves **75.9%** on the 3-paper human evaluation subset, **surpassing the best-of-3 human expert baseline (72.4%) by +3.5 percentage points**. This demonstrates that our framework not only matches but exceeds expert-level code reproduction capabilities, representing a significant milestone in autonomous scientific software engineering.

### ② 💼 State-of-the-Art Commercial Code Agents

**DeepCode: 84.8% vs. Best Commercial Agent: 58.7% (+26.1%)**

On the 5-paper subset, DeepCode substantially outperforms leading commercial coding tools:
- Cursor: 58.4%
- Claude Code: 58.7%
- Codex: 40.0%
- **DeepCode: 84.8%**

This represents a **+26.1% improvement** over the leading commercial code agent. All commercial agents utilize Claude Sonnet 4.5 or GPT-5 Codex-high, highlighting that **DeepCode's superior architecture**—rather than base model capability—drives this performance gap.

### ③ 🔬 Scientific Code Agents

**DeepCode: 73.5% vs. PaperCoder: 51.1% (+22.4%)**

Compared to PaperCoder (**51.1%**), the state-of-the-art scientific code reproduction framework, DeepCode achieves **73.5%**, a **+22.4 percentage-point improvement**. This substantial margin validates our multi-module architecture combining planning, hierarchical task decomposition, code generation, and iterative debugging over simpler pipeline-based approaches.

### ④ 🤖 LLM-Based Agents

**DeepCode: 73.5% vs. Best LLM Agent: 43.3% (+30.2%)**

DeepCode significantly outperforms all tested LLM agents:
- Claude 3.5 Sonnet + IterativeAgent: 27.5%
- o1 + IterativeAgent (36 hours): 42.4%
- o1 BasicAgent: 43.3%
- **DeepCode: 73.5%**

The **+30.2% improvement** over the best-performing LLM agent demonstrates that sophisticated agent scaffolding, rather than extended inference time or larger models, is critical for complex code reproduction tasks.

---

### 🎯 **Autonomous Self-Orchestrating Multi-Agent Architecture**

**The Challenges**:

- 📄 **Implementation Complexity**: Converting academic papers and complex algorithms into working code requires significant technical effort and domain expertise

- 🔬 **Research Bottleneck**: Researchers spend valuable time implementing algorithms instead of focusing on their core research and discovery work

- ⏱️ **Development Delays**: Product teams experience long wait times between concept and testable prototypes, slowing down innovation cycles

- 🔄 **Repetitive Coding**: Developers repeatedly implement similar patterns and functionality instead of building on existing solutions

**DeepCode** addresses these workflow inefficiencies by providing reliable automation for common development tasks, streamlining your development workflow from concept to code.

<div align="center">

```mermaid
flowchart LR
    A["📄 Research Papers<br/>💬 Text Prompts<br/>🌐 URLs & Documents<br/>📎 Files: PDF, DOC, PPTX, TXT, HTML"] --> B["🧠 DeepCode<br/>Multi-Agent Engine"]
    B --> C["🚀 Algorithm Implementation <br/>🎨 Frontend Development <br/>⚙️ Backend Development"]

    style A fill:#ff6b6b,stroke:#c0392b,stroke-width:2px,color:#000
    style B fill:#00d4ff,stroke:#0984e3,stroke-width:3px,color:#000
    style C fill:#00b894,stroke:#00a085,stroke-width:2px,color:#000
```

</div>

---

## 🏗️ Architecture

### 📊 **System Overview**

**DeepCode** is an AI-powered development platform that automates code generation and implementation tasks. Our multi-agent system handles the complexity of translating requirements into functional, well-structured code, allowing you to focus on innovation rather than implementation details.

🎯 **Technical Capabilities**:

🧬 **Research-to-Production Pipeline**<br>
Multi-modal document analysis engine that extracts algorithmic logic and mathematical models from academic papers. Generates optimized implementations with proper data structures while preserving computational complexity characteristics.

🪄 **Natural Language Code Synthesis**<br>
Context-aware code generation using fine-tuned language models trained on curated code repositories. Maintains architectural consistency across modules while supporting multiple programming languages and frameworks.

⚡ **Automated Prototyping Engine**<br>
Intelligent scaffolding system generating complete application structures including database schemas, API endpoints, and frontend components. Uses dependency analysis to ensure scalable architecture from initial generation.

💎 **Quality Assurance Automation**<br>
Integrated static analysis with automated unit test generation and documentation synthesis. Employs AST analysis for code correctness and property-based testing for comprehensive coverage.

🔮 **CodeRAG Integration System**<br>
Advanced retrieval-augmented generation combining semantic vector embeddings with graph-based dependency analysis. Automatically discovers optimal libraries and implementation patterns from a large-scale code corpus.

---

### 🔧 **Core Techniques**

- 🧠 **Intelligent Orchestration Agent**: Central decision-making system that coordinates workflow phases and analyzes requirements. Employs dynamic planning algorithms to adapt execution strategies in real time based on evolving project complexity. Dynamically selects optimal processing strategies for each implementation step. <br>

- 💾 **Efficient Memory Mechanism**: Advanced context engineering system that manages large-scale code contexts efficiently. Implements hierarchical memory structures with intelligent compression for handling complex codebases. This component enables instant retrieval of implementation patterns and maintains semantic coherence across extended development sessions. <br>

- 🔍 **Advanced CodeRAG System**: Global code comprehension engine that analyzes complex inter-dependencies across repositories. Performs cross-codebase relationship mapping to understand architectural patterns from a holistic perspective. This module leverages dependency graphs and semantic analysis to provide globally-aware code recommendations during implementation.

---

### 🤖 **Multi-Agent Architecture of DeepCode**:

- **🎯 Central Orchestrating Agent**: Orchestrates entire workflow execution and makes strategic decisions. Coordinates specialized agents based on input complexity analysis. Implements dynamic task planning and resource allocation algorithms. <br>

- **📝 Intent Understanding Agent**: Performs deep semantic analysis of user requirements to decode complex intentions. Extracts functional specifications and technical constraints through advanced NLP processing. Transforms ambiguous human descriptions into precise, actionable development specifications with structured task decomposition. <br>

- **📄 Document Parsing Agent**: Processes complex technical documents and research papers with advanced parsing capabilities. Extracts algorithms and methodologies using document understanding models. Converts academic concepts into practical implementation specifications through intelligent content analysis. <br>

- **🏗️ Code Planning Agent**: Performs architectural design and technology stack optimization. Applies dynamic planning to produce adaptive development roadmaps. Enforces coding standards and generates modular structures through automated design pattern selection.<br>

- **🔍 Code Reference Mining Agent**: Discovers relevant repositories and frameworks through intelligent search algorithms. Analyzes codebases for compatibility and integration potential. Provides recommendations based on similarity metrics and automated dependency analysis. <br>

- **📚 Code Indexing Agent**: Builds comprehensive knowledge graphs of discovered codebases. Maintains semantic relationships between code components. Enables intelligent retrieval and cross-reference capabilities. <br>

- **🧬 Code Generation Agent**: Synthesizes gathered information into executable code implementations. Creates functional interfaces and integrates discovered components. Generates comprehensive test suites and documentation for reproducibility.

---

#### 🛠️ **Implementation Tools Matrix**

**🔧 Powered by MCP (Model Context Protocol)**

DeepCode leverages the **Model Context Protocol (MCP)** standard to seamlessly integrate with various tools and services. This standardized approach ensures reliable communication between AI agents and external systems, enabling powerful automation capabilities.

##### 📡 **MCP Servers & Tools**

| 🛠️ **MCP Server** | 🔧 **Primary Function** | 💡 **Purpose & Capabilities** |
|-------------------|-------------------------|-------------------------------|
| **🔍 brave** | Web Search Engine | Real-time information retrieval via Brave Search API |
| **🌐 bocha-mcp** | Alternative Search | Secondary search option with independent API access |
| **📂 filesystem** | File System Operations | Local file and directory management, read/write operations |
| **🌐 fetch** | Web Content Retrieval | Fetch and extract content from URLs and web resources |
| **📥 github-downloader** | Repository Management | Clone and download GitHub repositories for analysis |
| **📋 file-downloader** | Document Processing | Download and convert files (PDF, DOCX, etc.) to Markdown |
| **⚡ command-executor** | System Commands | Execute bash/shell commands for environment management |
| **🧬 code-implementation** | Code Generation Hub | Comprehensive code reproduction with execution and testing |
| **📚 code-reference-indexer** | Smart Code Search | Intelligent indexing and search of code repositories |
| **📄 document-segmentation** | Smart Document Analysis | Intelligent document segmentation for large papers and technical documents |

##### 🔧 **Legacy Tool Functions** *(for reference)*

| 🛠️ **Function** | 🎯 **Usage Context** |
|-----------------|---------------------|
| **📄 read_code_mem** | Efficient code context retrieval from memory |
| **✍️ write_file** | Direct file content generation and modification |
| **🐍 execute_python** | Python code testing and validation |
| **📁 get_file_structure** | Project structure analysis and organization |
| **⚙️ set_workspace** | Dynamic workspace and environment configuration |
| **📊 get_operation_history** | Process monitoring and operation tracking |


---

🎛️ **Multi-Interface Framework**<br>
RESTful API with CLI and web frontends featuring real-time code streaming, interactive debugging, and extensible plugin architecture for CI/CD integration.

**🚀 Multi-Agent Intelligent Pipeline:**

<div align="center">

### 🌟 **Intelligence Processing Flow**

<table align="center" width="100%" style="border: none; border-collapse: collapse;">
<tr>
<td colspan="3" align="center" style="padding: 20px; background: linear-gradient(135deg, #667eea 0%, #764ba2 100%); border-radius: 15px; color: white; font-weight: bold;">
💡 <strong>INPUT LAYER</strong><br/>
📄 Research Papers • 💬 Natural Language • 🌐 URLs • 📋 Requirements
</td>
</tr>
<tr><td colspan="3" height="20"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 15px; background: linear-gradient(135deg, #ff6b6b 0%, #ee5a24 100%); border-radius: 12px; color: white; font-weight: bold;">
🎯 <strong>CENTRAL ORCHESTRATION</strong><br/>
Strategic Decision Making • Workflow Coordination • Agent Management
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #3742fa 0%, #2f3542 100%); border-radius: 10px; color: white; width: 50%;">
📝 <strong>TEXT ANALYSIS</strong><br/>
<small>Requirement Processing</small>
</td>
<td width="10"></td>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #8c7ae6 0%, #9c88ff 100%); border-radius: 10px; color: white; width: 50%;">
📄 <strong>DOCUMENT ANALYSIS</strong><br/>
<small>Paper & Spec Processing</small>
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 15px; background: linear-gradient(135deg, #00d2d3 0%, #54a0ff 100%); border-radius: 12px; color: white; font-weight: bold;">
📋 <strong>REPRODUCTION PLANNING</strong><br/>
Deep Paper Analysis • Code Requirements Parsing • Reproduction Strategy Development
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #ffa726 0%, #ff7043 100%); border-radius: 10px; color: white; width: 50%;">
🔍 <strong>REFERENCE ANALYSIS</strong><br/>
<small>Repository Discovery</small>
</td>
<td width="10"></td>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #e056fd 0%, #f368e0 100%); border-radius: 10px; color: white; width: 50%;">
📚 <strong>CODE INDEXING</strong><br/>
<small>Knowledge Graph Building</small>
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 15px; background: linear-gradient(135deg, #26de81 0%, #20bf6b 100%); border-radius: 12px; color: white; font-weight: bold;">
🧬 <strong>CODE IMPLEMENTATION</strong><br/>
Implementation Generation • Testing • Documentation
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 20px; background: linear-gradient(135deg, #045de9 0%, #09c6f9 100%); border-radius: 15px; color: white; font-weight: bold;">
⚡ <strong>OUTPUT DELIVERY</strong><br/>
📦 Complete Codebase • 🧪 Test Suite • 📚 Documentation • 🚀 Deployment Ready
</td>
</tr>
</table>

</div>

<div align="center">
<br/>

### 🔄 **Process Intelligence Features**

<table align="center" style="border: none;">
<tr>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #ff6b6b;">
<h4>🎯 Adaptive Flow</h4>
<p><small>Dynamic agent selection based on input complexity</small></p>
</div>
</td>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #4ecdc4;">
<h4>🧠 Smart Coordination</h4>
<p><small>Intelligent task distribution and parallel processing</small></p>
</div>
</td>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #45b7d1;">
<h4>🔍 Context Awareness</h4>
<p><small>Deep understanding through CodeRAG integration</small></p>
</div>
</td>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #96ceb4;">
<h4>⚡ Quality Assurance</h4>
<p><small>Automated testing and validation throughout</small></p>
</div>
</td>
</tr>
</table>

</div>

---


## 🚀 Quick Start

### 📋 **Prerequisites**

Before installing DeepCode, ensure you have the following:

| Requirement | Version | Purpose |
|-------------|---------|---------|
| **Python** | 3.9+ | Core runtime |
| **Node.js** | 18+ | New UI frontend |
| **npm** | 8+ | Package management |

```bash
# Check your versions
python --version   # Should be 3.9+
node --version     # Should be 18+
npm --version      # Should be 8+
```

<details>
<summary><strong>📥 Install Node.js (if not installed)</strong></summary>

```bash
# macOS (using Homebrew)
brew install node

# Ubuntu/Debian
curl -fsSL https://deb.nodesource.com/setup_20.x | sudo -E bash -
sudo apt-get install -y nodejs

# Windows
# Download from https://nodejs.org/
```

</details>

### 📦 **Step 1: Installation**

Choose one of the following installation methods:

#### ⚡ **Direct Installation (Recommended)**

```bash
# 🚀 Install DeepCode package directly
pip install deepcode-hku

# 🔑 Download configuration files
curl -O https://raw.githubusercontent.com/HKUDS/DeepCode/main/mcp_agent.config.yaml
curl -o mcp_agent.secrets.yaml https://raw.githubusercontent.com/HKUDS/DeepCode/main/mcp_agent.secrets.yaml.example
```

#### 🔧 **Development Installation (From Source)**

<details>
<summary><strong>📂 Click to expand development installation options</strong></summary>

##### 🔥 **Using UV (Recommended for Development)**

```bash
git clone https://github.com/HKUDS/DeepCode.git
cd DeepCode/

curl -LsSf https://astral.sh/uv/install.sh | sh
uv venv --python=3.13
source .venv/bin/activate  # On Windows: .venv\Scripts\activate
uv pip install -r requirements.txt

# Install frontend dependencies
npm install --prefix new_ui/frontend
```

##### 🐍 **Using Traditional pip**

```bash
git clone https://github.com/HKUDS/DeepCode.git
cd DeepCode/

pip install -r requirements.txt

# Install frontend dependencies
npm install --prefix new_ui/frontend
```

</details>

### 🔧 **Step 2: Configuration**

> The following configuration applies to **all installation methods** (pip, UV, source, and Docker).

#### 🔑 API Keys *(required)*

Edit `mcp_agent.secrets.yaml` with your API keys:

```yaml
# At least ONE provider API key is required
openai:
  api_key: "your_openai_api_key"
  base_url: "https://openrouter.ai/api/v1"  # Optional: for OpenRouter or custom endpoints

anthropic:
  api_key: "your_anthropic_api_key"  # For Claude models

google:
  api_key: "your_google_api_key"     # For Gemini models
```

#### 🤖 LLM Provider *(optional)*

Edit `mcp_agent.config.yaml` to choose your preferred LLM provider (line ~106):

```yaml
# Options: "google", "anthropic", "openai"
# If not set or unavailable, will automatically fallback to first available provider
llm_provider: "google"
```

#### 🔍 Search API Keys *(optional)*

Configure web search in `mcp_agent.config.yaml`:

```yaml
# For Brave Search (default) — set in brave.env section (line ~28)
brave:
  env:
    BRAVE_API_KEY: "your_brave_api_key_here"

# For Bocha-MCP (alternative) — set in bocha-mcp.env section (line ~74)
bocha-mcp:
  env:
    BOCHA_API_KEY: "your_bocha_api_key_here"
```

#### 📄 Document Segmentation *(optional)*

Control document processing in `mcp_agent.config.yaml`:

```yaml
document_segmentation:
  enabled: true          # true/false — whether to use intelligent document segmentation
  size_threshold_chars: 50000  # Document size threshold to trigger segmentation
```

<details>
<summary><strong>🪟 Windows Users: Additional MCP Server Configuration</strong></summary>

If you're using Windows, you may need to configure MCP servers manually in `mcp_agent.config.yaml`:

```bash
# 1. Install MCP servers globally
npm i -g @modelcontextprotocol/server-brave-search
npm i -g @modelcontextprotocol/server-filesystem

# 2. Find your global node_modules path
npm -g root
```

Then update your `mcp_agent.config.yaml` to use absolute paths:

```yaml
mcp:
  servers:
    brave:
      command: "node"
      args: ["C:/Program Files/nodejs/node_modules/@modelcontextprotocol/server-brave-search/dist/index.js"]
    filesystem:
      command: "node"
      args: ["C:/Program Files/nodejs/node_modules/@modelcontextprotocol/server-filesystem/dist/index.js", "."]
```

> **Note**: Replace the path with your actual global node_modules path from step 2.

</details>

<details>
<summary><strong>🔍 Search Server Configuration (Optional)</strong></summary>

DeepCode supports multiple search servers for web search functionality. You can configure your preferred option in `mcp_agent.config.yaml`:

```yaml
# Default search server configuration
# Options: "brave" or "bocha-mcp"
default_search_server: "brave"
```

**Available Options:**
- **🔍 Brave Search** (`"brave"`): Default option with high-quality search results. Requires `BRAVE_API_KEY`. Recommended for most users.
- **🌐 Bocha-MCP** (`"bocha-mcp"`): Alternative search server. Requires `BOCHA_API_KEY`. Uses a local Python server implementation.

**Full MCP server configuration in mcp_agent.config.yaml:**
```yaml
# For Brave Search (default) - around line 28
brave:
  command: "npx"
  args: ["-y", "@modelcontextprotocol/server-brave-search"]
  env:
    BRAVE_API_KEY: "your_brave_api_key_here"

# For Bocha-MCP (alternative) - around line 74
bocha-mcp:
  command: "python"
  args: ["tools/bocha_search_server.py"]
  env:
    PYTHONPATH: "."
    BOCHA_API_KEY: "your_bocha_api_key_here"
```

> **💡 Tip**: Both search servers require API key configuration. Choose the one that best fits your API access and requirements.

</details>

### ⚡ **Step 3: Launch Application**

Choose your preferred launch method:

<table width="100%">
<tr>
<th width="33%">🐳 Docker (Recommended)</th>
<th width="33%">🚀 Local (<code>deepcode</code> command)</th>
<th width="33%">🛠️ Other Methods</th>
</tr>
<tr><td>

No Python/Node needed — everything in container.

```bash
git clone https://github.com/HKUDS/DeepCode.git
cd DeepCode/
cp mcp_agent.secrets.yaml.example \
   mcp_agent.secrets.yaml
# Edit secrets with your API keys

./deepcode_docker/run_docker.sh
# Access → http://localhost:8000
```

</td><td>

Auto-installs deps on first run.

```bash
deepcode
# Frontend → http://localhost:5173
# Backend  → http://localhost:8000
# Ctrl+C to stop
```

Features: User-in-Loop, real-time progress, inline chat.

</td><td>

```bash
# macOS / Linux
./run.sh
# or: python deepcode.py

# Windows
run.bat
# or: python deepcode.py

# Classic Streamlit UI
deepcode --classic

# CLI mode
deepcode --cli
# or: python cli/main_cli.py
```

</td></tr>
</table>

<details>
<summary><strong>🐳 Docker Management Commands</strong></summary>

```bash
./deepcode_docker/run_docker.sh stop      # Stop
./deepcode_docker/run_docker.sh restart   # Restart (no rebuild needed for config changes)
./deepcode_docker/run_docker.sh --build   # Force rebuild
./deepcode_docker/run_docker.sh logs      # Real-time logs
./deepcode_docker/run_docker.sh status    # Health check
./deepcode_docker/run_docker.sh clean     # Remove containers & images
```

Or with Docker Compose directly:
```bash
docker compose -f deepcode_docker/docker-compose.yml up --build   # Build & start
docker compose -f deepcode_docker/docker-compose.yml down         # Stop
docker compose -f deepcode_docker/docker-compose.yml logs -f      # Logs
```

> **💡** Config files are mounted as volumes — edit and restart, no rebuild needed.
> **💡** Windows users: run `docker compose` commands directly if shell scripts aren't available.

</details>

### 🎯 **Step 4: Generate Code**

1. **📄 Input** — Upload a research paper, type requirements, or paste a URL
2. **🤖 Processing** — The multi-agent system analyzes, plans, and generates
3. **⚡ Output** — Receive production-ready code with tests and documentation

---

### 🔧 **Troubleshooting**

<details>
<summary><strong>❓ Common Issues & Solutions</strong></summary>

| Problem | Cause | Fix |
|---|---|---|
| Docker build fails with `tsc: not found` | Corrupted build cache | `docker builder prune -f` then rebuild with `--no-cache` |
| `error during connect` / `cannot find the file` | Docker Desktop not running | Start Docker Desktop, wait until ready, retry |
| Frontend blank page | Corrupted `node_modules` | `cd new_ui/frontend && rm -rf node_modules && npm install` |
| `ERR_CONNECTION_REFUSED` | Wrong port / backend not running | Docker: `http://localhost:8000`. Local: `http://localhost:5173` |
| `npm install` → `Could not read package.json` | Wrong directory | Use `npm install --prefix new_ui/frontend` |
| Windows: MCP servers not working | Need absolute paths | See [Windows MCP Configuration](#-step-2-configuration) above |

</details>

  ---

## 🤖 nanobot Integration (Feishu Chatbot)

> Chat with DeepCode from **Feishu** — powered by [nanobot](https://github.com/HKUDS/nanobot).

<div align="center">

```mermaid
flowchart LR
    subgraph Clients["💬 Chat Platforms"]
        direction TB
        F["<b>Feishu</b><br/>WebSocket"]
        T["<b>Telegram</b><br/>Polling"]
        D["<b>Discord</b><br/>Gateway"]
    end

    subgraph Gateway["🐈 nanobot Gateway"]
        direction TB
        A["Agent Loop<br/><i>LLM + Tool Calls</i>"]
    end

    subgraph Engine["🧠 DeepCode Engine"]
        direction TB
        P2C["Paper → Code"]
        C2C["Chat → Code"]
        TRK["Task Tracking"]
    end

    F & T & D <-->|"messages"| A
    A -->|"HTTP API"| P2C & C2C & TRK
    A -.->|"LLM API"| LLM["☁️ OpenRouter"]

    style Clients fill:#1a1a2e,stroke:#00d9ff,color:#fff
    style Gateway fill:#1a1a2e,stroke:#4ecdc4,color:#fff
    style Engine fill:#1a1a2e,stroke:#ff6b6b,color:#fff
    style LLM fill:#1a1a2e,stroke:#9b59b6,color:#fff
```

</div>

<div align="center">
<table><tr>
<td align="center"><a href="https://github.com/HKUDS/DeepCode"><img src="./assets/logo.png" alt="DeepCode" height="55"/></a></td>
<td align="center"><h2>✦</h2></td>
<td align="center"><a href="https://github.com/HKUDS/nanobot"><img src="./assets/nanobot.png" alt="nanobot" height="55"/></a></td>
</tr></table>
</div>

Both services run inside the same **Docker Compose** network. Prerequisites: **Docker Desktop** + **OpenRouter API Key** ([get one](https://openrouter.ai/keys)) + **Feishu App**.

---

### Step 1 · Create a Feishu Bot

<details open>
<summary><b>Feishu / Lark</b> (Recommended — WebSocket, no public IP needed)</summary>

1. Go to [Feishu Open Platform](https://open.feishu.cn/app) → **Create Custom App**
2. Enable **Bot** capability in App Features
3. Add permissions: `im:message` · `im:message:send_as_bot`
4. Event Subscription → select **Long Connection** → add `im.message.receive_v1`
5. Note your **App ID** (`cli_xxx`) and **App Secret** → Publish the app

> **Note**: Feishu requires an active WebSocket connection before you can save "Long Connection" mode. Start nanobot first (Step 3), then come back to configure Event Subscription.

</details>

### Step 2 · Configure

```bash
cp nanobot_config.json.example nanobot_config.json
```

Edit `nanobot_config.json` — fill in the 3 required fields:

```jsonc
{
  "channels": {
    "feishu": {
      "enabled": true,
      "appId": "cli_xxx",              // ← Feishu App ID
      "appSecret": "xxx",              // ← Feishu App Secret
      "allowFrom": []                  // [] = allow all users
    }
  },
  "providers": {
    "openrouter": {
      "apiKey": "sk-or-v1-xxx"         // ← OpenRouter API Key
    }
  },
  "agents": {
    "defaults": {
      "model": "anthropic/claude-sonnet-4-20250514"
    }
  }
}
```

> **Model choice**: Any model on [openrouter.ai/models](https://openrouter.ai/models). Use `anthropic/claude-sonnet-4-20250514` for English, `minimax/minimax-m2.1` for Chinese.

---

### Step 3 · Launch

Make sure `mcp_agent.secrets.yaml` has your DeepCode API keys (see [Configuration](#-step-2-configuration)), then:

```bash
./nanobot/run_nanobot.sh -d          # Start both DeepCode + nanobot in background
```

The script checks Docker, validates configs, builds images (first run only), and starts both containers.

```
✓ DeepCode API:  http://localhost:8000
✓ Nanobot:       http://localhost:18790
```

Now open Feishu → find your bot → send a message!

<details>
<summary><b>Management Commands</b></summary>

```bash
./nanobot/run_nanobot.sh              # Start (foreground)
./nanobot/run_nanobot.sh -d           # Start (background)
./nanobot/run_nanobot.sh stop         # Stop all services
./nanobot/run_nanobot.sh restart      # Restart (config changes take effect immediately)
./nanobot/run_nanobot.sh --build      # Force rebuild Docker images
./nanobot/run_nanobot.sh logs         # View real-time logs
./nanobot/run_nanobot.sh status       # Health check
./nanobot/run_nanobot.sh clean        # Remove containers & images
```

</details>

<details>
<summary><b>Troubleshooting</b></summary>

| Problem | Fix |
|---|---|
| Feishu bot doesn't respond | Check logs (`./nanobot/run_nanobot.sh logs`), verify `appId`/`appSecret`, ensure app is published with Long Connection mode |
| Can't connect to DeepCode | Verify `deepcode` container is healthy: `curl http://localhost:8000/health` |
| Wrong language output | Switch model — `minimax-m2.1` defaults to Chinese, use Claude/GPT for English |
| Config not taking effect | Just restart: `./nanobot/run_nanobot.sh restart` (no rebuild needed) |
| Clear chat history | Send `/clear` in chat, or: `docker exec nanobot sh -c 'rm -rf /root/.nanobot/sessions/*.jsonl'` |

</details>

---

## 💡 Examples


### 🎬 **Live Demonstrations**


<table align="center">
<tr>
<td width="33%" align="center">

#### 📄 **Paper2Code Demo**
**Research to Implementation**

<div align="center">
  <a href="https://www.youtube.com/watch?v=MQZYpLkzsbw">
    <img src="https://img.youtube.com/vi/MQZYpLkzsbw/maxresdefault.jpg" alt="Paper2Code Demo" width="100%" style="border-radius: 10px; box-shadow: 0 4px 8px rgba(0,0,0,0.1);"/>
  </a>

  **[▶️ Watch Demo](https://www.youtube.com/watch?v=MQZYpLkzsbw)**

  *Transform academic papers into production-ready code automatically*
</div>

</td>
<td width="33%" align="center">

#### 🖼️ **Image Processing Demo**
**AI-Powered Image Tools**

<div align="center">
  <a href="https://www.youtube.com/watch?v=nFt5mLaMEac">
    <img src="https://img.youtube.com/vi/nFt5mLaMEac/maxresdefault.jpg" alt="Image Processing Demo" width="100%" style="border-radius: 10px; box-shadow: 0 4px 8px rgba(0,0,0,0.1);"/>
  </a>

  **[▶️ Watch Demo](https://www.youtube.com/watch?v=nFt5mLaMEac)**

  *Intelligent image processing with background removal and enhancement*
</div>

</td>
<td width="33%" align="center">

#### 🌐 **Frontend Implementation**
**Complete Web Application**

<div align="center">
  <a href="https://www.youtube.com/watch?v=78wx3dkTaAU">
    <img src="https://img.youtube.com/vi/78wx3dkTaAU/maxresdefault.jpg" alt="Frontend Demo" width="100%" style="border-radius: 10px; box-shadow: 0 4px 8px rgba(0,0,0,0.1);"/>
  </a>

  **[▶️ Watch Demo](https://www.youtube.com/watch?v=78wx3dkTaAU)**

  *Full-stack web development from concept to deployment*
</div>

</td>
</tr>
</table>


### 🆕 **Recent Updates**

#### 📄 **Smart Document Segmentation (v1.2.0)**
- **Intelligent Processing**: Automatically handles large research papers and technical documents that exceed LLM token limits
- **Configurable Control**: Toggle segmentation via configuration with size-based thresholds
- **Semantic Analysis**: Advanced content understanding with algorithm, concept, and formula preservation
- **Backward Compatibility**: Seamlessly falls back to traditional processing for smaller documents

### 🚀 **Coming Soon**

We're continuously enhancing DeepCode with exciting new features:

#### 🔧 **Enhanced Code Reliability & Validation**
- **Automated Testing**: Comprehensive functionality testing with execution verification and error detection.
- **Code Quality Assurance**: Multi-level validation through static analysis, dynamic testing, and performance benchmarking.
- **Smart Debugging**: AI-powered error detection with automatic correction suggestions.

#### 📊 **PaperBench Performance Showcase**
- **Benchmark Dashboard**: Comprehensive performance metrics on the PaperBench evaluation suite.
- **Accuracy Metrics**: Detailed comparison with state-of-the-art paper reproduction systems.
- **Success Analytics**: Statistical analysis across paper categories and complexity levels.

#### ⚡ **System-wide Optimizations**
- **Performance Boost**: Multi-threaded processing and optimized agent coordination for faster generation.
- **Enhanced Reasoning**: Advanced reasoning capabilities with improved context understanding.
- **Expanded Support**: Extended compatibility with additional programming languages and frameworks.

---

## ⭐ Star History

<div align="center">

*Community Growth Trajectory*

<a href="https://star-history.com/#HKUDS/DeepCode&Date">
  <picture>
    <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/svg?repos=HKUDS/DeepCode&type=Date&theme=dark" />
    <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/svg?repos=HKUDS/DeepCode&type=Date" />
    <img alt="Star History Chart" src="https://api.star-history.com/svg?repos=HKUDS/DeepCode&type=Date" style="border-radius: 15px; box-shadow: 0 0 30px rgba(0, 217, 255, 0.3);" />
  </picture>
</a>

</div>

---

### 🚀 **Ready to Transform Development?**

<div align="center">

<p>
  <a href="#-quick-start"><img src="https://img.shields.io/badge/🚀_Get_Started-00d4ff?style=for-the-badge&logo=rocket&logoColor=white" alt="Get Started"></a>
  <a href="https://github.com/HKUDS"><img src="https://img.shields.io/badge/🏛️_View_on_GitHub-00d4ff?style=for-the-badge&logo=github&logoColor=white" alt="View on GitHub"></a>
  <a href="https://github.com/HKUDS/DeepCode"><img src="https://img.shields.io/badge/⭐_Star_Project-00d4ff?style=for-the-badge&logo=star&logoColor=white" alt="Star Project"></a>
</p>

</div>

---

<div align="left">

### 📖 **Citation**


If you find DeepCode useful in your research or applications, please kindly cite:

```bibtex
@misc{li2025deepcodeopenagenticcoding,
      title={DeepCode: Open Agentic Coding},
      author={Zongwei Li and Zhonghang Li and Zirui Guo and Xubin Ren and Chao Huang},
      year={2025},
      eprint={2512.07921},
      archivePrefix={arXiv},
      primaryClass={cs.SE},
      url={https://arxiv.org/abs/2512.07921},
}
```

</div>

---


### 📄 **License**

<div align="center">

<img src="https://img.shields.io/badge/License-MIT-4ecdc4?style=for-the-badge&logo=opensourceinitiative&logoColor=white" alt="MIT License">

**MIT License** - Copyright (c) 2025 Data Intelligence Lab, The University of Hong Kong

---


<img src="https://visitor-badge.laobi.icu/badge?page_id=deepcode.readme&style=for-the-badge&color=00d4ff" alt="Visitors">

</div>


================================================
FILE: README_ZH.md
================================================
<div align="center">

<table style="border: none; margin: 0 auto; padding: 0; border-collapse: collapse;">
<tr>
<td align="center" style="vertical-align: middle; padding: 10px; border: none; width: 250px;">
  <img src="assets/logo.png" alt="DeepCode Logo" width="200" style="margin: 0; padding: 0; display: block;"/>
</td>
<td align="left" style="vertical-align: middle; padding: 10px 0 10px 30px; border: none;">
  <pre style="font-family: 'Courier New', monospace; font-size: 16px; color: #0EA5E9; margin: 0; padding: 0; text-shadow: 0 0 10px #0EA5E9, 0 0 20px rgba(14,165,233,0.5); line-height: 1.2; transform: skew(-1deg, 0deg); display: block;">    ██████╗ ███████╗███████╗██████╗  ██████╗ ██████╗ ██████╗ ███████╗
    ██╔══██╗██╔════╝██╔════╝██╔══██╗██╔════╝██╔═══██╗██╔══██╗██╔════╝
    ██║  ██║█████╗  █████╗  ██████╔╝██║     ██║   ██║██║  ██║█████╗
    ██║  ██║██╔══╝  ██╔══╝  ██╔═══╝ ██║     ██║   ██║██║  ██║██╔══╝
    ██████╔╝███████╗███████╗██║     ╚██████╗╚██████╔╝██████╔╝███████╗
    ╚═════╝ ╚══════╝╚══════╝╚═╝      ╚═════╝ ╚═════╝ ╚═════╝ ╚══════╝</pre>
</td>
</tr>
</table>

<div align="center">
<a href="https://trendshift.io/repositories/14665" target="_blank"><img src="https://trendshift.io/api/badge/repositories/14665" alt="HKUDS%2FDeepCode | Trendshift" style="width: 250px; height: 55px;" width="250" height="55"/></a>
</div>

<!-- <img src="https://readme-typing-svg.herokuapp.com?font=Russo+One&size=28&duration=2000&pause=800&color=06B6D4&background=00000000&center=true&vCenter=true&width=800&height=50&lines=%E2%9A%A1+OPEN+AGENTIC+CODING+%E2%9A%A1" alt="DeepCode Tech Subtitle" style="margin-top: 5px; filter: drop-shadow(0 0 12px #06B6D4) drop-shadow(0 0 24px rgba(6,182,212,0.4));"/> -->

# <img src="https://github.com/Zongwei9888/Experiment_Images/raw/43c585dca3d21b8e4b6390d835cdd34dc4b4b23d/DeepCode_images/title_logo.svg" alt="DeepCode Logo" width="32" height="32" style="vertical-align: middle; margin-right: 8px;"/> DeepCode: 开源智能体编程

### *基于多智能体系统推进代码生成技术*

<!-- <p align="center">
  <img src="https://img.shields.io/badge/Version-1.0.0-00d4ff?style=for-the-badge&logo=rocket&logoColor=white" alt="Version">

  <img src="https://img.shields.io/badge/License-MIT-4ecdc4?style=for-the-badge&logo=opensourceinitiative&logoColor=white" alt="License">
  <img src="https://img.shields.io/badge/AI-Multi--Agent-9b59b6?style=for-the-badge&logo=brain&logoColor=white" alt="AI">
  <img src="https://img.shields.io/badge/HKU-Data_Intelligence_Lab-f39c12?style=for-the-badge&logo=university&logoColor=white" alt="HKU">
</p> -->
<p>
  <a href="https://github.com/HKUDS/DeepCode/stargazers"><img src='https://img.shields.io/github/stars/HKUDS/DeepCode?color=00d9ff&style=for-the-badge&logo=star&logoColor=white&labelColor=1a1a2e' /></a>
  <img src="https://img.shields.io/badge/🐍Python-3.13-4ecdc4?style=for-the-badge&logo=python&logoColor=white&labelColor=1a1a2e">
  <a href="https://pypi.org/project/deepcode-hku/"><img src="https://img.shields.io/pypi/v/deepcode-hku.svg?style=for-the-badge&logo=pypi&logoColor=white&labelColor=1a1a2e&color=ff6b6b"></a>
</p>
<p>
  <a href="https://discord.gg/yF2MmDJyGJ"><img src="https://img.shields.io/badge/💬Discord-社区-7289da?style=for-the-badge&logo=discord&logoColor=white&labelColor=1a1a2e"></a>
  <a href="https://github.com/HKUDS/DeepCode/issues/11"><img src="https://img.shields.io/badge/💬微信-群组-07c160?style=for-the-badge&logo=wechat&logoColor=white&labelColor=1a1a2e"></a>
</p>
<div align="center">
  <div style="width: 100%; height: 2px; margin: 20px 0; background: linear-gradient(90deg, transparent, #00d9ff, transparent);"></div>
</div>

<div align="center">
  <a href="#-快速开始" style="text-decoration: none;">
    <img src="https://img.shields.io/badge/快速开始-立即开始-00d9ff?style=for-the-badge&logo=rocket&logoColor=white&labelColor=1a1a2e">
  </a>
</div>

<div align="center" style="margin-top: 10px;">
  <a href="README.md">
    <img src="https://img.shields.io/badge/English-00d4ff?style=for-the-badge&logo=readme&logoColor=white&labelColor=1a1a2e" alt="English">
  </a>
  <a href="README_ZH.md">
    <img src="https://img.shields.io/badge/中文-00d4ff?style=for-the-badge&logo=readme&logoColor=white&labelColor=1a1a2e" alt="中文">
  </a>
</div>

### 🖥️ **界面展示**

<table align="center" width="100%" style="border: none; border-collapse: collapse; margin: 30px 0;">
<tr>
<td width="50%" align="center" style="vertical-align: top; padding: 20px;">

#### 🖥️ **命令行界面**
**基于终端的开发环境**

<div align="center">

  <img src="https://github.com/Zongwei9888/Experiment_Images/raw/8882a7313c504ca97ead6e7b36c51aa761b6a4f3/DeepCode_images/CLI.gif" alt="CLI Interface Demo" width="100%" style="border-radius: 10px; box-shadow: 0 8px 20px rgba(45,55,72,0.3); margin: 15px 0;"/>

  <div style="background: linear-gradient(135deg, #2D3748 0%, #4A5568 100%); border-radius: 12px; padding: 15px; margin: 15px 0; color: white;">
    <strong>🚀 高级终端体验</strong><br/>
    <small>⚡ 快速命令行工作流<br/>🔧 开发者友好界面<br/>📊 实时进度跟踪</small>
  </div>

  *专业终端界面，适合高级用户和CI/CD集成*
</div>

</td>
<td width="50%" align="center" style="vertical-align: top; padding: 20px;">

#### 🌐 **Web界面**
**可视化交互体验**

<div align="center">

  <img src="https://github.com/Zongwei9888/Experiment_Images/raw/8882a7313c504ca97ead6e7b36c51aa761b6a4f3/DeepCode_images/UI.gif" alt="Web Interface Demo" width="100%" style="border-radius: 10px; box-shadow: 0 8px 20px rgba(14,165,233,0.3); margin: 15px 0;"/>

  <div style="background: linear-gradient(135deg, #0EA5E9 0%, #00D4FF 100%); border-radius: 12px; padding: 15px; margin: 15px 0; color: white;">
    <strong>🎨 现代化Web仪表板</strong><br/>
    <small>🖱️ 直观的拖拽操作<br/>📱 响应式设计<br/>🎯 可视化进度跟踪</small>
  </div>

  *美观的Web界面，为所有技能水平用户提供流畅的工作流程*
</div>

</td>
</tr>
</table>

---

<div align="center">

### 🎬 **介绍视频**

<div style="margin: 20px 0;">
  <a href="https://youtu.be/PRgmP8pOI08" target="_blank">
    <img src="https://img.youtube.com/vi/PRgmP8pOI08/maxresdefault.jpg"
         alt="DeepCode Introduction Video"
         width="75%"
         style="border-radius: 12px; box-shadow: 0 8px 25px rgba(0,0,0,0.15); transition: transform 0.3s ease;"/>
  </a>
</div>

*🎯 **观看我们的完整介绍** - 了解DeepCode如何将研究论文和自然语言转换为生产就绪的代码*

<p>
  <a href="https://youtu.be/PRgmP8pOI08" target="_blank">
    <img src="https://img.shields.io/badge/▶️_观看视频-FF0000?style=for-the-badge&logo=youtube&logoColor=white" alt="Watch Video"/>
  </a>
</p>

</div>

---


> *"AI智能体将创意转化为生产就绪代码的地方"*

</div>

---

## 📑 目录

- [📰 新闻](#-新闻)
- [🚀 核心特性](#-核心特性)
- [🏗️ 架构](#️-架构)
- [📊 实验结果](#-实验结果)
- [🚀 快速开始](#-快速开始)
- [🤖 nanobot 集成（飞书聊天机器人）](#-nanobot-集成飞书聊天机器人)
- [💡 示例](#-示例)
  - [🎬 实时演示](#-实时演示)
- [⭐ 星标历史](#-星标历史)
- [📄 许可证](#-许可证)

---

## 📰 新闻

🎉 **[2026-02] DeepCode + nanobot 集成 — 通过飞书聊天使用 DeepCode！**

<div align="center">
<table><tr>
<td align="center"><a href="https://github.com/HKUDS/DeepCode"><img src="./assets/logo.png" alt="DeepCode" height="60"/></a></td>
<td align="center"><h2>✦</h2></td>
<td align="center"><a href="https://github.com/HKUDS/nanobot"><img src="./assets/nanobot.png" alt="nanobot" height="60"/></a></td>
</tr></table>
</div>

- [nanobot](https://github.com/HKUDS/nanobot) 现已连接到 DeepCode — 在**飞书**中发送消息即可自动生成代码
- 支持**论文转代码**和**对话转代码**，以及实时任务跟踪，全部在聊天应用中完成
- 一键部署：`./nanobot/run_nanobot.sh` → **[设置指南 →](#-nanobot-集成飞书聊天机器人)**

<div align="center">
<table width="100%"><tr>
<td width="50%" align="center">
  <img src="./assets/IMG_8098.jpeg" alt="飞书聊天示例 1" width="95%" style="border-radius: 10px; box-shadow: 0 4px 15px rgba(0,0,0,0.2);"/>
</td>
<td width="50%" align="center">
  <img src="./assets/IMG_8099.jpeg" alt="飞书聊天示例 2" width="95%" style="border-radius: 10px; box-shadow: 0 4px 15px rgba(0,0,0,0.2);"/>
</td>
</tr></table>
<sub><em>飞书机器人实战 — 自然语言 → 完整代码生成，带设置说明</em></sub>
</div>

---

🎉 **[2026-02] 全新 Web UI 体验升级！**

- 🔄 **用户交互循环 (User-in-Loop)**: 支持工作流程中的实时用户交互，AI 会在对话中向您提问以澄清需求
- 💬 **内联交互设计**: 交互问题直接显示在对话框中，体验更自然流畅
- 🚀 **一键启动**: 运行 `deepcode` 即可启动新版 UI（跨平台支持：Windows/macOS/Linux）
- 🔧 **优化的进程管理**: 改进了服务启停机制，自动清理端口占用
- 📡 **WebSocket 实时通信**: 修复了消息丢失问题，确保交互状态正确同步

<div align="center">
  <img src="./assets/NewUI.png" alt="DeepCode 全新 UI" width="85%" style="border-radius: 12px; box-shadow: 0 4px 20px rgba(0,0,0,0.15);" />
  <br/>
  <sub><em>DeepCode 全新 Web UI - 基于 React 的现代界面</em></sub>
</div>

---

🎉 **[2025-10-28] DeepCode在PaperBench上达到最先进水平！**

DeepCode在OpenAI的PaperBench Code-Dev所有类别中创造新基准：

- 🏆 **超越人类专家**: **75.9%** (DeepCode) vs 顶级机器学习博士 72.4% (+3.5%)。
- 🥇 **超越最先进商业代码智能体**: **84.8%** (DeepCode) vs 领先商业代码智能体 (+26.1%) (Cursor, Claude Code, 和 Codex)。
- 🔬 **推进科学编程**: **73.5%** (DeepCode) vs PaperCoder 51.1% (+22.4%)。
- 🚀 **击败LLM智能体**: **73.5%** (DeepCode) vs 最佳LLM框架 43.3% (+30.2%)。

---

## 🚀 核心特性

<br/>

<table align="center" width="100%" style="border: none; table-layout: fixed;">
<tr>
<td width="30%" align="center" style="vertical-align: top; padding: 20px;">

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<h3 style="margin: 0; padding: 0;">🚀 <strong>论文转代码</strong></h3>
</div>

<div align="center" style="margin: 15px 0;">
  <img src="https://img.shields.io/badge/算法-实现-ff6b6b?style=for-the-badge&logo=algorithm&logoColor=white" alt="Algorithm Badge" />
</div>

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<p align="center"><strong>复杂算法的自动化实现</strong></p>
</div>

<div style="height: 60px; display: flex; align-items: center; justify-content: center;">
<p align="center">轻松将研究论文中的复杂算法转换为<strong>高质量</strong>、<strong>生产就绪</strong>的代码，加速算法复现。</p>
</div>


</td>
<td width="30%" align="center" style="vertical-align: top; padding: 20px;">

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<h3 style="margin: 0; padding: 0;">🎨 <strong>文本转Web</strong></h3>
</div>

<div align="center" style="margin: 15px 0;">
  <img src="https://img.shields.io/badge/前端-开发-4ecdc4?style=for-the-badge&logo=react&logoColor=white" alt="Frontend Badge" />
</div>

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<p align="center"><strong>自动化前端Web开发</strong></p>
</div>

<div style="height: 60px; display: flex; align-items: center; justify-content: center;">
<p align="center">将纯文本描述转换为<strong>功能完整</strong>、<strong>视觉美观</strong>的前端Web代码，快速创建界面。</p>
</div>


</td>
<td width="30%" align="center" style="vertical-align: top; padding: 20px;">

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<h3 style="margin: 0; padding: 0;">⚙️ <strong>文本转后端</strong></h3>
</div>

<div align="center" style="margin: 15px 0;">
  <img src="https://img.shields.io/badge/后端-开发-9b59b6?style=for-the-badge&logo=server&logoColor=white" alt="Backend Badge" />
</div>

<div style="height: 80px; display: flex; align-items: center; justify-content: center;">
<p align="center"><strong>自动化后端开发</strong></p>
</div>

<div style="height: 60px; display: flex; align-items: center; justify-content: center;">
<p align="center">从简单的文本输入生成<strong>高效</strong>、<strong>可扩展</strong>和<strong>功能丰富</strong>的后端代码，简化服务器端开发。</p>
</div>


</td>
</tr>
</table>

<br/>

---

## 📊 实验结果

<div align="center">
    <img src='./assets/result_main02.jpg' /><br>
</div>
<br/>

我们在[*PaperBench*](https://openai.com/index/paperbench/)基准测试（由OpenAI发布）上评估**DeepCode**，这是一个严格的测试平台，要求AI智能体从头独立复现20篇ICML 2024论文。该基准包含8,316个可评分组件，使用带有分层权重的SimpleJudge进行评估。

我们的实验将DeepCode与四个基线类别进行比较：**(1) 人类专家**，**(2) 最先进商业代码智能体**，**(3) 科学代码智能体**，以及 **(4) 基于LLM的智能体**。

### ① 🧠 人类专家表现（顶级机器学习博士）

**DeepCode: 75.9% vs. 顶级机器学习博士: 72.4% (+3.5%)**

DeepCode在3篇论文的人类评估子集上达到**75.9%**，**比人类专家三次尝试取最优（best-of-3）的基线（72.4%）高出3.5个百分点**。这表明我们的框架不仅达到而且超越了专家级代码复现能力，代表了自主科学软件工程的重要里程碑。

### ② 💼 最先进商业代码智能体

**DeepCode: 84.8% vs. 最佳商业智能体: 58.7% (+26.1%)**

在5篇论文的子集上，DeepCode大幅超越领先的商业编码工具：
- Cursor: 58.4%
- Claude Code: 58.7%
- Codex: 40.0%
- **DeepCode: 84.8%**

这代表了相对于领先商业代码智能体的**+26.1%改进**。所有商业智能体都使用Claude Sonnet 4.5或GPT-5 Codex-high，突出了**DeepCode的卓越架构**——而非基础模型能力——推动了这一性能差距。

### ③ 🔬 科学代码智能体

**DeepCode: 73.5% vs. PaperCoder: 51.1% (+22.4%)**

与最先进的科学代码复现框架PaperCoder（**51.1%**）相比，DeepCode达到**73.5%**，实现了**+22.4个百分点的提升**。这一显著差距验证了我们结合规划、分层任务分解、代码生成和迭代调试的多模块架构优于简单的管道式方法。

### ④ 🤖 基于LLM的智能体

**DeepCode: 73.5% vs. 最佳LLM智能体: 43.3% (+30.2%)**

DeepCode显著超越所有测试的LLM智能体：
- Claude 3.5 Sonnet + IterativeAgent: 27.5%
- o1 + IterativeAgent (36小时): 42.4%
- o1 BasicAgent: 43.3%
- **DeepCode: 73.5%**

相对于表现最佳的LLM智能体的**+30.2%改进**表明，复杂的智能体框架，而非延长的推理时间或更大的模型，对于复杂的代码复现任务至关重要。

---

### 🎯 **自主多智能体工作流**

**面临的挑战**:

- 📄 **实现复杂性**: 将学术论文和复杂算法转换为可运行代码需要大量技术投入和领域专业知识

- 🔬 **研究瓶颈**: 研究人员将宝贵时间花在算法实现上，而不是专注于核心研究和发现工作

- ⏱️ **开发延迟**: 产品团队在概念和可测试原型之间经历长时间等待，减慢创新周期

- 🔄 **重复编码**: 开发者重复实现相似的模式和功能，而不是基于现有解决方案构建

**DeepCode** 通过为常见开发任务提供可靠的自动化来解决这些工作流程低效问题，简化从概念到代码的开发工作流程。

<div align="center">

```mermaid
flowchart LR
    A["📄 研究论文<br/>💬 文本提示<br/>🌐 URL和文档<br/>📎 文件: PDF, DOC, PPTX, TXT, HTML"] --> B["🧠 DeepCode<br/>多智能体引擎"]
    B --> C["🚀 算法实现 <br/>🎨 前端开发 <br/>⚙️ 后端开发"]

    style A fill:#ff6b6b,stroke:#c0392b,stroke-width:2px,color:#000
    style B fill:#00d4ff,stroke:#0984e3,stroke-width:3px,color:#000
    style C fill:#00b894,stroke:#00a085,stroke-width:2px,color:#000
```

</div>

---

## 🏗️ 架构

### 📊 **系统概述**

**DeepCode** 是一个AI驱动的开发平台，自动化代码生成和实现任务。我们的多智能体系统处理将需求转换为功能性、结构良好代码的复杂性，让您专注于创新而非实现细节。

🎯 **技术能力**:

🧬 **研究到生产流水线**<br>
多模态文档分析引擎，从学术论文中提取算法逻辑和数学模型。生成优化的实现，使用适当的数据结构，同时保持计算复杂度特征。

🪄 **自然语言代码合成**<br>
使用在精选代码库上训练的微调语言模型进行上下文感知代码生成。在支持多种编程语言和框架的同时保持模块间架构一致性。

⚡ **自动化原型引擎**<br>
智能脚手架系统，生成包括数据库模式、API端点和前端组件的完整应用程序结构。使用依赖分析确保从初始生成开始的可扩展架构。

💎 **质量保证自动化**<br>
集成静态分析与自动化单元测试生成和文档合成。采用AST分析进行代码正确性检查和基于属性的测试进行全面覆盖。

🔮 **CodeRAG集成系统**<br>
高级检索增强生成，结合语义向量嵌入和基于图的依赖分析。从大规模代码语料库中自动发现最优库和实现模式。

---

### 🔧 **核心技术**

- 🧠 **智能编排智能体**: 协调工作流阶段和分析需求的中央决策系统。采用动态任务规划算法，根据不断发展的项目复杂性实时调整执行策略。为每个实现步骤动态选择最优处理策略。 <br>

- 💾 **高效内存机制**: 高效管理大规模代码上下文的高级上下文工程系统。实现分层内存结构，具有智能压缩功能，用于处理复杂代码库。该组件支持对实现模式的即时检索，并在长时间的开发会话中保持语义一致性。 <br>

- 🔍 **高级CodeRAG系统**: 分析跨存储库复杂相互依赖关系的全局代码理解引擎。执行跨代码库关系映射，从整体角度理解架构模式。该模块利用依赖图和语义分析在实现过程中提供全局感知的代码建议。

---

### 🤖 **DeepCode的多智能体架构**:

- **🎯 中央编排智能体**: 编排整个工作流程执行并做出战略决策。基于输入复杂性分析协调专门智能体。实现动态任务规划和资源分配算法。 <br>

- **📝 意图理解智能体**: 对用户需求进行深度语义分析以解码复杂意图。通过高级NLP处理提取功能规范和技术约束。通过结构化任务分解将模糊的人类描述转换为精确、可操作的开发规范。 <br>

- **📄 文档解析智能体**: 使用高级解析能力处理复杂的技术文档和研究论文。使用文档理解模型提取算法和方法。通过智能内容分析将学术概念转换为实用的实现规范。 <br>

- **🏗️ 代码规划智能体**: 执行架构设计和技术栈优化。动态规划适应性开发路线图。通过自动化设计模式选择执行编码标准并生成模块化结构。<br>

- **🔍 代码参考挖掘智能体**: 通过智能搜索算法发现相关存储库和框架。分析代码库的兼容性和集成潜力。基于相似性度量和自动化依赖分析提供建议。 <br>

- **📚 代码索引智能体**: 构建发现代码库的综合知识图谱。维护代码组件之间的语义关系。实现智能检索和交叉引用能力。 <br>

- **🧬 代码生成智能体**: 将收集的信息合成为可执行的代码实现。创建功能接口并集成发现的组件。生成全面的测试套件和文档以确保可重现性。

---

#### 🛠️ **实现工具矩阵**

**🔧 基于MCP (模型上下文协议) 驱动**

DeepCode利用**模型上下文协议 (MCP)** 标准与各种工具和服务无缝集成。这种标准化方法确保AI智能体和外部系统之间的可靠通信，实现强大的自动化能力。

##### 📡 **MCP服务器和工具**

| 🛠️ **MCP服务器** | 🔧 **主要功能** | 💡 **目的和能力** |
|-------------------|-------------------------|-------------------------------|
| **🔍 brave** | Web搜索引擎 | 通过Brave搜索API进行实时信息检索 |
| **🌐 bocha-mcp** | 替代搜索 | 具有独立API访问的辅助搜索选项 |
| **📂 filesystem** | 文件系统操作 | 本地文件和目录管理，读/写操作 |
| **🌐 fetch** | Web内容检索 | 从URL和Web资源获取和提取内容 |
| **📥 github-downloader** | 存储库管理 | 克隆和下载GitHub存储库进行分析 |
| **📋 file-downloader** | 文档处理 | 下载文件(PDF、DOCX等)并转换为Markdown |
| **⚡ command-executor** | 系统命令 | 执行bash/shell命令进行环境管理 |
| **🧬 code-implementation** | 代码生成中心 | 具有执行和测试的综合代码复现 |
| **📚 code-reference-indexer** | 智能代码搜索 | 代码存储库的智能索引和搜索 |
| **📄 document-segmentation** | 智能文档分析 | 大型论文和技术文档的智能文档分割 |

##### 🔧 **传统工具功能** *(供参考)*

| 🛠️ **功能** | 🎯 **使用上下文** |
|-----------------|---------------------|
| **📄 read_code_mem** | 从内存高效检索代码上下文 |
| **✍️ write_file** | 直接文件内容生成和修改 |
| **🐍 execute_python** | Python代码测试和验证 |
| **📁 get_file_structure** | 项目结构分析和组织 |
| **⚙️ set_workspace** | 动态工作空间和环境配置 |
| **📊 get_operation_history** | 过程监控和操作跟踪 |


---

🎛️ **多界面框架**<br>
具有CLI和Web前端的RESTful API，具有实时代码流、交互式调试和可扩展插件架构，用于CI/CD集成。

**🚀 多智能体智能流水线:**

<div align="center">

### 🌟 **智能处理流程**

<table align="center" width="100%" style="border: none; border-collapse: collapse;">
<tr>
<td colspan="3" align="center" style="padding: 20px; background: linear-gradient(135deg, #667eea 0%, #764ba2 100%); border-radius: 15px; color: white; font-weight: bold;">
💡 <strong>输入层</strong><br/>
📄 研究论文 • 💬 自然语言 • 🌐 URL • 📋 需求
</td>
</tr>
<tr><td colspan="3" height="20"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 15px; background: linear-gradient(135deg, #ff6b6b 0%, #ee5a24 100%); border-radius: 12px; color: white; font-weight: bold;">
🎯 <strong>中央编排</strong><br/>
战略决策制定 • 工作流程协调 • 智能体管理
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #3742fa 0%, #2f3542 100%); border-radius: 10px; color: white; width: 50%;">
📝 <strong>文本分析</strong><br/>
<small>需求处理</small>
</td>
<td width="10"></td>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #8c7ae6 0%, #9c88ff 100%); border-radius: 10px; color: white; width: 50%;">
📄 <strong>文档分析</strong><br/>
<small>论文和规范处理</small>
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 15px; background: linear-gradient(135deg, #00d2d3 0%, #54a0ff 100%); border-radius: 12px; color: white; font-weight: bold;">
📋 <strong>复现规划</strong><br/>
深度论文分析 • 代码需求解析 • 复现策略开发
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #ffa726 0%, #ff7043 100%); border-radius: 10px; color: white; width: 50%;">
🔍 <strong>参考分析</strong><br/>
<small>存储库发现</small>
</td>
<td width="10"></td>
<td align="center" style="padding: 12px; background: linear-gradient(135deg, #e056fd 0%, #f368e0 100%); border-radius: 10px; color: white; width: 50%;">
📚 <strong>代码索引</strong><br/>
<small>知识图谱构建</small>
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 15px; background: linear-gradient(135deg, #26de81 0%, #20bf6b 100%); border-radius: 12px; color: white; font-weight: bold;">
🧬 <strong>代码实现</strong><br/>
实现生成 • 测试 • 文档
</td>
</tr>
<tr><td colspan="3" height="15"></td></tr>
<tr>
<td colspan="3" align="center" style="padding: 20px; background: linear-gradient(135deg, #045de9 0%, #09c6f9 100%); border-radius: 15px; color: white; font-weight: bold;">
⚡ <strong>输出交付</strong><br/>
📦 完整代码库 • 🧪 测试套件 • 📚 文档 • 🚀 部署就绪
</td>
</tr>
</table>

</div>

<div align="center">
<br/>

### 🔄 **流程智能特性**

<table align="center" style="border: none;">
<tr>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #ff6b6b;">
<h4>🎯 自适应流程</h4>
<p><small>基于输入复杂性的动态智能体选择</small></p>
</div>
</td>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #4ecdc4;">
<h4>🧠 智能协调</h4>
<p><small>智能任务分配和并行处理</small></p>
</div>
</td>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #45b7d1;">
<h4>🔍 上下文感知</h4>
<p><small>通过CodeRAG集成的深度理解</small></p>
</div>
</td>
<td align="center" width="25%" style="padding: 15px;">
<div style="background: #f8f9fa; border-radius: 10px; padding: 15px; border-left: 4px solid #96ceb4;">
<h4>⚡ 质量保证</h4>
<p><small>全程自动化测试和验证</small></p>
</div>
</td>
</tr>
</table>

</div>

---

## 🚀 快速开始

### 📋 **前置条件**

在安装 DeepCode 之前，请确保您已安装以下软件：

| 要求 | 版本 | 用途 |
|------|------|------|
| **Python** | 3.9+ | 核心运行环境 |
| **Node.js** | 18+ | 新版 UI 前端 |
| **npm** | 8+ | 包管理工具 |

```bash
# 检查您的版本
python --version   # 应为 3.9+
node --version     # 应为 18+
npm --version      # 应为 8+
```

<details>
<summary><strong>📥 安装 Node.js（如果未安装）</strong></summary>

```bash
# macOS (使用 Homebrew)
brew install node

# Ubuntu/Debian
curl -fsSL https://deb.nodesource.com/setup_20.x | sudo -E bash -
sudo apt-get install -y nodejs

# Windows
# 从 https://nodejs.org/ 下载安装
```

</details>

### 📦 **步骤1: 安装**

选择以下任一安装方式：

#### ⚡ **直接安装 (推荐)**

```bash
# 🚀 直接安装 DeepCode 包
pip install deepcode-hku

# 🔑 下载配置文件
curl -O https://raw.githubusercontent.com/HKUDS/DeepCode/main/mcp_agent.config.yaml
curl -o mcp_agent.secrets.yaml https://raw.githubusercontent.com/HKUDS/DeepCode/main/mcp_agent.secrets.yaml.example
```

#### 🔧 **开发安装 (从源码)**

<details>
<summary><strong>📂 点击展开开发安装选项</strong></summary>

##### 🔥 **使用 UV (开发推荐)**

```bash
git clone https://github.com/HKUDS/DeepCode.git
cd DeepCode/

curl -LsSf https://astral.sh/uv/install.sh | sh
uv venv --python=3.13
source .venv/bin/activate  # Windows下: .venv\Scripts\activate
uv pip install -r requirements.txt

# 安装前端依赖
npm install --prefix new_ui/frontend
```

##### 🐍 **使用传统 pip**

```bash
git clone https://github.com/HKUDS/DeepCode.git
cd DeepCode/

pip install -r requirements.txt

# 安装前端依赖
npm install --prefix new_ui/frontend
```

</details>

### 🔧 **步骤2: 配置**

> 以下配置适用于**所有安装方式**（pip、UV、源码安装和 Docker 均通用）。

#### 🔑 API 密钥 *（必需）*

编辑 `mcp_agent.secrets.yaml`，填入你的 API 密钥：

```yaml
# 至少需要配置一个 LLM 提供商的 API Key
openai:
  api_key: "your_openai_api_key"
  base_url: "https://openrouter.ai/api/v1"  # 可选: 用于 OpenRouter 或自定义端点

anthropic:
  api_key: "your_anthropic_api_key"  # 用于 Claude 模型

google:
  api_key: "your_google_api_key"     # 用于 Gemini 模型
```

#### 🤖 LLM 提供商 *（可选）*

编辑 `mcp_agent.config.yaml` 选择你偏好的 LLM 提供商（第 ~106 行）：

```yaml
# 选项: "google", "anthropic", "openai"
# 如果未设置或不可用，将自动回退到第一个可用的提供商
llm_provider: "google"
```

#### 🔍 搜索 API 密钥 *（可选）*

在 `mcp_agent.config.yaml` 中配置 Web 搜索：

```yaml
# Brave 搜索 (默认) — 在 brave.env 部分设置 (第 ~28 行)
brave:
  env:
    BRAVE_API_KEY: "your_brave_api_key_here"

# Bocha-MCP (替代) — 在 bocha-mcp.env 部分设置 (第 ~74 行)
bocha-mcp:
  env:
    BOCHA_API_KEY: "your_bocha_api_key_here"
```

#### 📄 文档分割 *（可选）*

在 `mcp_agent.config.yaml` 中控制文档处理：

```yaml
document_segmentation:
  enabled: true          # true/false — 是否使用智能文档分割
  size_threshold_chars: 50000  # 触发分割的文档大小阈值
```

<details>
<summary><strong>🪟 Windows 用户: 额外的 MCP 服务器配置</strong></summary>

如果您使用 Windows，可能需要在 `mcp_agent.config.yaml` 中手动配置 MCP 服务器:

```bash
# 1. 全局安装 MCP 服务器
npm i -g @modelcontextprotocol/server-brave-search
npm i -g @modelcontextprotocol/server-filesystem

# 2. 找到您的全局 node_modules 路径
npm -g root
```

然后更新您的 `mcp_agent.config.yaml` 使用绝对路径:

```yaml
mcp:
  servers:
    brave:
      command: "node"
      args: ["C:/Program Files/nodejs/node_modules/@modelcontextprotocol/server-brave-search/dist/index.js"]
    filesystem:
      command: "node"
      args: ["C:/Program Files/nodejs/node_modules/@modelcontextprotocol/server-filesystem/dist/index.js", "."]
```

> **注意**: 将路径替换为步骤 2 中您实际的全局 node_modules 路径。

</details>

<details>
<summary><strong>🔍 搜索服务器配置（可选）</strong></summary>

DeepCode 支持多个搜索服务器进行 Web 搜索功能。您可以在 `mcp_agent.config.yaml` 中配置首选选项:

```yaml
# 默认搜索服务器配置
# 选项: "brave" 或 "bocha-mcp"
default_search_server: "brave"
```

**可用选项:**
- **🔍 Brave 搜索** (`"brave"`): 具有高质量搜索结果的默认选项。需要 `BRAVE_API_KEY`。推荐给大多数用户。
- **🌐 Bocha-MCP** (`"bocha-mcp"`): 替代搜索服务器。需要 `BOCHA_API_KEY`。使用本地 Python 服务器实现。

**完整 MCP 服务器配置（mcp_agent.config.yaml）:**
```yaml
# Brave 搜索 (默认) - 第 28 行左右
brave:
  command: "npx"
  args: ["-y", "@modelcontextprotocol/server-brave-search"]
  env:
    BRAVE_API_KEY: "your_brave_api_key_here"

# Bocha-MCP (替代) - 第 74 行左右
bocha-mcp:
  command: "python"
  args: ["tools/bocha_search_server.py"]
  env:
    PYTHONPATH: "."
    BOCHA_API_KEY: "your_bocha_api_key_here"
```

> **💡 提示**: 两个搜索服务器都需要 API 密钥配置。选择最适合您的 API 访问和需求的选项。

</details>

### ⚡ **步骤3: 启动应用程序**

选择您偏好的启动方式：

<table width="100%">
<tr>
<th width="33%">🐳 Docker (推荐)</th>
<th width="33%">🚀 本地 (<code>deepcode</code> 命令)</th>
<th width="33%">🛠️ 其他方式</th>
</tr>
<tr><td>

无需 Python/Node — 一切在容器内。

```bash
git clone https://github.com/HKUDS/DeepCode.git
cd DeepCode/
cp mcp_agent.secrets.yaml.example \
   mcp_agent.secrets.yaml
# 编辑填入 API Key

./deepcode_docker/run_docker.sh
# 访问 → http://localhost:8000
```

</td><td>

首次运行自动安装依赖。

```bash
deepcode
# 前端 → http://localhost:5173
# 后端 → http://localhost:8000
# Ctrl+C 停止
```

特性：用户交互循环、实时进度、内联对话。

</td><td>

```bash
# macOS / Linux
./run.sh
# 或: python deepcode.py

# Windows
run.bat
# 或: python deepcode.py

# 经典 Streamlit UI
deepcode --classic

# CLI 模式
deepcode --cli
# 或: python cli/main_cli.py
```

</td></tr>
</table>

<details>
<summary><strong>🐳 Docker 管理命令</strong></summary>

```bash
./deepcode_docker/run_docker.sh stop      # 停止
./deepcode_docker/run_docker.sh restart   # 重启（配置更改无需重建）
./deepcode_docker/run_docker.sh --build   # 强制重建
./deepcode_docker/run_docker.sh logs      # 实时日志
./deepcode_docker/run_docker.sh status    # 健康检查
./deepcode_docker/run_docker.sh clean     # 删除容器和镜像
```

或直接使用 Docker Compose：
```bash
docker compose -f deepcode_docker/docker-compose.yml up --build   # 构建并启动
docker compose -f deepcode_docker/docker-compose.yml down         # 停止
docker compose -f deepcode_docker/docker-compose.yml logs -f      # 查看日志
```

> **💡** 配置文件以卷方式挂载 — 编辑后重启即可，无需重建。
> **💡** Windows 用户：如果脚本不可用，可直接运行 `docker compose` 命令。

</details>

### 🎯 **步骤4: 生成代码**

1. **📄 输入** — 上传研究论文、输入需求，或粘贴 URL
2. **🤖 处理** — 多智能体系统分析、规划并生成
3. **⚡ 输出** — 接收带测试和文档的生产就绪代码

---

### 🔧 **常见问题排查**

<details>
<summary><strong>❓ 常见问题与解决方案</strong></summary>

| 问题 | 原因 | 解决方案 |
|---|---|---|
| Docker 构建失败 `tsc: not found` | 构建缓存损坏 | `docker builder prune -f` 然后用 `--no-cache` 重建 |
| `error during connect` / `cannot find the file` | Docker Desktop 未运行 | 启动 Docker Desktop，等待就绪后重试 |
| 前端空白页面 | `node_modules` 损坏 | `cd new_ui/frontend && rm -rf node_modules && npm install` |
| `ERR_CONNECTION_REFUSED` | 端口错误/后端未运行 | Docker: `http://localhost:8000`。本地: `http://localhost:5173` |
| `npm install` → `Could not read package.json` | 目录错误 | 使用 `npm install --prefix new_ui/frontend` |
| Windows: MCP 服务器无法工作 | 需要绝对路径 | 参见上方 [Windows MCP 配置](#-步骤2-配置) |

</details>

---

## 🤖 nanobot 集成（飞书聊天机器人）

**直接在飞书中使用 DeepCode — 发送消息，获取代码！**

[nanobot](https://github.com/HKUDS/nanobot) 是一个超轻量级 AI 助手，现已与 DeepCode 深度集成。通过飞书聊天，您可以：
- 🚀 提交**论文转代码**任务（`paper2code`）— 粘贴 arXiv 链接即可
- 💬 启动**对话转代码**（`chat2code`）— 用自然语言描述需求
- 📊 实时查询任务状态（`deepcode_status`）— 获取进度和结果
- ✅ 响应 DeepCode 交互提示 — 当 AI 需要澄清需求时直接在聊天中回答

### 🏗️ 架构概览

```mermaid
flowchart TB
    subgraph ChatPlatforms[💬 聊天平台]
        Feishu[<b>飞书</b><br/>📱 当前支持]
        Telegram[Telegram<br/>🔜 即将支持]
        Discord[Discord<br/>🔜 即将支持]
    end

    subgraph NanobotCore[🤖 Nanobot 核心]
        LLM[LLM 推理引擎<br/>Claude / GPT / Minimax]
        Tools[工具层<br/>web_fetch / code_executor / deepcode]
    end

    subgraph DeepCodeEngine[⚡ DeepCode 引擎]
        API[HTTP API<br/>任务提交 & 查询]
        Agents[多智能体系统<br/>规划 / 分析 / 生成]
        Output[代码输出<br/>测试 + 文档]
    end

    Feishu -->|WebSocket| NanobotCore
    Telegram -.->|未来集成| NanobotCore
    Discord -.->|未来集成| NanobotCore

    NanobotCore -->|调用 deepcode_* 工具| DeepCodeEngine
    DeepCodeEngine -->|返回结果 & 进度| NanobotCore
    NanobotCore -->|推送消息| Feishu

    style Feishu fill:#0EA5E9,stroke:#0284c7,stroke-width:3px,color:#fff
    style NanobotCore fill:#8b5cf6,stroke:#7c3aed,stroke-width:2px,color:#fff
    style DeepCodeEngine fill:#10b981,stroke:#059669,stroke-width:2px,color:#fff
    style Telegram fill:#d1d5db,stroke:#9ca3af,stroke-width:1px,color:#4b5563,stroke-dasharray: 5 5
    style Discord fill:#d1d5db,stroke:#9ca3af,stroke-width:1px,color:#4b5563,stroke-dasharray: 5 5
```

> 🎯 **当前支持**: 飞书（Feishu / Lark）
> 🔮 **架构预留**: Telegram 和 Discord 节点为未来扩展保留

---

### 📋 前置条件

- ✅ DeepCode 后端正在运行（见上方 [快速开始](#-快速开始)）
- ✅ 飞书企业应用（或租用应用）— 免费创建
- ✅ LLM API 密钥（OpenRouter / Claude / Minimax）

---

### 🚀 三步完成设置

#### **Step 1 · 创建飞书机器人**

<details>
<summary><strong>📱 点击展开飞书应用创建步骤</strong></summary>

1. 登录 [飞书开放平台](https://open.feishu.cn/app)
2. 点击 **创建企业自建应用**
3. 填写应用名称和描述，上传图标
4. 进入 **凭证与基础信息** 页面，复制：
   - `App ID`
   - `App Secret`
5. 进入 **事件订阅** 页面：
   - **请求地址 URL**: `http://your-server-ip:8081/feishu/event`（公网可访问）
   - **消息加密**: 复制 `Encrypt Key` 和 `Verification Token`
6. 进入 **权限管理**，开通以下权限：
   - `im:message`（接收消息）
   - `im:message:send_as_bot`（发送消息）
   - `im:chat`（获取群信息）
7. **发布版本** → 等待管理员审核通过

> 💡 **开发环境**: 可使用 [ngrok](https://ngrok.com/) 或 [localhost.run](https://localhost.run/) 将本地 8081 端口映射到公网。

</details>

---

#### **Step 2 · 配置**

编辑项目根目录的 `nanobot_config.json`:

```json
{
  "channels": [
    {
      "type": "feishu",
      "app_id": "cli_xxxxxxxxxxxxx",
      "app_secret": "your_app_secret",
      "encrypt_key": "your_encrypt_key",
      "verification_token": "your_verification_token"
    }
  ],
  "llm": {
    "provider": "openai",  // 或 "anthropic" / "minimax"
    "model": "openai/gpt-4o",  // 推荐英文模型
    "api_key": "your_api_key",
    "base_url": "https://openrouter.ai/api/v1"  // 可选
  },
  "deepcode": {
    "api_url": "http://localhost:8000"  // DeepCode 后端地址
  }
}
```

> 💡 **提示**: 使用 `nanobot_config.json.example` 作为模板。上例中的 `//` 注释仅用于说明；标准 JSON 不支持注释，写入实际配置文件前请将其删除。

---

#### **Step 3 · 启动**

确保 DeepCode 后端已运行，然后启动 nanobot:

```bash
cd DeepCode/
./nanobot/run_nanobot.sh
```

**Docker Compose 模式** (同时启动 DeepCode + nanobot):

```bash
docker compose -f deepcode_docker/docker-compose.yml up -d
```

访问飞书，找到你的机器人，发送消息测试：

```
hi
```

如果收到回复，说明配置成功！🎉

---

### 💡 使用示例

| 操作 | 命令示例 |
|---|---|
| **论文转代码** | `paper2code https://arxiv.org/abs/2104.09864` |
| **对话转代码** | `chat2code 实现一个计算斐波那契数列的 Python 函数` |
| **查询任务状态** | `deepcode_status task_abc123` |
| **响应交互** | 当 AI 询问"需要测试用例吗？"时直接回复 `是` 或 `否` |

---

<details>
<summary><strong>🛠️ nanobot 管理命令</strong></summary>

```bash
# 查看日志（Docker 模式）
docker compose -f deepcode_docker/docker-compose.yml logs -f nanobot

# 重启 nanobot（Docker 模式）
docker compose -f deepcode_docker/docker-compose.yml restart nanobot

# 停止所有服务（Docker 模式）
docker compose -f deepcode_docker/docker-compose.yml down
```

</details>

---

<details>
<summary><strong>🔧 常见问题（nanobot）</strong></summary>

| 问题 | 解决方案 |
|---|---|
| nanobot 响应为中文 | 修改 `nanobot_config.json` 中 `llm.model` 为英文模型（如 `gpt-4o`） |
| 飞书收不到消息 | 检查事件订阅 URL 是否可公网访问，端口 8081 是否开放 |
| DeepCode 任务提交失败 | 确认 `deepcode.api_url` 正确，后端正在运行 |
| nanobot 容器无法启动 | 检查 `nanobot_config.json` 格式是否正确（使用 JSON 验证器） |

</details>

---

## 💡 示例


### 🎬 **实时演示**


<table align="center">
<tr>
<td width="33%" align="center">

#### 📄 **论文转代码演示**
**研究到实现**

<div align="center">
  <a href="https://www.youtube.com/watch?v=MQZYpLkzsbw">
    <img src="https://img.youtube.com/vi/MQZYpLkzsbw/maxresdefault.jpg" alt="Paper2Code Demo" width="100%" style="border-radius: 10px; box-shadow: 0 4px 8px rgba(0,0,0,0.1);"/>
  </a>

  **[▶️ 观看演示](https://www.youtube.com/watch?v=MQZYpLkzsbw)**

  *自动将学术论文转换为生产就绪代码*
</div>

</td>
<td width="33%" align="center">

#### 🖼️ **图像处理演示**
**AI驱动的图像工具**

<div align="center">
  <a href="https://www.youtube.com/watch?v=nFt5mLaMEac">
    <img src="https://img.youtube.com/vi/nFt5mLaMEac/maxresdefault.jpg" alt="Image Processing Demo" width="100%" style="border-radius: 10px; box-shadow: 0 4px 8px rgba(0,0,0,0.1);"/>
  </a>

  **[▶️ 观看演示](https://www.youtube.com/watch?v=nFt5mLaMEac)**

  *智能图像处理，具有背景移除和增强功能*
</div>

</td>
<td width="33%" align="center">

#### 🌐 **前端实现**
**完整Web应用程序**

<div align="center">
  <a href="https://www.youtube.com/watch?v=78wx3dkTaAU">
    <img src="https://img.youtube.com/vi/78wx3dkTaAU/maxresdefault.jpg" alt="Frontend Demo" width="100%" style="border-radius: 10px; box-shadow: 0 4px 8px rgba(0,0,0,0.1);"/>
  </a>

  **[▶️ 观看演示](https://www.youtube.com/watch?v=78wx3dkTaAU)**

  *从概念到部署的全栈Web开发*
</div>

</td>
</tr>
</table>


### 🆕 **最新更新**

#### 📄 **智能文档分割 (v1.2.0)**
- **智能处理**: 自动处理超出LLM令牌限制的大型研究论文和技术文档
- **可配置控制**: 通过配置切换分割功能，具有基于大小的阈值
- **语义分析**: 高级内容理解，保留算法、概念和公式
- **向后兼容**: 对较小文档无缝回退到传统处理

### 🚀 **即将推出**

我们正在持续为 DeepCode 增加令人兴奋的新功能：

#### 🔧 **增强的代码可靠性和验证**
- **自动化测试**: 具有执行验证和错误检测的全面功能测试。
- **代码质量保证**: 通过静态分析、动态测试和性能基准测试进行多级验证。
- **智能调试**: AI驱动的错误检测，具有自动纠正建议

#### 📊 **PaperBench性能展示**
- **基准仪表板**: PaperBench评估套件的综合性能指标。
- **准确性指标**: 与最先进的论文复现系统的详细比较。
- **成功分析**: 跨论文类别和复杂度水平的统计分析。

#### ⚡ **系统级优化**
- **性能提升**: 多线程处理和优化智能体协调，实现更快的生成。
- **增强推理**: 具有改进上下文理解的高级推理能力。
- **扩展支持**: 扩展与其他编程语言和框架的兼容性。

---

## ⭐ 星标历史

<div align="center">

*社区增长轨迹*

<a href="https://star-history.com/#HKUDS/DeepCode&Date">
  <picture>
    <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/svg?repos=HKUDS/DeepCode&type=Date&theme=dark" />
    <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/svg?repos=HKUDS/DeepCode&type=Date" />
    <img alt="Star History Chart" src="https://api.star-history.com/svg?repos=HKUDS/DeepCode&type=Date" style="border-radius: 15px; box-shadow: 0 0 30px rgba(0, 217, 255, 0.3);" />
  </picture>
</a>

</div>

---

### 🚀 **准备好变革开发方式了吗？**

<div align="center">

<p>
  <a href="#-快速开始"><img src="https://img.shields.io/badge/🚀_立即开始-00d4ff?style=for-the-badge&logo=rocket&logoColor=white" alt="Get Started"></a>
  <a href="https://github.com/HKUDS"><img src="https://img.shields.io/badge/🏛️_在GitHub上查看-00d4ff?style=for-the-badge&logo=github&logoColor=white" alt="View on GitHub"></a>
  <a href="https://github.com/HKUDS/deepcode-agent"><img src="https://img.shields.io/badge/⭐_星标项目-00d4ff?style=for-the-badge&logo=star&logoColor=white" alt="Star Project"></a>
</p>

---

### 📄 **许可证**

<img src="https://img.shields.io/badge/License-MIT-4ecdc4?style=for-the-badge&logo=opensourceinitiative&logoColor=white" alt="MIT License">

**MIT许可证** - 版权所有 (c) 2025 香港大学数据智能实验室

---


<img src="https://visitor-badge.laobi.icu/badge?page_id=deepcode.readme&style=for-the-badge&color=00d4ff" alt="Visitors">

</div>


================================================
FILE: __init__.py
================================================
"""
DeepCode - AI Research Engine

🧬 Next-Generation AI Research Automation Platform
⚡ Transform research papers into working code automatically
"""

# Package metadata.
__version__ = "1.2.0"
__author__ = "DeepCode Team"
__url__ = "https://github.com/HKUDS/DeepCode"
# NOTE(review): this points at a different GitHub account than __url__ and is
# not listed in __all__ below - confirm whether both are intentional.
__repo__ = "https://github.com/Jany-M/DeepCode/"

# Import main components for easy access
from utils import FileProcessor, DialogueLogger

# Names exported by a star-import of this package.
__all__ = [
    "FileProcessor",
    "DialogueLogger",
    "__version__",
    "__author__",
    "__url__",
]


================================================
FILE: cli/__init__.py
================================================
"""
CLI Module for DeepCode Agent
DeepCode智能体CLI模块

包含以下组件 / Contains the following components:
- cli_app: CLI应用主程序 / CLI application main program
- cli_interface: CLI界面组件 / CLI interface components
- cli_launcher: CLI启动器 / CLI launcher
"""

# Metadata for the CLI subpackage.
__version__ = "1.0.0"
__author__ = "DeepCode Team - Data Intelligence Lab @ HKU"

# Re-export the two entry points (under distinct aliases, since both modules
# call theirs `main`) and the interface class at package level.
from .cli_app import main as cli_main
from .cli_interface import CLIInterface
from .cli_launcher import main as launcher_main

# Names exported by a star-import of the `cli` package.
__all__ = ["cli_main", "CLIInterface", "launcher_main"]


================================================
FILE: cli/cli_app.py
================================================
#!/usr/bin/env python3
"""
DeepCode - CLI Application Main Program
深度代码 - CLI应用主程序

🧬 Open-Source Code Agent by Data Intelligence Lab @ HKU
⚡ Revolutionizing research reproducibility through collaborative AI
"""

import os
import sys
import asyncio
import time
import json

# Disable .pyc generation.
# The environment variable is only consulted when an interpreter starts, so
# setting it here affects child Python processes but not this one; the sys
# flag is what stops the already-running interpreter from writing bytecode.
os.environ["PYTHONDONTWRITEBYTECODE"] = "1"
sys.dont_write_bytecode = True

# Put the project root (the parent of this file's directory) on sys.path so
# that the absolute `cli.*` imports below resolve when this file is run
# directly as a script.
current_dir = os.path.dirname(os.path.abspath(__file__))
parent_dir = os.path.dirname(current_dir)
if parent_dir not in sys.path:
    sys.path.insert(0, parent_dir)

# 导入MCP应用和工作流

from cli.workflows import CLIWorkflowAdapter
from cli.cli_interface import CLIInterface, Colors


class CLIApp:
    """CLI应用主类 - 升级版智能体编排引擎"""

    def __init__(self):
        """Create the terminal interface and the workflow adapter bound to it."""
        interface = CLIInterface()
        self.cli = interface
        self.workflow_adapter = CLIWorkflowAdapter(cli_interface=interface)

        # Runtime handles start out unset.
        self.app = None  # Will be initialized by workflow adapter
        self.logger = None
        self.context = None
        # Document segmentation will be managed by CLI interface

    async def initialize_mcp_app(self):
        """初始化MCP应用 - 使用工作流适配器"""
        # Workflow adapter will handle MCP initialization
        return await self.workflow_adapter.initialize_mcp_app()

    async def cleanup_mcp_app(self):
        """清理MCP应用 - 使用工作流适配器"""
        await self.workflow_adapter.cleanup_mcp_app()

    async def process_requirement_analysis_non_interactive(self, initial_idea: str):
        """处理需求分析工作流（非交互式，用于命令行参数） (NEW: matching UI version)"""
        try:
            self.cli.print_separator()
            self.cli.print_status(
                "🧠 Starting requirement analysis workflow...", "info"
            )

            # Step 1: Generate guiding questions
            self.cli.print_status(
                "🤖 Generating AI-guided questions to refine your requirements...",
                "processing",
            )

            questions_result = (
                await self.workflow_adapter.execute_requirement_analysis_workflow(
                    user_input=initial_idea, analysis_mode="generate_questions"
                )
            )

            if questions_result["status"] != "success":
                self.cli.print_status(
                    f"❌ Failed to generate questions: {questions_result.get('error', 'Unknown error')}",
                    "error",
                )
                return questions_result

            # Step 2: Display questions
            questions_json = questions_result["result"]
            self.cli.display_guiding_questions(questions_json)

            # For non-interactive mode, we can't get user answers, so we provide a summary
            self.cli.print_status(
                "ℹ️  In non-interactive mode, using initial idea for implementation",
                "info",
            )
            self.cli.print_status(
                "💡 For guided analysis, please use interactive mode (python main_cli.py)",
                "info",
            )

            # Proceed directly with the initial idea as the requirement
            self.cli.print_status(
                "🚀 Starting code implementation based on initial requirements...",
                "processing",
            )

            implementation_result = await self.process_input(initial_idea, "chat")

            return {
                "status": "success",
                "questions_generated": questions_result,
                "implementation": implementation_result,
            }

        except Exception as e:
            error_msg = str(e)
            self.cli.print_error_box("Requirement Analysis Error", error_msg)
            self.cli.print_status(
                f"Error during requirement analysis: {error_msg}", "error"
            )

            return {"status": "error", "error": error_msg}

    async def process_requirement_analysis(self):
        """处理需求分析工作流（交互式） (NEW: matching UI version)"""
        try:
            # Step 1: Get initial requirements from user
            self.cli.print_separator()
            self.cli.print_status(
                "🧠 Starting requirement analysis workflow...", "info"
            )

            user_input = self.cli.get_requirement_analysis_input()

            if not user_input:
                self.cli.print_status("Requirement analysis cancelled", "warning")
                return {"status": "cancelled"}

            # Step 2: Generate guiding questions
            self.cli.print_status(
                "🤖 Generating AI-guided questions to refine your requirements...",
                "processing",
            )

            questions_result = (
                await self.workflow_adapter.execute_requirement_analysis_workflow(
                    user_input=user_input, analysis_mode="generate_questions"
                )
            )

            if questions_result["status"] != "success":
                self.cli.print_status(
                    f"❌ Failed to generate questions: {questions_result.get('error', 'Unknown error')}",
                    "error",
                )
                return questions_result

            # Step 3: Display questions and get user answers
            questions_json = questions_result["result"]
            self.cli.display_guiding_questions(questions_json)

            # Ask if user wants to answer the questions
            proceed = (
                input(
                    f"\n{Colors.BOLD}{Colors.YELLOW}Would you like to answer these questions? (y/n):{Colors.ENDC} "
                )
                .strip()
                .lower()
            )

            if proceed != "y":
                self.cli.print_status(
                    "You can still use the initial requirements for chat input",
                    "info",
                )
                return {"status": "partial", "initial_requirements": user_input}

            user_answers = self.cli.get_question_answers(questions_json)

            # Step 4: Generate requirement summary
            self.cli.print_status(
                "📄 Generating detailed requirement document...", "processing"
            )

            summary_result = (
                await self.workflow_adapter.execute_requirement_analysis_workflow(
                    user_input=user_input,
                    analysis_mode="summarize_requirements",
                    user_answers=user_answers,
                )
            )

            if summary_result["status"] != "success":
                self.cli.print_status(
                    f"❌ Failed to generate summary: {summary_result.get('error', 'Unknown error')}",
                    "error",
                )
                return summary_result

            # Step 5: Display requirement summary
            requirement_summary = summary_result["result"]
            should_proceed = self.cli.display_requirement_summary(requirement_summary)

            if should_proceed:
                # Step 6: Proceed with chat-based implementation
                self.cli.print_status(
                    "🚀 Starting code implementation based on analyzed requirements...",
                    "processing",
                )

                implementation_result = await self.process_input(
                    requirement_summary, "chat"
                )

                return {
                    "status": "success",
                    "requirement_analysis": summary_result,
                    "implementation": implementation_result,
                }
            else:
                self.cli.print_status(
                    "Requirement analysis completed. Implementation skipped.", "info"
                )
                return {
                    "status": "success",
                    "requirement_analysis": summary_result,
                    "implementation": None,
                }

        except Exception as e:
            error_msg = str(e)
            self.cli.print_error_box("Requirement Analysis Error", error_msg)
            self.cli.print_status(
                f"Error during requirement analysis: {error_msg}", "error"
            )

            return {"status": "error", "error": error_msg}

    async def process_input(self, input_source: str, input_type: str):
        """处理输入源（URL或文件）- 使用升级版智能体编排引擎"""
        try:
            # Document segmentation configuration is managed by CLI interface

            self.cli.print_separator()
            self.cli.print_status(
                "🚀 Starting intelligent agent orchestration...", "processing"
            )

            # 显示处理阶段（根据配置决定）
            chat_mode = input_type == "chat"
            self.cli.display_processing_stages(
                0, self.cli.enable_indexing, chat_mode=chat_mode
            )

            # 使用工作流适配器进行处理
            result = await self.workflow_adapter.process_input_with_orchestration(
                input_source=input_source,
                input_type=input_type,
                enable_indexing=self.cli.enable_indexing,
            )

            if result["status"] == "success":
                # 显示完成状态
                if chat_mode:
                    final_stage = 4
                else:
                    final_stage = 8 if self.cli.enable_indexing else 5
                self.cli.display_processing_stages(
                    final_stage, self.cli.enable_indexing, chat_mode=chat_mode
                )
                self.cli.print_status(
                    "🎉 Agent orchestration completed successfully!", "complete"
                )

                # 显示结果
                self.display_results(
                    result.get("analysis_result", ""),
                    result.get("download_result", ""),
                    result.get("repo_result", ""),
                    result.get("pipeline_mode", "comprehensive"),
                )
            else:
                self.cli.print_status(
                    f"❌ Processing failed: {result.get('error', 'Unknown error')}",
                    "error",
                )

            # 添加到历史记录
            self.cli.add_to_history(input_source, result)

            return result

        except Exception as e:
            error_msg = str(e)
            self.cli.print_error_box("Agent Orchestration Error", error_msg)
            self.cli.print_status(f"Error during orchestration: {error_msg}", "error")

            # 添加错误到历史记录
            error_result = {"status": "error", "error": error_msg}
            self.cli.add_to_history(input_source, error_result)

            return error_result

    def display_results(
        self,
        analysis_result: str,
        download_result: str,
        repo_result: str,
        pipeline_mode: str = "comprehensive",
    ):
        """Print a summary of one orchestration run to the terminal.

        ``None`` or non-string phase results are converted to text before
        display, so a workflow that returns e.g. ``None`` for a phase does not
        make this method raise after an otherwise successful run.

        Args:
            analysis_result: Analysis-phase output. Text starting with ``{``
                is parsed as JSON and pretty-printed in full; anything else
                (or text that fails to parse) is shown as a preview.
            download_result: Download-phase output, shown as a preview.
            repo_result: Implementation-phase output, shown as a preview. If
                it contains ``"Code generated in:"``, the rest of that line is
                printed as the generated code directory.
            pipeline_mode: ``"chat"``, ``"comprehensive"``, or any other value
                (displayed as optimized mode).
        """
        preview_limit = 1000  # maximum characters shown per phase result

        def as_text(value):
            """Coerce a phase result to text; ``None`` becomes an empty string."""
            if value is None:
                return ""
            return value if isinstance(value, str) else str(value)

        def preview(text):
            """Return *text* cut to the preview limit, with "..." when truncated."""
            if len(text) > preview_limit:
                return text[:preview_limit] + "..."
            return text

        analysis_text = as_text(analysis_result)
        download_text = as_text(download_result)
        repo_text = as_text(repo_result)

        self.cli.print_results_header()

        # Pipeline mode banner
        if pipeline_mode == "chat":
            mode_display = "💬 Chat Planning Mode"
        elif pipeline_mode == "comprehensive":
            mode_display = "🧠 Comprehensive Mode"
        else:
            mode_display = "⚡ Optimized Mode"
        print(
            f"{Colors.BOLD}{Colors.PURPLE}🤖 PIPELINE MODE: {mode_display}{Colors.ENDC}"
        )
        self.cli.print_separator("─", 79, Colors.PURPLE)

        print(f"{Colors.BOLD}{Colors.OKCYAN}📊 ANALYSIS PHASE RESULTS:{Colors.ENDC}")
        self.cli.print_separator("─", 79, Colors.CYAN)

        # Pretty-print JSON-looking analysis output; otherwise fall back to a
        # plain preview.
        formatted_analysis = None
        if analysis_text.strip().startswith("{"):
            try:
                formatted_analysis = json.dumps(
                    json.loads(analysis_text), indent=2, ensure_ascii=False
                )
            except (ValueError, RecursionError):
                # Not valid JSON after all (or too deeply nested to parse).
                formatted_analysis = None
        print(
            formatted_analysis
            if formatted_analysis is not None
            else preview(analysis_text)
        )

        print(f"\n{Colors.BOLD}{Colors.PURPLE}📥 DOWNLOAD PHASE RESULTS:{Colors.ENDC}")
        self.cli.print_separator("─", 79, Colors.PURPLE)
        print(preview(download_text))

        print(
            f"\n{Colors.BOLD}{Colors.GREEN}⚙️  IMPLEMENTATION PHASE RESULTS:{Colors.ENDC}"
        )
        self.cli.print_separator("─", 79, Colors.GREEN)
        print(preview(repo_text))

        # Extract the generated code directory: the remainder of the line
        # following the last "Code generated in:" marker.
        if "Code generated in:" in repo_text:
            code_dir = (
                repo_text.split("Code generated in:")[-1].strip().split("\n")[0]
            )
            print(
                f"\n{Colors.BOLD}{Colors.YELLOW}📁 Generated Code Directory: {Colors.ENDC}{code_dir}"
            )

        # List the workflow stages for this pipeline variant.
        print(
            f"\n{Colors.BOLD}{Colors.OKCYAN}🔄 COMPLETED WORKFLOW STAGES:{Colors.ENDC}"
        )

        if pipeline_mode == "chat":
            stages = [
                "🚀 Engine Initialization",
                "💬 Requirements Analysis",
                "🏗️ Workspace Setup",
                "📝 Implementation Plan Generation",
                "⚙️ Code Implementation",
            ]
        else:
            stages = [
                "📄 Document Processing",
                "🔍 Reference Analysis",
                "📋 Plan Generation",
                "📦 Repository Download",
                "🗂️ Codebase Indexing",
                "⚙️ Code Implementation",
            ]

        for stage in stages:
            print(f"  ✅ {stage}")

        self.cli.print_separator()

    async def run_interactive_session(self):
        """运行交互式会话"""
        # 清屏并显示启动界面
        self.cli.clear_screen()
        self.cli.print_logo()
        self.cli.print_welcome_banner()

        # 初始化MCP应用
        await self.initialize_mcp_app()

        try:
            # 主交互循环
            while self.cli.is_running:
                self.cli.create_menu()
                choice = self.cli.get_user_input()

                if choice in ["q", "quit", "exit"]:
                    self.cli.print_goodbye()
                    break

                elif choice in ["u", "url"]:
                    url = self.cli.get_url_input()
                    if url:
                        await self.process_input(url, "url")

                elif choice in ["f", "file"]:
                    file_path = self.cli.upload_file_gui()
                    if file_path:
                        await self.process_input(f"file://{file_path}", "file")

                elif choice in ["t", "chat", "text"]:
                    chat_input = self.cli.get_chat_input()
                    if chat_input:
                        await self.process_input(chat_input, "chat")

                elif choice in ["r", "req", "requirement", "requirements"]:
                    # NEW: Requirement Analysis workflow
                    await self.process_requirement_analysis()

                elif choice in ["h", "history"]:
                    self.cli.show_history()

                elif choice in ["c", "config", "configure"]:
                    # Show configuration menu - all settings managed by CLI interface
                    self.cli.show_configuration_menu()

                else:
                    self.cli.print_status(
                        "Invalid choice. Please select U, F, T, R, C, H, or Q.",
                        "warning",
                    )

                # 询问是否继续
                if self.cli.is_running and choice in [
                    "u",
                    "f",
                    "t",
                    "r",
                    "chat",
                    "text",
                    "req",
                    "requirement",
                    "requirements",
                ]:
                    if not self.cli.ask_continue():
                        self.cli.is_running = False
                        self.cli.print_status("Session ended by user", "info")

        except KeyboardInterrupt:
            print(f"\n{Colors.WARNING}⚠️  Process interrupted by user{Colors.ENDC}")
        except Exception as e:
            print(f"\n{Colors.FAIL}❌ Unexpected error: {str(e)}{Colors.ENDC}")
        finally:
            # 清理资源
            await self.cleanup_mcp_app()


async def main():
    """Entry point: run the interactive CLI session, then report and clean up.

    Interrupts and unexpected errors are reported rather than propagated.
    On the way out the total runtime is printed and every ``__pycache__``
    directory below the current working directory is removed on a
    best-effort basis.
    """
    # Local import: only the cache cleanup below needs it.
    import shutil

    start_time = time.time()

    try:
        # Create and run the CLI application
        app = CLIApp()
        await app.run_interactive_session()

    except KeyboardInterrupt:
        print(f"\n{Colors.WARNING}⚠️  Application interrupted by user{Colors.ENDC}")
    except Exception as e:
        print(f"\n{Colors.FAIL}❌ Application error: {str(e)}{Colors.ENDC}")
    finally:
        end_time = time.time()
        print(
            f"\n{Colors.BOLD}{Colors.CYAN}⏱️  Total runtime: {end_time - start_time:.2f} seconds{Colors.ENDC}"
        )

        # Clean up cache files. Done with the standard library instead of
        # shelling out to PowerShell / find, so it behaves the same on every
        # platform and does not depend on those tools being available.
        print(f"{Colors.YELLOW}🧹 Cleaning up cache files...{Colors.ENDC}")
        for dirpath, dirnames, _filenames in os.walk("."):
            if "__pycache__" in dirnames:
                # Best effort: failures to delete are ignored.
                shutil.rmtree(
                    os.path.join(dirpath, "__pycache__"), ignore_errors=True
                )
                # Prune in place so os.walk does not descend into the
                # directory that was just removed.
                dirnames.remove("__pycache__")

        print(
            f"{Colors.OKGREEN}✨ Goodbye! Thanks for using DeepCode CLI! ✨{Colors.ENDC}"
        )


# Script entry point: only when this file is executed directly (not imported),
# run the async main() to completion.
if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: cli/cli_interface.py
================================================
#!/usr/bin/env python3
"""
Enhanced CLI Interface Module for DeepCode
增强版CLI界面模块 - 专为DeepCode设计
"""

import os
import time
import platform
from typing import Optional


class Colors:
    """ANSI escape sequences used to style terminal output."""

    # Reset and text attributes
    ENDC = "\033[0m"
    BOLD = "\033[1m"
    UNDERLINE = "\033[4m"

    # Role-named codes (9x range)
    FAIL = "\033[91m"
    OKGREEN = "\033[92m"
    WARNING = "\033[93m"
    OKBLUE = "\033[94m"
    HEADER = "\033[95m"
    OKCYAN = "\033[96m"

    # Gradient colors (3x range, plus MAGENTA which shares HEADER's code)
    GREEN = "\033[32m"
    YELLOW = "\033[33m"
    BLUE = "\033[34m"
    PURPLE = "\033[35m"
    CYAN = "\033[36m"
    MAGENTA = "\033[95m"


class CLIInterface:
    """Enhanced CLI interface with modern styling for DeepCode"""

    def __init__(self):
        """Initialise session state, load segmentation settings and probe tkinter."""
        # Per-session state.
        self.uploaded_file = None
        self.is_running = True
        self.processing_history = []

        # Default configuration (matching UI: fast mode by default).
        self.enable_indexing = False

        # Segmentation settings come from the same source the UI uses.
        self._load_segmentation_config()

        # Record whether tkinter file dialogs can be used.
        self._init_tkinter()

    def _load_segmentation_config(self):
        """Populate the segmentation attributes from the shared configuration helper.

        Sets ``self.segmentation_enabled`` and ``self.segmentation_threshold``.
        If the helper cannot be imported or raises, a warning is printed and
        the defaults (enabled, 50000 characters) are used instead.
        """
        default_enabled = True
        default_threshold = 50000

        try:
            from utils.llm_utils import get_document_segmentation_config

            settings = get_document_segmentation_config()
            self.segmentation_enabled = settings.get("enabled", default_enabled)
            self.segmentation_threshold = settings.get(
                "size_threshold_chars", default_threshold
            )
        except Exception as err:
            print(f"⚠️ Warning: Failed to load segmentation config: {err}")
            # Any failure falls back to the built-in defaults.
            self.segmentation_enabled = default_enabled
            self.segmentation_threshold = default_threshold

    def _save_segmentation_config(self):
        """Write the current segmentation settings to ``mcp_agent.config.yaml``.

        The file is looked up in the parent of the directory that contains this
        module. ``self.segmentation_enabled`` and ``self.segmentation_threshold``
        are stored under the ``document_segmentation`` key; every other key read
        from the file is written back. A confirmation is printed on success and
        a warning on any failure; no exception is raised for I/O or YAML errors.
        """
        import yaml

        # The config file lives in the project root, one level above this
        # module's directory.
        module_dir = os.path.dirname(os.path.abspath(__file__))
        project_root = os.path.dirname(module_dir)
        config_path = os.path.join(project_root, "mcp_agent.config.yaml")

        try:
            # Read current config. safe_load returns None for an empty document,
            # so substitute an empty mapping instead of failing on the lookup.
            with open(config_path, "r", encoding="utf-8") as f:
                config = yaml.safe_load(f) or {}

            # A key that is present but empty ("document_segmentation:") loads
            # as None; replace anything that is not a mapping with a fresh one.
            section = config.get("document_segmentation")
            if not isinstance(section, dict):
                section = {}
                config["document_segmentation"] = section

            section["enabled"] = self.segmentation_enabled
            section["size_threshold_chars"] = self.segmentation_threshold

            # Write updated config. The file is regenerated from the parsed
            # data, so comments in the original YAML are not carried over.
            with open(config_path, "w", encoding="utf-8") as f:
                yaml.dump(config, f, default_flow_style=False, allow_unicode=True)

            print(
                f"{Colors.OKGREEN}✅ Document segmentation configuration updated{Colors.ENDC}"
            )

        except Exception as e:
            print(
                f"{Colors.WARNING}⚠️ Failed to update segmentation config: {str(e)}{Colors.ENDC}"
            )

    def _init_tkinter(self):
        """Probe whether tkinter can open a window and record the outcome.

        ``self.tkinter_available`` ends up False when importing tkinter or
        creating, hiding or destroying a throwaway root window raises.
        """
        # Assume file dialogs work until the probe below proves otherwise.
        self.tkinter_available = True
        try:
            import tkinter as tk

            # Importing is not enough: actually create and discard a window.
            probe_window = tk.Tk()
            probe_window.withdraw()
            probe_window.destroy()
        except Exception:
            self.tkinter_available = False

    def clear_screen(self):
        """Clear the terminal by running the platform's clear command."""
        if os.name == "nt":
            command = "cls"
        else:
            command = "clear"
        os.system(command)

    def print_logo(self):
        """Print the boxed DeepCode ASCII-art logo with two tagline rows."""
        # Each art row switches to its own colour and back to cyan before the
        # right border; the final line resets all styling with ENDC.
        logo = f"""
{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                                                                               ║
║  {Colors.BOLD}{Colors.MAGENTA}██████╗ ███████╗███████╗██████╗  ██████╗ ██████╗ ██████╗ ███████╗{Colors.CYAN}               ║
║  {Colors.BOLD}{Colors.PURPLE}██╔══██╗██╔════╝██╔════╝██╔══██╗██╔════╝██╔═══██╗██╔══██╗██╔════╝{Colors.CYAN}               ║
║  {Colors.BOLD}{Colors.BLUE}██║  ██║█████╗  █████╗  ██████╔╝██║     ██║   ██║██║  ██║█████╗  {Colors.CYAN}               ║
║  {Colors.BOLD}{Colors.OKBLUE}██║  ██║██╔══╝  ██╔══╝  ██╔═══╝ ██║     ██║   ██║██║  ██║██╔══╝  {Colors.CYAN}               ║
║  {Colors.BOLD}{Colors.OKCYAN}██████╔╝███████╗███████╗██║     ╚██████╗╚██████╔╝██████╔╝███████╗{Colors.CYAN}               ║
║  {Colors.BOLD}{Colors.GREEN}╚═════╝ ╚══════╝╚══════╝╚═╝      ╚═════╝ ╚═════╝ ╚═════╝ ╚══════╝{Colors.CYAN}               ║
║                                                                               ║
║  {Colors.BOLD}{Colors.GREEN}🧬 OPEN-SOURCE CODE AGENT • DATA INTELLIGENCE LAB @ HKU 🚀           {Colors.CYAN}║
║  {Colors.BOLD}{Colors.GREEN}⚡ REVOLUTIONIZING RESEARCH REPRODUCIBILITY ⚡                      {Colors.CYAN}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(logo)

    def print_welcome_banner(self):
        """Print the boxed welcome banner listing status, mission and core capabilities."""
        # The banner is one literal; the padding inside each row is hand-tuned
        # so the right border lines up, so edit the spacing with care.
        banner = f"""
{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                             WELCOME TO DEEPCODE CLI                          ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║  {Colors.YELLOW}Open-Source Code Agent | Data Intelligence Lab @ HKU | MIT License        {Colors.CYAN}║
║  {Colors.GREEN}Status: Ready | Engine: Multi-Agent Architecture Initialized               {Colors.CYAN}║
║  {Colors.PURPLE}Mission: Revolutionizing Research Reproducibility                         {Colors.CYAN}║
║                                                                               ║
║  {Colors.BOLD}{Colors.OKCYAN}💎 CORE CAPABILITIES:{Colors.ENDC}                                                      {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Automated Paper-to-Code Reproduction                                {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Collaborative Multi-Agent Architecture                             {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Intelligent Code Implementation & Validation                       {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Future Vision: One Sentence → Complete Codebase                   {Colors.CYAN}║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(banner)

    def print_separator(self, char="═", length=79, color=Colors.CYAN):
        """Print ``char`` repeated ``length`` times in ``color``, then reset styling."""
        rule = char * length
        print(f"{color}{rule}{Colors.ENDC}")

    def print_status(self, message: str, status_type: str = "info"):
        """Print a timestamped, bold status line prefixed with a coloured icon.

        ``status_type`` selects the icon; unknown values use the "info" icon.
        """
        icons = {
            "success": f"{Colors.OKGREEN}✅",
            "error": f"{Colors.FAIL}❌",
            "warning": f"{Colors.WARNING}⚠️ ",
            "info": f"{Colors.OKBLUE}ℹ️ ",
            "processing": f"{Colors.YELLOW}⏳",
            "upload": f"{Colors.PURPLE}📁",
            "download": f"{Colors.CYAN}📥",
            "analysis": f"{Colors.MAGENTA}🔍",
            "implementation": f"{Colors.GREEN}⚙️ ",
            "complete": f"{Colors.OKGREEN}🎉",
        }

        if status_type in icons:
            icon = icons[status_type]
        else:
            icon = icons["info"]

        clock = time.strftime("%H:%M:%S")
        stamp = f"[{Colors.BOLD}{clock}{Colors.ENDC}]"
        print(f"{stamp} {icon} {Colors.BOLD}{message}{Colors.ENDC}")

    def create_menu(self):
        """Create enhanced interactive menu"""
        # Display current configuration
        pipeline_mode = "🧠 COMPREHENSIVE" if self.enable_indexing else "⚡ OPTIMIZED"
        index_status = "✅ Enabled" if self.enable_indexing else "🔶 Disabled"
        segmentation_mode = (
            "📄 SMART" if self.segmentation_enabled else "📋 TRADITIONAL"
        )

        menu = f"""
{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                                MAIN MENU                                      ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║  {Colors.OKGREEN}🌐 [U] Process URL       {Colors.CYAN}│  {Colors.PURPLE}📁 [F] Upload File    {Colors.CYAN}│  {Colors.MAGENTA}💬 [T] Chat Input{Colors.CYAN}    ║
║  {Colors.BLUE}🧠 [R] Req. Analysis    {Colors.CYAN}│  {Colors.OKCYAN}⚙️  [C] Configure        {Colors.CYAN}│  {Colors.YELLOW}📊 [H] History{Colors.CYAN}    ║
║  {Colors.FAIL}❌ [Q] Quit{Colors.CYAN}                                                                 ║
║                                                                               ║
║  {Colors.BOLD}🤖 Current Pipeline Mode: {pipeline_mode}{Colors.CYAN}                          ║
║  {Colors.BOLD}🗂️  Codebase Indexing: {index_status}{Colors.CYAN}                                    ║
║  {Colors.BOLD}📄 Document Processing: {segmentation_mode}{Colors.CYAN}                               ║
║                                                                               ║
║  {Colors.YELLOW}📝 URL Processing:{Colors.CYAN}                                                         ║
║  {Colors.YELLOW}   ▶ Enter research paper URL (arXiv, IEEE, ACM, etc.)                    {Colors.CYAN}║
║  {Colors.YELLOW}   ▶ Supports direct PDF links and academic paper pages                   {Colors.CYAN}║
║                                                                               ║
║  {Colors.PURPLE}📁 File Processing:{Colors.CYAN}                                                        ║
║  {Colors.PURPLE}   ▶ Upload PDF, DOCX, PPTX, HTML, or TXT files                          {Colors.CYAN}║
║  {Colors.PURPLE}   ▶ Intelligent file format detection and processing                     {Colors.CYAN}║
║                                                                               ║
║  {Colors.MAGENTA}💬 Chat Input:{Colors.CYAN}                                                           ║
║  {Colors.MAGENTA}   ▶ Describe your coding requirements in natural language                {Colors.CYAN}║
║  {Colors.MAGENTA}   ▶ AI generates implementation plan and code automatically             {Colors.CYAN}║
║                                                                               ║
║  {Colors.BLUE}🧠 Requirement Analysis (NEW):{Colors.CYAN}                                             ║
║  {Colors.BLUE}   ▶ Get AI-guided questions to refine your requirements                   {Colors.CYAN}║
║  {Colors.BLUE}   ▶ Generate detailed requirement documents from your answers             {Colors.CYAN}║
║                                                                               ║
║  {Colors.OKCYAN}🔄 Processing Pipeline:{Colors.CYAN}                                                    ║
║  {Colors.OKCYAN}   ▶ Intelligent agent orchestration → Code synthesis                     {Colors.CYAN}║
║  {Colors.OKCYAN}   ▶ Multi-agent coordination with progress tracking                     {Colors.CYAN}║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(menu)

    def get_user_input(self):
        """Show the menu prompt and return the reply, stripped and lower-cased."""
        prompt = f"\n{Colors.BOLD}{Colors.OKCYAN}➤ Your choice: {Colors.ENDC}"
        print(prompt, end="")
        reply = input()
        return reply.strip().lower()

    def upload_file_gui(self) -> Optional[str]:
        """Ask the user for a file through a tkinter dialog, with a manual fallback.

        When ``self.tkinter_available`` is False, or when opening the dialog
        raises, the path is requested on the terminal through
        ``_get_manual_file_path`` instead.

        Returns:
            The chosen path, or ``None`` when nothing was selected.
        """
        if not self.tkinter_available:
            self.print_status(
                "GUI file dialog not available - using manual input", "warning"
            )
            return self._get_manual_file_path()

        # (label, extensions) pairs shared by every platform.
        extension_groups = [
            ("Research Papers", (".pdf", ".docx", ".doc")),
            ("PDF Files", (".pdf",)),
            ("Word Documents", (".docx", ".doc")),
            ("PowerPoint Files", (".pptx", ".ppt")),
            ("HTML Files", (".html", ".htm")),
            ("Text Files", (".txt", ".md")),
            ("All Files", (".*",)),
        ]

        if platform.system() == "Darwin":
            # macOS keeps the bare-extension form (".pdf .docx .doc").
            file_types = [
                (label, " ".join(extensions)) for label, extensions in extension_groups
            ]
        else:
            # Tk takes a whitespace-separated list of glob patterns. A
            # ";"-joined string is a single pattern that Tk's own (non-native)
            # dialog cannot match against any file name.
            file_types = [
                (label, " ".join(f"*{extension}" for extension in extensions))
                for label, extensions in extension_groups
            ]

        def select_file():
            try:
                import tkinter as tk
                from tkinter import filedialog

                root = tk.Tk()
                try:
                    root.withdraw()
                    root.attributes("-topmost", True)
                    return filedialog.askopenfilename(
                        title="Select Research File - DeepCode CLI",
                        filetypes=file_types,
                        initialdir=os.getcwd(),
                    )
                finally:
                    # Always release the hidden root window, including when
                    # the dialog itself raised.
                    root.destroy()

            except Exception as e:
                self.print_status(f"File dialog error: {str(e)}", "error")
                return self._get_manual_file_path()

        self.print_status("Opening file browser dialog...", "upload")
        file_path = select_file()

        # A cancelled dialog yields an empty value, which is reported as
        # "no selection" just like a declined manual prompt.
        if file_path:
            self.print_status(
                f"File selected: {os.path.basename(file_path)}", "success"
            )
            return file_path

        self.print_status("No file selected", "warning")
        return None

    def _get_manual_file_path(self) -> Optional[str]:
        """Prompt on the terminal until a usable file path is entered.

        The entered path has ``~`` expanded and is made absolute. A missing
        path asks whether to retry; a path that is not a regular file asks
        again; an unrecognised extension asks for confirmation.

        Returns:
            The absolute file path, or ``None`` when the user declines to retry
            after a missing path.
        """
        known_extensions = {
            ".pdf",
            ".docx",
            ".doc",
            ".pptx",
            ".ppt",
            ".html",
            ".htm",
            ".txt",
            ".md",
        }

        self.print_separator("─", 79, Colors.YELLOW)
        print(f"{Colors.BOLD}{Colors.YELLOW}📁 Manual File Path Input{Colors.ENDC}")
        print(
            f"{Colors.CYAN}Please enter the full path to your research paper file:{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}Supported formats: PDF, DOCX, PPTX, HTML, TXT, MD{Colors.ENDC}"
        )
        self.print_separator("─", 79, Colors.YELLOW)

        while True:
            print(f"\n{Colors.BOLD}{Colors.OKCYAN}📂 File path: {Colors.ENDC}", end="")
            entered = input().strip()

            if not entered:
                self.print_status(
                    "Empty path entered. Please try again or press Ctrl+C to cancel.",
                    "warning",
                )
                continue

            # Normalise: expand "~" first, then resolve against the cwd.
            file_path = os.path.abspath(os.path.expanduser(entered))

            if not os.path.exists(file_path):
                self.print_status(f"File not found: {file_path}", "error")
                answer = input(f"{Colors.YELLOW}Try again? (y/n): {Colors.ENDC}")
                if answer.strip().lower() == "y":
                    continue
                return None

            if not os.path.isfile(file_path):
                self.print_status(f"Path is not a file: {file_path}", "error")
                continue

            suffix = os.path.splitext(file_path)[1].lower()
            if suffix not in known_extensions:
                self.print_status(f"Unsupported file format: {suffix}", "warning")
                answer = input(f"{Colors.YELLOW}Process anyway? (y/n): {Colors.ENDC}")
                if answer.strip().lower() != "y":
                    continue

            self.print_status(
                f"File validated: {os.path.basename(file_path)}", "success"
            )
            return file_path

    def get_url_input(self) -> str:
        """Prompt on the terminal until an acceptable paper URL is entered.

        A URL must start with ``http://`` or ``https://``. URLs that neither
        contain a known academic domain nor end in ``.pdf`` need confirmation.

        Returns:
            The URL, or ``""`` when the user declines to retry after entering a
            URL with an unsupported scheme.
        """
        known_domains = [
            "arxiv.org",
            "ieeexplore.ieee.org",
            "dl.acm.org",
            "link.springer.com",
            "nature.com",
            "science.org",
            "scholar.google.com",
            "researchgate.net",
            "semanticscholar.org",
        ]

        self.print_separator("─", 79, Colors.GREEN)
        print(f"{Colors.BOLD}{Colors.GREEN}🌐 URL Input Interface{Colors.ENDC}")
        for hint in (
            "Enter a research paper URL from supported platforms:",
            "• arXiv (arxiv.org)        • IEEE Xplore (ieeexplore.ieee.org)",
            "• ACM Digital Library      • SpringerLink • Nature • Science",
            "• Direct PDF links         • Academic publisher websites",
        ):
            print(f"{Colors.CYAN}{hint}{Colors.ENDC}")
        self.print_separator("─", 79, Colors.GREEN)

        while True:
            print(f"\n{Colors.BOLD}{Colors.OKCYAN}🔗 URL: {Colors.ENDC}", end="")
            url = input().strip()

            if not url:
                self.print_status(
                    "Empty URL entered. Please try again or press Ctrl+C to cancel.",
                    "warning",
                )
                continue

            if not url.startswith(("http://", "https://")):
                self.print_status("URL must start with http:// or https://", "error")
                answer = input(f"{Colors.YELLOW}Try again? (y/n): {Colors.ENDC}")
                if answer.strip().lower() == "y":
                    continue
                return ""

            # Substring heuristic only: it decides whether to warn, nothing more.
            lowered = url.lower()
            looks_academic = any(domain in lowered for domain in known_domains)
            if not (looks_academic or lowered.endswith(".pdf")):
                self.print_status(
                    "URL doesn't appear to be from a known academic platform", "warning"
                )
                answer = input(f"{Colors.YELLOW}Process anyway? (y/n): {Colors.ENDC}")
                if answer.strip().lower() != "y":
                    continue

            self.print_status(f"URL validated: {url}", "success")
            return url

    def get_chat_input(self) -> str:
        """Collect a multi-line description of coding requirements from the terminal.

        Input ends after two consecutive blank lines. Text shorter than 20
        characters is rejected, and the user is shown a summary and preview to
        confirm. Retrying restarts the whole prompt.

        Returns:
            The stripped text, or ``""`` when input is cancelled with Ctrl+C
            while typing, left empty, too short without retry, or not confirmed.
        """
        self.print_separator("─", 79, Colors.PURPLE)
        print(f"{Colors.BOLD}{Colors.PURPLE}💬 Chat Input Interface{Colors.ENDC}")
        print(
            f"{Colors.CYAN}Describe your coding requirements in natural language.{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}Our AI will analyze your needs and generate a comprehensive implementation plan.{Colors.ENDC}"
        )
        self.print_separator("─", 79, Colors.PURPLE)

        # Example prompts, grouped under a coloured heading each.
        example_sections = (
            (
                "Academic Research:",
                (
                    "  • 'I need to implement a reinforcement learning algorithm for robotic control'",
                    "  • 'Create a neural network for image classification with attention mechanisms'",
                ),
            ),
            (
                "Engineering Projects:",
                (
                    "  • 'Develop a web application for project management with user authentication'",
                    "  • 'Create a data visualization dashboard for sales analytics'",
                ),
            ),
            (
                "Mixed Projects:",
                (
                    "  • 'Implement a machine learning model with a web interface for real-time predictions'",
                ),
            ),
        )
        print(f"\n{Colors.BOLD}{Colors.YELLOW}💡 Examples:{Colors.ENDC}")
        for heading, bullets in example_sections:
            print(f"{Colors.CYAN}{heading}{Colors.ENDC}")
            for bullet in bullets:
                print(bullet)

        self.print_separator("─", 79, Colors.PURPLE)

        print(
            f"\n{Colors.BOLD}{Colors.OKCYAN}✏️  Enter your coding requirements below:{Colors.ENDC}"
        )
        print(
            f"{Colors.YELLOW}(Type your description, press Enter twice when finished, or Ctrl+C to cancel){Colors.ENDC}"
        )

        collected = []
        blank_streak = 0

        while True:
            try:
                # "> " marks the first line, later lines are indented instead.
                marker = "  " if collected else "> "
                print(f"{Colors.BOLD}{marker}{Colors.ENDC}", end="")

                entry = input()

                if entry.strip():
                    blank_streak = 0
                    collected.append(entry)
                    continue

                blank_streak += 1
                if blank_streak >= 2:
                    # Two blank lines in a row end the input.
                    break
                collected.append("")  # a single blank line is kept for formatting

            except KeyboardInterrupt:
                print(f"\n{Colors.WARNING}Input cancelled by user{Colors.ENDC}")
                return ""

        # Merge the lines and drop surrounding whitespace.
        user_input = "\n".join(collected).strip()

        if not user_input:
            self.print_status("No input provided", "warning")
            return ""

        if len(user_input) < 20:
            self.print_status(
                "Input too short. Please provide more detailed requirements (at least 20 characters)",
                "warning",
            )
            answer = input(f"{Colors.YELLOW}Try again? (y/n): {Colors.ENDC}")
            if answer.strip().lower() != "y":
                return ""
            return self.get_chat_input()  # start over

        # Summary of what was entered.
        word_count = len(user_input.split())
        char_count = len(user_input)

        print(f"\n{Colors.BOLD}{Colors.GREEN}📋 Input Summary:{Colors.ENDC}")
        print(f"  • {Colors.CYAN}Word count: {word_count}{Colors.ENDC}")
        print(f"  • {Colors.CYAN}Character count: {char_count}{Colors.ENDC}")

        # Preview is capped at the first 200 characters.
        if len(user_input) > 200:
            preview = user_input[:200] + "..."
        else:
            preview = user_input
        print(f"\n{Colors.BOLD}{Colors.CYAN}📄 Preview:{Colors.ENDC}")
        print(f"{Colors.YELLOW}{preview}{Colors.ENDC}")

        # Ask for confirmation before handing the text back.
        confirmation = input(
            f"\n{Colors.BOLD}{Colors.OKCYAN}Proceed with this input? (y/n): {Colors.ENDC}"
        )
        if confirmation.strip().lower() != "y":
            answer = input(f"{Colors.YELLOW}Edit input? (y/n): {Colors.ENDC}")
            if answer.strip().lower() != "y":
                return ""
            return self.get_chat_input()  # start over

        self.print_status(
            f"Chat input captured: {word_count} words, {char_count} characters",
            "success",
        )
        return user_input

    def show_progress_bar(self, message: str, duration: float = 2.0):
        """Animate a 50-cell progress bar from 0% to 100% over ``duration`` seconds.

        Args:
            message: Heading printed above the bar and repeated in the
                completion line.
            duration: Total animation time in seconds. Negative values are
                treated as 0.
        """
        print(f"\n{Colors.BOLD}{Colors.CYAN}{message}{Colors.ENDC}")

        bar_length = 50
        # time.sleep rejects negative values, so clamp instead of crashing.
        step_delay = max(duration, 0.0) / bar_length

        for filled_cells in range(bar_length + 1):
            percent = (filled_cells / bar_length) * 100
            filled = "█" * filled_cells
            empty = "░" * (bar_length - filled_cells)

            print(
                f"\r{Colors.OKGREEN}[{filled}{empty}] {percent:3.0f}%{Colors.ENDC}",
                end="",
                flush=True,
            )
            # There are bar_length + 1 frames but only bar_length intervals
            # between them; pausing after the last frame would overshoot
            # ``duration`` and delay the completion line for no reason.
            if filled_cells < bar_length:
                time.sleep(step_delay)

        print(f"\n{Colors.OKGREEN}✓ {message} completed{Colors.ENDC}")

    def show_spinner(self, message: str, duration: float = 1.0):
        """Animate a spinner next to ``message`` for about ``duration`` seconds.

        The frame is redrawn every 0.1 seconds and replaced by a check mark
        once the time is up.
        """
        frames = "⠋⠙⠹⠸⠼⠴⠦⠧⠇⠏"
        deadline = time.time() + duration
        label = f"{Colors.BOLD}{Colors.CYAN}{message}... "

        print(f"{label}{Colors.ENDC}", end="", flush=True)

        tick = 0
        while time.time() < deadline:
            frame = frames[tick % len(frames)]
            # "\r" returns to the start of the line so each frame overwrites the last.
            print(
                f"\r{label}{Colors.YELLOW}{frame}{Colors.ENDC}",
                end="",
                flush=True,
            )
            time.sleep(0.1)
            tick += 1

        print(f"\r{label}{Colors.OKGREEN}✓{Colors.ENDC}")

    def display_processing_stages(
        self,
        current_stage: int = 0,
        enable_indexing: bool = True,
        chat_mode: bool = False,
    ):
        """Print the pipeline stage table with a status for every stage.

        ``chat_mode`` takes precedence over ``enable_indexing`` when choosing
        which stage list to show. Stages before ``current_stage`` are shown as
        completed, the stage at that index as in progress, later ones as pending.
        """
        # Opening stages shared by both paper-processing pipelines.
        paper_opening = [
            ("🚀", "Initialize", "Setting up AI engine"),
            ("📊", "Analyze", "Analyzing research content"),
            ("📥", "Download", "Processing document"),
            ("📋", "Plan", "Generating code architecture"),
        ]
        paper_closing = ("⚙️", "Implement", "Implementing code")

        if chat_mode:
            # Chat mode: shortened workflow driven by user requirements.
            pipeline_mode = "CHAT PLANNING"
            stages = [
                ("🚀", "Initialize", "Setting up chat engine"),
                ("💬", "Planning", "Analyzing requirements"),
                ("🏗️", "Setup", "Creating workspace"),
                ("📝", "Save Plan", "Saving implementation plan"),
                ("⚙️", "Implement", "Generating code"),
            ]
        elif enable_indexing:
            # Full pipeline, including the reference/repository/index stages.
            pipeline_mode = "COMPREHENSIVE"
            stages = paper_opening + [
                ("🔍", "References", "Analyzing references"),
                ("📦", "Repos", "Downloading repositories"),
                ("🗂️", "Index", "Building code index"),
                paper_closing,
            ]
        else:
            # Fast mode: indexing-related stages are left out.
            pipeline_mode = "OPTIMIZED"
            stages = paper_opening + [paper_closing]

        print(
            f"\n{Colors.BOLD}{Colors.CYAN}📋 {pipeline_mode} PIPELINE STATUS{Colors.ENDC}"
        )
        self.print_separator("─", 79, Colors.CYAN)

        completed = f"{Colors.OKGREEN}✓ COMPLETED{Colors.ENDC}"
        in_progress = f"{Colors.YELLOW}⏳ IN PROGRESS{Colors.ENDC}"
        pending = f"{Colors.CYAN}⏸️  PENDING{Colors.ENDC}"

        for position, (icon, name, desc) in enumerate(stages):
            if position == current_stage:
                status = in_progress
            elif position < current_stage:
                status = completed
            else:
                status = pending

            print(
                f"{icon} {Colors.BOLD}{name:<12}{Colors.ENDC} │ {desc:<25} │ {status}"
            )

        self.print_separator("─", 79, Colors.CYAN)

    def print_results_header(self):
        """Print the boxed "PROCESSING RESULTS" heading in bold green."""
        # Fixed three-line box; styling is reset by ENDC on the last line.
        header = f"""
{Colors.BOLD}{Colors.OKGREEN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                              PROCESSING RESULTS                              ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(header)

    def print_error_box(self, title: str, error_msg: str):
        """Print ``title`` and ``error_msg`` inside a red box, wrapped to fit.

        Args:
            title: Short label shown after "ERROR: " in the header; wrapped
                onto further header rows when it does not fit.
            error_msg: Message body. Runs of whitespace (including newlines)
                are collapsed to single spaces before wrapping; words longer
                than a row are split rather than overflowing the border.

        Alignment assumes every character occupies one terminal column.
        """
        import textwrap

        rule = "══════════════════════════════════════════════════════════════"
        # One space of padding on each side between the border and the text.
        text_width = len(rule) - 2

        heading_rows = textwrap.wrap(f"ERROR: {title}", width=text_width)
        body_rows = textwrap.wrap(" ".join(str(error_msg).split()), width=text_width)

        print(f"\n{Colors.FAIL}╔{rule}╗")
        for row in heading_rows:
            # Header and body rows use the same width, so the right border
            # lines up with the top and bottom edges.
            print(f"║ {Colors.BOLD}{row:<{text_width}}{Colors.FAIL} ║")
        print(f"╠{rule}╣")

        for row in body_rows:
            print(f"║ {row:<{text_width}} ║")

        print(f"╚{rule}╝{Colors.ENDC}")

    def cleanup_cache(self):
        """Delete Python bytecode caches below the current working directory.

        Removes every ``__pycache__`` directory and every ``*.pyc`` file found
        while walking the tree rooted at ``"."``. The work is done in-process,
        so it behaves the same on Windows and Unix. Items that cannot be
        removed are counted and reported in a warning; nothing is raised for
        them.
        """
        import shutil

        self.print_status("Cleaning up cache files...", "info")

        failures = 0
        for current_dir, dirnames, filenames in os.walk("."):
            if "__pycache__" in dirnames:
                # Prune the entry so the walk does not descend into a
                # directory that is about to disappear.
                dirnames.remove("__pycache__")
                cache_dir = os.path.join(current_dir, "__pycache__")
                # A symlink named __pycache__ is left alone; only real
                # directories are removed.
                if not os.path.islink(cache_dir):
                    try:
                        shutil.rmtree(cache_dir)
                    except OSError:
                        failures += 1

            for filename in filenames:
                if filename.endswith(".pyc"):
                    try:
                        os.remove(os.path.join(current_dir, filename))
                    except OSError:
                        failures += 1

        if failures:
            self.print_status(
                f"Cache cleanup failed: {failures} item(s) could not be removed",
                "warning",
            )
        else:
            self.print_status("Cache cleanup completed", "success")

    def print_goodbye(self):
        """Run the cache cleanup, then print the boxed goodbye banner."""
        # Clean up cache files before showing the banner. The banner's
        # "Cache files cleaned up" row is printed whatever the cleanup outcome.
        self.cleanup_cache()

        goodbye = f"""
{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                                GOODBYE                                        ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║  {Colors.OKGREEN}🎉 Thank you for using DeepCode CLI!                                     {Colors.CYAN}║
║                                                                               ║
║  {Colors.YELLOW}🧬 Join our community in revolutionizing research reproducibility         {Colors.CYAN}║
║  {Colors.PURPLE}⚡ Together, we're building the future of automated code generation       {Colors.CYAN}║
║                                                                               ║
║  {Colors.OKCYAN}💡 Questions? Contribute to our open-source mission at GitHub             {Colors.CYAN}║
║  {Colors.GREEN}🧹 Cache files cleaned up for optimal performance                         {Colors.CYAN}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(goodbye)

    def get_requirement_analysis_input(self) -> str:
        """Collect the user's initial idea for guided requirement analysis.

        Prints an introduction with examples, then reads free-form text line by
        line until two consecutive blank lines are entered. Text shorter than
        20 characters is rejected; longer text is summarised, previewed and must
        be confirmed before it is returned.

        The y/n prompts accept the same affirmative replies as ``ask_continue``
        ("y", "yes", "1", "true"), so that typing "yes" counts as consent.

        Returns:
            str: The stripped multi-line input, or "" when the user cancels
            with Ctrl+C during entry, enters nothing, or declines to
            retry/confirm.
        """
        affirmative = ("y", "yes", "1", "true")

        # Introduction
        self.print_separator("─", 79, Colors.BLUE)
        print(
            f"{Colors.BOLD}{Colors.BLUE}🧠 Requirement Analysis Interface{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}Describe your project idea or requirements briefly.{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}Our AI will generate guiding questions to help you refine your vision.{Colors.ENDC}"
        )
        self.print_separator("─", 79, Colors.BLUE)

        # Examples
        print(f"\n{Colors.BOLD}{Colors.YELLOW}💡 Examples:{Colors.ENDC}")
        print(
            f"{Colors.CYAN}  • 'I want to build a machine learning system for image recognition'{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}  • 'Create a web app for project management with real-time collaboration'{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}  • 'Develop a data analysis pipeline for financial forecasting'{Colors.ENDC}"
        )

        self.print_separator("─", 79, Colors.BLUE)

        print(
            f"\n{Colors.BOLD}{Colors.OKCYAN}✏️  Enter your initial requirements below:{Colors.ENDC}"
        )
        print(
            f"{Colors.YELLOW}(Type your description, press Enter twice when finished, or Ctrl+C to cancel){Colors.ENDC}"
        )

        collected = []
        blank_streak = 0

        try:
            while True:
                # "> " marks the first line, an indent marks continuation lines
                if collected:
                    print(f"{Colors.BOLD}  {Colors.ENDC}", end="")
                else:
                    print(f"{Colors.BOLD}> {Colors.ENDC}", end="")

                entered = input()

                if entered.strip():
                    blank_streak = 0
                    collected.append(entered)
                    continue

                # Two blank lines in a row terminate the input; a single blank
                # line is kept so paragraphs survive.
                blank_streak += 1
                if blank_streak >= 2:
                    break
                collected.append("")
        except KeyboardInterrupt:
            print(f"\n{Colors.WARNING}Input cancelled by user{Colors.ENDC}")
            return ""

        user_input = "\n".join(collected).strip()

        if not user_input:
            self.print_status("No input provided", "warning")
            return ""

        if len(user_input) < 20:
            self.print_status(
                "Input too short. Please provide more details (at least 20 characters)",
                "warning",
            )
            retry = (
                input(f"{Colors.YELLOW}Try again? (y/n): {Colors.ENDC}").strip().lower()
            )
            if retry in affirmative:
                return self.get_requirement_analysis_input()
            return ""

        # Input summary
        word_count = len(user_input.split())
        char_count = len(user_input)

        print(f"\n{Colors.BOLD}{Colors.GREEN}📋 Input Summary:{Colors.ENDC}")
        print(f"  • {Colors.CYAN}Word count: {word_count}{Colors.ENDC}")
        print(f"  • {Colors.CYAN}Character count: {char_count}{Colors.ENDC}")

        # Preview, truncated to the first 200 characters
        if char_count > 200:
            preview = user_input[:200] + "..."
        else:
            preview = user_input
        print(f"\n{Colors.BOLD}{Colors.CYAN}📄 Preview:{Colors.ENDC}")
        print(f"{Colors.YELLOW}{preview}{Colors.ENDC}")

        # Confirmation
        confirm = (
            input(
                f"\n{Colors.BOLD}{Colors.OKCYAN}Proceed with this input? (y/n): {Colors.ENDC}"
            )
            .strip()
            .lower()
        )
        if confirm not in affirmative:
            retry = (
                input(f"{Colors.YELLOW}Edit input? (y/n): {Colors.ENDC}")
                .strip()
                .lower()
            )
            if retry in affirmative:
                return self.get_requirement_analysis_input()
            return ""

        self.print_status(
            f"Requirement input captured: {word_count} words, {char_count} characters",
            "success",
        )
        return user_input

    def display_guiding_questions(self, questions_json: str):
        """Print the AI-generated guiding questions as a numbered list.

        Args:
            questions_json: JSON text that decodes to an iterable of questions.
                If it cannot be decoded, an error status is shown and the raw
                text is printed instead.
        """
        import json

        try:
            parsed = json.loads(questions_json)
        except json.JSONDecodeError:
            self.print_status("Failed to parse questions", "error")
            print(questions_json)
            return

        self.print_separator("═", 79, Colors.GREEN)
        print(
            f"\n{Colors.BOLD}{Colors.GREEN}🤖 AI-Generated Guiding Questions{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}Please answer these questions to help refine your requirements:{Colors.ENDC}\n"
        )
        self.print_separator("─", 79, Colors.GREEN)

        # Questions are numbered starting at 1
        number = 0
        for item in parsed:
            number += 1
            print(
                f"\n{Colors.BOLD}{Colors.YELLOW}Question {number}:{Colors.ENDC} {Colors.CYAN}{item}{Colors.ENDC}"
            )

        self.print_separator("═", 79, Colors.GREEN)

    def get_question_answers(self, questions_json: str) -> dict:
        """Prompt for one answer per guiding question.

        Args:
            questions_json: JSON text that decodes to an iterable of questions.

        Returns:
            dict: Answers keyed "question_1", "question_2", ... in question
            order (blank answers are stored as ""), or an empty dict when the
            JSON cannot be decoded.
        """
        import json

        try:
            parsed = json.loads(questions_json)
        except json.JSONDecodeError:
            self.print_status("Failed to parse questions", "error")
            return {}

        collected = {}

        print(
            f"\n{Colors.BOLD}{Colors.BLUE}📝 Answer the following questions:{Colors.ENDC}"
        )
        print(
            f"{Colors.CYAN}(Type your answer and press Enter for each question){Colors.ENDC}\n"
        )

        for number, prompt_text in enumerate(parsed, start=1):
            print(
                f"\n{Colors.BOLD}{Colors.YELLOW}Q{number}:{Colors.ENDC} {Colors.CYAN}{prompt_text}{Colors.ENDC}"
            )
            print(f"{Colors.BOLD}{Colors.OKCYAN}Your answer:{Colors.ENDC} ", end="")

            reply = input().strip()
            collected[f"question_{number}"] = reply

            # Report whether something was actually entered
            if not reply:
                self.print_status(f"Answer {number} left blank", "warning")
            else:
                self.print_status(f"Answer {number} recorded", "success")

        return collected

    def display_requirement_summary(self, summary: str) -> bool:
        """Show the generated requirement document and ask whether to implement it.

        Args:
            summary: The requirement document text to print.

        Returns:
            bool: True when the user answers affirmatively. The accepted
            replies match ``ask_continue`` ("y", "yes", "1", "true",
            case-insensitive), so typing "yes" is not mistaken for a refusal.
        """
        self.print_separator("═", 79, Colors.GREEN)
        print(
            f"\n{Colors.BOLD}{Colors.GREEN}📄 Generated Requirement Document{Colors.ENDC}\n"
        )
        self.print_separator("─", 79, Colors.GREEN)

        print(f"{Colors.CYAN}{summary}{Colors.ENDC}")

        self.print_separator("═", 79, Colors.GREEN)

        # Ask if user wants to proceed with implementation
        proceed = (
            input(
                f"\n{Colors.BOLD}{Colors.YELLOW}Would you like to proceed with code implementation based on these requirements? (y/n):{Colors.ENDC} "
            )
            .strip()
            .lower()
        )

        return proceed in ("y", "yes", "1", "true")

    def ask_continue(self) -> bool:
        """Prompt whether another paper should be processed.

        Returns:
            bool: True when the trimmed, lower-cased reply is one of
            "y", "yes", "1" or "true"; False for anything else.
        """
        self.print_separator("─", 79, Colors.YELLOW)
        print(f"\n{Colors.BOLD}{Colors.YELLOW}🔄 Process another paper?{Colors.ENDC}")
        reply = input(f"{Colors.OKCYAN}Continue? (y/n): {Colors.ENDC}")
        normalized = reply.strip().lower()
        return normalized in ("y", "yes", "1", "true")

    def add_to_history(self, input_source: str, result: dict):
        """Append a record of one processing run to ``self.processing_history``.

        Args:
            input_source: The source that was processed.
            result: Result mapping; its "status" value is copied into the
                record ("unknown" when the key is absent) and the mapping
                itself is stored under "result".
        """
        recorded_at = time.strftime("%Y-%m-%d %H:%M:%S")
        outcome = result.get("status", "unknown")
        self.processing_history.append(
            {
                "timestamp": recorded_at,
                "input_source": input_source,
                "status": outcome,
                "result": result,
            }
        )

    def show_history(self):
        """Print one line per entry of ``self.processing_history``.

        Each line shows the entry number, a success/failure icon, the
        timestamp and the input source (shortened to 50 characters). When the
        history is empty only an informational status message is shown.
        """
        records = self.processing_history
        if not records:
            self.print_status("No processing history available", "info")
            return

        print(f"\n{Colors.BOLD}{Colors.CYAN}📚 PROCESSING HISTORY{Colors.ENDC}")
        self.print_separator("─", 79, Colors.CYAN)

        for position, record in enumerate(records, start=1):
            if record["status"] == "success":
                icon = "✅"
            else:
                icon = "❌"

            # Keep long sources on one line: 47 characters plus an ellipsis
            label = record["input_source"]
            if len(label) > 50:
                label = label[:47] + "..."

            print(f"{position}. {icon} {record['timestamp']} | {label}")

        self.print_separator("─", 79, Colors.CYAN)

    def show_configuration_menu(self):
        """Show configuration options menu"""
        self.clear_screen()

        # Get segmentation config status
        segmentation_enabled = getattr(self, "segmentation_enabled", True)
        segmentation_threshold = getattr(self, "segmentation_threshold", 50000)

        print(f"""
{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                           CONFIGURATION MENU                                  ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║                                                                               ║
║  {Colors.BOLD}🤖 Agent Orchestration Engine Configuration{Colors.CYAN}                             ║
║                                                                               ║
║  {Colors.OKCYAN}[1] Pipeline Mode:{Colors.CYAN}                                                        ║
║      {Colors.BOLD}🧠 Comprehensive Mode{Colors.CYAN} - Full intelligence analysis (Default)         ║
║         ✓ Research Analysis + Resource Processing                            ║
║         ✓ Reference Intelligence Discovery                                   ║
║         ✓ Automated Repository Acquisition                                   ║
║         ✓ Codebase Intelligence Orchestration                               ║
║         ✓ Intelligent Code Implementation Synthesis                         ║
║                                                                               ║
║      {Colors.BOLD}⚡ Optimized Mode{Colors.CYAN} - Fast processing (Skip indexing)                    ║
║         ✓ Research Analysis + Resource Processing                            ║
║         ✓ Code Architecture Synthesis                                        ║
║         ✓ Intelligent Code Implementation Synthesis                         ║
║         ✗ Reference Intelligence Discovery (Skipped)                        ║
║         ✗ Repository Acquisition (Skipped)                                   ║
║         ✗ Codebase Intelligence Orchestration (Skipped)                     ║
║                                                                               ║
║  {Colors.OKCYAN}[2] Document Processing:{Colors.CYAN}                                                   ║
║      {Colors.BOLD}📄 Smart Segmentation{Colors.CYAN} - Intelligent document analysis (Default)      ║
║         ✓ Semantic boundary detection                                        ║
║         ✓ Algorithm integrity preservation                                   ║
║         ✓ Formula chain recognition                                          ║
║         ✓ Adaptive character limits                                          ║
║                                                                               ║
║      {Colors.BOLD}📋 Traditional Processing{Colors.CYAN} - Full document reading                       ║
║         ✓ Complete document analysis                                         ║
║         ✗ Smart segmentation (Disabled)                                      ║
║                                                                               ║
║  {Colors.YELLOW}Current Settings:{Colors.CYAN}                                                         ║
║    Pipeline: {'🧠 Comprehensive Mode' if self.enable_indexing else '⚡ Optimized Mode'}                                          ║
║    Document: {'📄 Smart Segmentation' if segmentation_enabled else '📋 Traditional Processing'}                                ║
║    Threshold: {segmentation_threshold} characters                                    ║
║                                                                               ║
║  {Colors.OKGREEN}[T] Toggle Pipeline    {Colors.BLUE}[S] Toggle Segmentation    {Colors.FAIL}[B] Back{Colors.CYAN}     ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
""")

        while True:
            print(
                f"\n{Colors.BOLD}{Colors.OKCYAN}➤ Configuration choice: {Colors.ENDC}",
                end="",
            )
            choice = input().strip().lower()

            if choice in ["t", "toggle"]:
                self.enable_indexing = not self.enable_indexing
                mode = "🧠 Comprehensive" if self.enable_indexing else "⚡ Optimized"
                self.print_status(f"Pipeline mode switched to: {mode}", "success")
                time.sleep(1)
                self.show_configuration_menu()
                return

            elif choice in ["s", "segmentation"]:
                current_state = getattr(self, "segmentation_enabled", True)
                self.segmentation_enabled = not current_state
                # Save the configuration to file
                self._save_segmentation_config()
                seg_mode = (
                    "📄 Smart Segmentation"
                    if self.segmentation_enabled
                    else "📋 Traditional Processing"
                )
                self.print_status(
                    f"Document processing switched to: {seg_mode}", "success"
                )
                time.sleep(1)
                self.show_configuration_menu()
                return

            elif choice in ["b", "back"]:
                return

            else:
                self.print_status(
                    "Invalid choice. Please enter 'T', 'S', or 'B'.", "warning"
                )


================================================
FILE: cli/cli_launcher.py
================================================
#!/usr/bin/env python3
"""
DeepCode - CLI Research Engine Launcher
DeepCode - CLI研究引擎启动器

🧬 Open-Source Code Agent by Data Intelligence Lab @ HKU (CLI Edition)
⚡ Revolutionizing research reproducibility through collaborative AI via command line
"""

import sys
from pathlib import Path


def _module_available(module_name):
    """Return True when *module_name* can be located, False otherwise.

    ``importlib.util.find_spec`` imports the parent package of a dotted name,
    so a missing or broken parent raises (e.g. ``ModuleNotFoundError``)
    instead of returning ``None``. Such failures mean "not available" here.
    """
    import importlib.util

    try:
        return importlib.util.find_spec(module_name) is not None
    except (ImportError, AttributeError, ValueError):
        return False


def check_dependencies():
    """Check whether the modules needed by the CLI can be located.

    Prints a status line per check. As a side effect the project root (the
    parent of this file's directory) is put on ``sys.path`` so that the
    ``workflows`` and ``cli`` packages can be found.

    Returns:
        bool: True when every required dependency was found, False when at
        least one is missing (the missing ones are listed on stdout).
    """
    print("🔍 Checking CLI dependencies...")

    missing_deps = []

    # Check asyncio availability
    if _module_available("asyncio"):
        print("✅ Asyncio is available")
    else:
        missing_deps.append("asyncio")

    # Check PyYAML availability
    if _module_available("yaml"):
        print("✅ PyYAML is installed")
    else:
        missing_deps.append("pyyaml")

    # Check Tkinter availability (optional: only used for file dialogs)
    if _module_available("tkinter"):
        print("✅ Tkinter is available (for file dialogs)")
    else:
        print("⚠️  Tkinter not available - file dialogs will use manual input")

    # Check for MCP agent dependencies
    if _module_available("mcp_agent.app"):
        print("✅ MCP Agent framework is available")
    else:
        missing_deps.append("mcp-agent")

    # Check for workflow dependencies.
    # Add the project root to the import path first.
    current_dir = Path(__file__).parent
    project_root = current_dir.parent
    if str(project_root) not in sys.path:
        sys.path.insert(0, str(project_root))

    if _module_available("workflows.agent_orchestration_engine"):
        print("✅ Workflow modules are available")
    else:
        print("⚠️  Workflow modules may not be properly configured")

    # Check for CLI components
    if _module_available("cli.cli_app"):
        print("✅ CLI application components are available")
    else:
        print("❌ CLI application components missing")
        missing_deps.append("cli-components")

    if missing_deps:
        print("\n❌ Missing dependencies:")
        for dep in missing_deps:
            print(f"   - {dep}")

        # "cli-components" is part of this repository, not a pip package
        pip_packages = [dep for dep in missing_deps if dep != "cli-components"]
        if pip_packages:
            print("\nPlease install missing dependencies using:")
            print(f"pip install {' '.join(pip_packages)}")
        if "cli-components" in missing_deps:
            print(
                "CLI components appear to be missing - please check the cli/ directory"
            )
        return False

    print("✅ All CLI dependencies satisfied")
    return True


def print_banner():
    """Display the CLI startup banner.

    Borders and empty rows are generated from a single inner width so that
    every row of the box closes at the same column.
    """
    inner_width = 62
    top_border = f"╔{'═' * inner_width}╗"
    bottom_border = f"╚{'═' * inner_width}╝"
    empty_row = f"║{' ' * inner_width}║"

    rows = [
        "",  # leading blank line before the box
        top_border,
        empty_row,
        "║    🧬 DeepCode - Open-Source Code Agent                      ║",
        empty_row,
        "║    ⚡ DATA INTELLIGENCE LAB @ HKU ⚡                        ║",
        empty_row,
        empty_row,
        empty_row,
        bottom_border,
        "",  # the banner text ends with a newline
    ]
    print("\n".join(rows))


def main():
    """Launcher entry point: verify prerequisites, then run the CLI app.

    Prints the banner, exits with status 1 when dependencies are missing or
    ``cli_app.py`` is not next to this file, and otherwise runs the CLI
    application's async ``main`` with ``asyncio.run``. Ctrl+C ends the session
    with a goodbye message; import failures and other errors exit with
    status 1.
    """
    print_banner()

    # Check dependencies
    dependencies_ok = check_dependencies()
    if not dependencies_ok:
        print("\n🚨 Please install missing dependencies and try again.")
        sys.exit(1)

    # Locate this script's directory and the application file beside it
    launcher_dir = Path(__file__).parent
    repo_root = launcher_dir.parent
    app_script = launcher_dir / "cli_app.py"

    # Check that cli_app.py exists
    if not app_script.exists():
        print(f"❌ CLI application file not found: {app_script}")
        print("Please ensure the cli/cli_app.py file exists.")
        sys.exit(1)

    for message in (
        f"\n📁 CLI App location: {app_script}",
        "🖥️  Starting DeepCode CLI interface...",
        "🚀 Initializing command line application",
        "=" * 70,
        "💡 Tip: Follow the interactive prompts to process your research",
        "🛑 Press Ctrl+C to exit at any time",
        "=" * 70,
    ):
        print(message)

    # Launch the CLI application
    try:
        # The project root must be importable for `cli.cli_app` to resolve
        root_entry = str(repo_root)
        if root_entry not in sys.path:
            sys.path.insert(0, root_entry)
        from cli.cli_app import main as cli_main

        print("\n🎯 Launching CLI application...")

        # Run the async main function
        import asyncio

        asyncio.run(cli_main())

    except KeyboardInterrupt:
        print("\n\n🛑 DeepCode CLI stopped by user")
        print("Thank you for using DeepCode CLI! 🧬")
    except ImportError as exc:
        print(f"\n❌ Failed to import CLI application: {exc}")
        print("Please check if all modules are properly installed.")
        sys.exit(1)
    except Exception as exc:
        print(f"\n❌ Unexpected error: {exc}")
        print("Please check your Python environment and try again.")
        sys.exit(1)


# Run the launcher only when this file is executed as a script, not on import
if __name__ == "__main__":
    main()


================================================
FILE: cli/main_cli.py
================================================
#!/usr/bin/env python3
"""
DeepCode CLI - Open-Source Code Agent
深度代码CLI - 开源代码智能体

🧬 Data Intelligence Lab @ HKU
⚡ Revolutionizing Research Reproducibility through Multi-Agent Architecture
"""

import os
import sys
import asyncio
import argparse

# Disable .pyc generation. The environment variable is only read when an
# interpreter starts, so on its own it only affects child processes;
# sys.dont_write_bytecode is what stops the already-running interpreter.
os.environ["PYTHONDONTWRITEBYTECODE"] = "1"
sys.dont_write_bytecode = True

# Add the project root to the import path
current_dir = os.path.dirname(os.path.abspath(__file__))
parent_dir = os.path.dirname(current_dir)
if parent_dir not in sys.path:
    sys.path.insert(0, parent_dir)

# 导入CLI应用
from cli.cli_app import CLIApp, Colors


def print_enhanced_banner():
    """Print the colourised startup banner with the project's key features."""
    print(f"""
{Colors.CYAN}╔══════════════════════════════════════════════════════════════════════════════╗
║                                                                              ║
║    {Colors.BOLD}{Colors.MAGENTA}🧬 DeepCode - Open-Source Code Agent{Colors.CYAN}                              ║
║                                                                              ║
║    {Colors.BOLD}{Colors.YELLOW}⚡ DATA INTELLIGENCE LAB @ HKU ⚡{Colors.CYAN}                                ║
║                                                                              ║
║    Revolutionizing research reproducibility through collaborative AI         ║
║    Building the future where code is reproduced from natural language       ║
║                                                                              ║
║    {Colors.BOLD}{Colors.GREEN}🤖 Key Features:{Colors.CYAN}                                                    ║
║    • Automated paper-to-code reproduction                                   ║
║    • Multi-agent collaborative architecture                                 ║
║    • Open-source and extensible design                                      ║
║    • Join our growing research community                                    ║
║                                                                              ║
╚══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
""")


def check_environment():
    """Check the runtime environment before starting the CLI.

    Verifies that the interpreter is Python 3.8 or newer and that the
    ``asyncio``, ``pathlib`` and ``typing`` modules can be imported, printing
    a status line for each check.

    Returns:
        bool: True when every check passed, False otherwise.
    """
    print(f"{Colors.CYAN}🔍 Checking environment...{Colors.ENDC}")

    # Python version gate
    version_ok = not (sys.version_info < (3, 8))
    if not version_ok:
        print(
            f"{Colors.FAIL}❌ Python 3.8+ required. Current: {sys.version}{Colors.ENDC}"
        )
        return False

    print(f"{Colors.OKGREEN}✅ Python {sys.version.split()[0]} - OK{Colors.ENDC}")

    # Required modules, each with the label used in the status line
    required = (
        ("asyncio", "Async IO support"),
        ("pathlib", "Path handling"),
        ("typing", "Type hints"),
    )

    unavailable = []
    for module_name, label in required:
        try:
            __import__(module_name)
        except ImportError:
            unavailable.append(module_name)
            print(f"{Colors.FAIL}❌ {label} - Missing{Colors.ENDC}")
        else:
            print(f"{Colors.OKGREEN}✅ {label} - OK{Colors.ENDC}")

    if unavailable:
        print(
            f"{Colors.FAIL}❌ Missing required modules: {', '.join(unavailable)}{Colors.ENDC}"
        )
        return False

    print(f"{Colors.OKGREEN}✅ Environment check passed{Colors.ENDC}")
    return True


def parse_arguments(argv=None):
    """Parse the command-line arguments of the DeepCode CLI.

    Args:
        argv: Optional list of argument strings to parse. When omitted (or
            None) ``argparse`` reads ``sys.argv[1:]``, which is the behaviour
            existing callers rely on; passing a list allows the parser to be
            driven programmatically.

    Returns:
        argparse.Namespace: with ``file``, ``url``, ``chat``, ``requirement``
        (strings or None), ``optimized``, ``disable_segmentation``,
        ``verbose`` (booleans) and ``segmentation_threshold`` (int,
        default 50000).
    """
    parser = argparse.ArgumentParser(
        description="DeepCode CLI - Open-Source Code Agent by Data Intelligence Lab @ HKU",
        formatter_class=argparse.RawDescriptionHelpFormatter,
        epilog=f"""
{Colors.BOLD}Examples:{Colors.ENDC}
  {Colors.CYAN}python main_cli.py{Colors.ENDC}                                      # Interactive mode
  {Colors.CYAN}python main_cli.py --file paper.pdf{Colors.ENDC}                       # Process file directly
  {Colors.CYAN}python main_cli.py --url https://...{Colors.ENDC}                      # Process URL directly
  {Colors.CYAN}python main_cli.py --chat "Build a web app..."{Colors.ENDC}            # Process chat requirements
  {Colors.CYAN}python main_cli.py --requirement "ML system for..."{Colors.ENDC}       # Guided requirement analysis (NEW)
  {Colors.CYAN}python main_cli.py --optimized{Colors.ENDC}                            # Use optimized mode
  {Colors.CYAN}python main_cli.py --disable-segmentation{Colors.ENDC}                 # Disable document segmentation
  {Colors.CYAN}python main_cli.py --segmentation-threshold 30000{Colors.ENDC}         # Custom segmentation threshold

{Colors.BOLD}Pipeline Modes:{Colors.ENDC}
  {Colors.GREEN}Comprehensive{Colors.ENDC}:          Full intelligence analysis with indexing
  {Colors.YELLOW}Optimized{Colors.ENDC}:              Fast processing without indexing
  {Colors.BLUE}Requirement Analysis{Colors.ENDC}:   Guided Q&A to refine requirements (NEW)

{Colors.BOLD}Document Processing:{Colors.ENDC}
  {Colors.BLUE}Smart Segmentation{Colors.ENDC}: Intelligent document segmentation for large papers
  {Colors.MAGENTA}Supported Formats{Colors.ENDC}: PDF, DOCX, DOC, PPT, PPTX, XLS, XLSX, HTML, TXT, MD
        """,
    )

    # Input sources (the first one supplied selects direct processing mode)
    parser.add_argument(
        "--file", "-f", type=str, help="Process a specific file (PDF, DOCX, TXT, etc.)"
    )

    parser.add_argument(
        "--url", "-u", type=str, help="Process a research paper from URL"
    )

    parser.add_argument(
        "--chat",
        "-t",
        type=str,
        help="Process coding requirements via chat input (provide requirements as argument)",
    )

    parser.add_argument(
        "--requirement",
        "-r",
        type=str,
        help="Process requirements via guided analysis (provide initial idea as argument)",
    )

    # Pipeline and document-processing options
    parser.add_argument(
        "--optimized",
        "-o",
        action="store_true",
        help="Use optimized mode (skip indexing for faster processing)",
    )

    parser.add_argument(
        "--disable-segmentation",
        action="store_true",
        help="Disable intelligent document segmentation (use traditional full-document processing)",
    )

    parser.add_argument(
        "--segmentation-threshold",
        type=int,
        default=50000,
        help="Document size threshold (characters) to trigger segmentation (default: 50000)",
    )

    parser.add_argument(
        "--verbose", "-v", action="store_true", help="Enable verbose output"
    )

    # argv=None makes argparse fall back to sys.argv[1:]
    return parser.parse_args(argv)


async def run_direct_processing(app: CLIApp, input_source: str, input_type: str):
    """Process a single input without the interactive menu.

    Initialises the MCP application, runs ``app.process_input`` and reports
    the outcome. ``app.cleanup_mcp_app()`` is awaited in every case.

    Args:
        app: The CLI application to drive.
        input_source: The file URL, web URL or chat text to process.
        input_type: Label passed through to ``app.process_input``.

    Returns:
        bool: True when processing reported status "success", False when
        initialisation or processing failed or an exception was raised.
    """
    try:
        print(
            f"\n{Colors.BOLD}{Colors.CYAN}🚀 Starting direct processing mode...{Colors.ENDC}"
        )
        print(f"{Colors.CYAN}Input: {input_source}{Colors.ENDC}")
        print(f"{Colors.CYAN}Type: {input_type}{Colors.ENDC}")
        print(
            f"{Colors.CYAN}Mode: {'🧠 Comprehensive' if app.cli.enable_indexing else '⚡ Optimized'}{Colors.ENDC}"
        )

        # Initialise the application
        startup = await app.initialize_mcp_app()
        if startup["status"] != "success":
            print(
                f"{Colors.FAIL}❌ Initialization failed: {startup['message']}{Colors.ENDC}"
            )
            return False

        # Process the input
        outcome = await app.process_input(input_source, input_type)

        if outcome["status"] != "success":
            print(
                f"\n{Colors.BOLD}{Colors.FAIL}❌ Processing failed: {outcome.get('error', 'Unknown error')}{Colors.ENDC}"
            )
            return False

        print(
            f"\n{Colors.BOLD}{Colors.OKGREEN}🎉 Processing completed successfully!{Colors.ENDC}"
        )
        return True

    except Exception as exc:
        print(f"\n{Colors.FAIL}❌ Direct processing error: {str(exc)}{Colors.ENDC}")
        return False
    finally:
        await app.cleanup_mcp_app()


async def run_requirement_analysis(app: CLIApp, initial_idea: str):
    """Run the requirement analysis workflow without the interactive menu.

    Initialises the MCP application, runs
    ``app.process_requirement_analysis_non_interactive`` and reports the
    outcome. ``app.cleanup_mcp_app()`` is awaited in every case.

    Args:
        app: The CLI application to drive.
        initial_idea: The user's initial project idea.

    Returns:
        bool: True when the analysis reported status "success", False when
        initialisation or the analysis failed or an exception was raised.
    """
    try:
        print(
            f"\n{Colors.BOLD}{Colors.BLUE}🧠 Starting requirement analysis mode...{Colors.ENDC}"
        )
        print(f"{Colors.CYAN}Initial Idea: {initial_idea}{Colors.ENDC}")

        # Initialise the application
        startup = await app.initialize_mcp_app()
        if startup["status"] != "success":
            print(
                f"{Colors.FAIL}❌ Initialization failed: {startup['message']}{Colors.ENDC}"
            )
            return False

        # Run the requirement analysis workflow
        outcome = await app.process_requirement_analysis_non_interactive(initial_idea)

        if outcome["status"] != "success":
            print(
                f"\n{Colors.BOLD}{Colors.FAIL}❌ Requirement analysis failed: {outcome.get('error', 'Unknown error')}{Colors.ENDC}"
            )
            return False

        print(
            f"\n{Colors.BOLD}{Colors.OKGREEN}🎉 Requirement analysis completed successfully!{Colors.ENDC}"
        )
        return True

    except Exception as exc:
        print(f"\n{Colors.FAIL}❌ Requirement analysis error: {str(exc)}{Colors.ENDC}")
        return False
    finally:
        await app.cleanup_mcp_app()


async def main():
    """Entry point of the DeepCode CLI.

    Parses the arguments, prints the banner and checks the environment (exit
    status 1 on failure). It then configures the application: indexing is
    always disabled, and the segmentation settings are taken from the
    arguments and saved. If ``--file``, ``--url``, ``--chat`` or
    ``--requirement`` was given, that input is processed directly and the
    process exits with 0 on success or 1 on failure; otherwise the
    interactive session is started.
    """
    # Parse command-line arguments
    args = parse_arguments()

    # Show the banner
    print_enhanced_banner()

    # Check the environment
    if not check_environment():
        print(
            f"\n{Colors.FAIL}🚨 Environment check failed. Please fix the issues and try again.{Colors.ENDC}"
        )
        sys.exit(1)

    try:
        # Create the CLI application
        app = CLIApp()

        # Indexing is disabled in both cases to speed up processing; only the
        # message depends on whether --optimized was passed.
        app.cli.enable_indexing = False
        if args.optimized:
            print(
                f"\n{Colors.YELLOW}⚡ Optimized mode enabled - indexing disabled{Colors.ENDC}"
            )
        else:
            print(
                f"\n{Colors.YELLOW}⚡ Fast mode enabled - indexing disabled by default{Colors.ENDC}"
            )

        # Configure document segmentation settings
        segmentation_off = bool(getattr(args, "disable_segmentation", False))
        if segmentation_off:
            print(
                f"\n{Colors.MAGENTA}📄 Document segmentation disabled - using traditional processing{Colors.ENDC}"
            )
        else:
            print(
                f"\n{Colors.BLUE}📄 Smart document segmentation enabled (threshold: {args.segmentation_threshold} chars){Colors.ENDC}"
            )
        app.cli.segmentation_enabled = not segmentation_off
        app.cli.segmentation_threshold = args.segmentation_threshold
        app.cli._save_segmentation_config()

        # Without a direct input, fall back to the interactive session
        if not (args.file or args.url or args.chat or args.requirement):
            print(f"\n{Colors.CYAN}🎮 Starting interactive mode...{Colors.ENDC}")
            await app.run_interactive_session()
            return

        # Direct processing mode: the first supplied input wins
        if args.file:
            # Verify the file exists
            if not os.path.exists(args.file):
                print(f"{Colors.FAIL}❌ File not found: {args.file}{Colors.ENDC}")
                sys.exit(1)
            # Use the file:// prefix, as interactive mode does, so the file
            # is copied rather than moved
            file_url = f"file://{os.path.abspath(args.file)}"
            success = await run_direct_processing(app, file_url, "file")
        elif args.url:
            success = await run_direct_processing(app, args.url, "url")
        elif args.chat:
            # Validate the chat input length
            if len(args.chat.strip()) < 20:
                print(
                    f"{Colors.FAIL}❌ Chat input too short. Please provide more detailed requirements (at least 20 characters){Colors.ENDC}"
                )
                sys.exit(1)
            success = await run_direct_processing(app, args.chat, "chat")
        else:
            # Only --requirement remains: requirement analysis mode.
            # Validate the requirement input length
            if len(args.requirement.strip()) < 10:
                print(
                    f"{Colors.FAIL}❌ Requirement input too short. Please provide more details (at least 10 characters){Colors.ENDC}"
                )
                sys.exit(1)
            success = await run_requirement_analysis(app, args.requirement)

        sys.exit(0 if success else 1)

    except KeyboardInterrupt:
        print(f"\n{Colors.WARNING}⚠️  Application interrupted by user{Colors.ENDC}")
        sys.exit(1)
    except Exception as exc:
        print(f"\n{Colors.FAIL}❌ Application errors: {str(exc)}{Colors.ENDC}")
        sys.exit(1)


# Start the async entry point only when this file is executed as a script
if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: cli/workflows/__init__.py
================================================
"""
CLI-specific Workflow Adapters
CLI专用工作流适配器

This module provides CLI-optimized versions of workflow components that are
specifically adapted for command-line interface usage patterns.
"""

from .cli_workflow_adapter import CLIWorkflowAdapter

__all__ = ["CLIWorkflowAdapter"]


================================================
FILE: cli/workflows/cli_workflow_adapter.py
================================================
"""
CLI Workflow Adapter for Agent Orchestration Engine
CLI工作流适配器 - 智能体编排引擎

This adapter provides CLI-optimized interface to the latest agent orchestration engine,
with enhanced progress reporting, error handling, and CLI-specific optimizations.

Version: 2.1 (Updated to match UI version - Added Requirement Analysis)
Changes:
- Default enable_indexing=False for faster processing (matching UI defaults)
- Mode-aware progress callback with detailed stage mapping
- Chat pipeline now accepts enable_indexing parameter
- Improved error handling and resource management
- Enhanced progress display for different modes (fast/comprehensive/chat)
- NEW: Added requirement analysis workflow support
"""

import os
from typing import Callable, Dict, Any
from mcp_agent.app import MCPApp


class CLIWorkflowAdapter:
    """
    CLI-facing adapter around the agent orchestration engine.

    The adapter owns the lifecycle of one ``MCPApp`` (start-up and tear-down),
    forwards work to the pipelines in ``workflows.agent_orchestration_engine``
    and reports progress through an optional CLI interface object.

    The CLI interface, when given, is expected to provide ``show_spinner``,
    ``print_status`` and ``display_processing_stages``; every call to it is
    guarded, so the adapter also works without one (``cli_interface=None``).
    """

    # (inclusive upper progress bound, stage index) pairs, checked in order.
    # A progress value above the last bound maps to the matching final stage.
    # Full workflow: Initialize -> Analyze -> Download -> Plan -> References
    # -> Repos -> Index -> Implement -> Complete.
    _FULL_STAGE_BOUNDS = (
        (5, 0),
        (10, 1),
        (25, 2),
        (40, 3),
        (50, 4),
        (60, 5),
        (70, 6),
        (85, 7),
    )
    _FULL_FINAL_STAGE = 8
    # Fast workflow skips References/Repos/Index: everything past "Plan" is
    # shown as stage 4.
    _FAST_STAGE_BOUNDS = ((5, 0), (10, 1), (25, 2), (40, 3))
    _FAST_FINAL_STAGE = 4
    # Chat workflow: Initialize -> Planning -> Setup -> Save Plan -> Implement.
    _CHAT_STAGE_BOUNDS = ((5, 0), (30, 1), (50, 2), (70, 3))
    _CHAT_FINAL_STAGE = 4

    def __init__(self, cli_interface=None):
        """
        Initialize CLI workflow adapter.

        Args:
            cli_interface: CLI interface instance for progress reporting
        """
        self.cli_interface = cli_interface
        self.app = None
        # Entered async context of ``self.app.run()``; None while no MCP
        # application is running.
        self.app_context = None
        self.logger = None
        self.context = None

    @staticmethod
    def _stage_for_progress(progress, bounds, final_stage):
        """Return the stage index for ``progress`` using ``bounds``, or ``final_stage`` when it exceeds every bound."""
        for upper_bound, stage in bounds:
            if progress <= upper_bound:
                return stage
        return final_stage

    async def initialize_mcp_app(self) -> Dict[str, Any]:
        """
        Start the MCP application and capture its logger and context.

        Returns:
            dict: ``{"status": "success", "message": ...}`` on success, or
            ``{"status": "error", "message": ...}`` when any step raised.
        """
        try:
            if self.cli_interface:
                self.cli_interface.show_spinner(
                    "🚀 Initializing Agent Orchestration Engine", 2.0
                )

            # Enter the app's async context manually; cleanup_mcp_app() exits it.
            self.app = MCPApp(name="cli_agent_orchestration")
            app_context = self.app.run()
            agent_app = await app_context.__aenter__()
            # Remember the context only once it has actually been entered, so
            # cleanup never exits a context that was never started.
            self.app_context = app_context

            self.logger = agent_app.logger
            self.context = agent_app.context

            # Give the "filesystem" MCP server the current working directory
            # as an additional argument.
            self.context.config.mcp.servers["filesystem"].args.extend([os.getcwd()])

            if self.cli_interface:
                self.cli_interface.print_status(
                    "🧠 Agent Orchestration Engine initialized successfully", "success"
                )

            return {
                "status": "success",
                "message": "MCP application initialized successfully",
            }

        except Exception as e:
            error_msg = f"Failed to initialize MCP application: {str(e)}"
            if self.cli_interface:
                self.cli_interface.print_status(error_msg, "error")
            return {"status": "error", "message": error_msg}

    async def cleanup_mcp_app(self):
        """
        Exit the MCP application context, if one is active.

        Safe to call repeatedly and before initialization: the stored context
        is cleared before it is exited, so it is exited at most once. Errors
        raised while exiting are reported as a warning and not propagated.
        """
        # getattr keeps this working for instances created without __init__.
        app_context = getattr(self, "app_context", None)
        if app_context is None:
            return

        # Clear first so that a failing or repeated cleanup cannot exit the
        # same context a second time.
        self.app_context = None
        try:
            await app_context.__aexit__(None, None, None)
            if self.cli_interface:
                self.cli_interface.print_status(
                    "🧹 Resources cleaned up successfully", "info"
                )
        except Exception as e:
            if self.cli_interface:
                self.cli_interface.print_status(
                    f"⚠️ Cleanup warning: {str(e)}", "warning"
                )

    def create_cli_progress_callback(self, enable_indexing: bool = True) -> Callable:
        """
        Build a progress callback that maps a progress value to a CLI stage.

        Args:
            enable_indexing: Selects the stage table. True uses the full
                workflow (stages 0-8); False uses the fast workflow, where
                every progress value above 40 is shown as stage 4.

        Returns:
            Callable: ``callback(progress, message)``. It is a no-op when the
            adapter has no CLI interface at call time.
        """
        if enable_indexing:
            bounds = self._FULL_STAGE_BOUNDS
            final_stage = self._FULL_FINAL_STAGE
        else:
            bounds = self._FAST_STAGE_BOUNDS
            final_stage = self._FAST_FINAL_STAGE

        def progress_callback(progress: int, message: str):
            if not self.cli_interface:
                return

            stage = self._stage_for_progress(progress, bounds, final_stage)
            self.cli_interface.display_processing_stages(stage, enable_indexing)
            self.cli_interface.print_status(message, "processing")

        return progress_callback

    async def execute_full_pipeline(
        self, input_source: str, enable_indexing: bool = False
    ) -> Dict[str, Any]:
        """
        Run the multi-agent research pipeline for a file or URL input.

        Args:
            input_source: Research input source (file path, URL, or preprocessed analysis)
            enable_indexing: Whether to run the comprehensive (indexing) mode (default: False)

        Returns:
            dict: ``{"status": "success", "result": ..., "pipeline_mode": ...}``
            or ``{"status": "error", "error": ..., "pipeline_mode": ...}``.
            ``pipeline_mode`` is "comprehensive" with indexing, else "optimized".
        """
        pipeline_mode = "comprehensive" if enable_indexing else "optimized"

        try:
            # Imported lazily so an import failure is reported as a pipeline error.
            from workflows.agent_orchestration_engine import (
                execute_multi_agent_research_pipeline,
            )

            progress_callback = self.create_cli_progress_callback(enable_indexing)

            if self.cli_interface:
                if enable_indexing:
                    mode_msg = "🧠 comprehensive (with indexing)"
                else:
                    mode_msg = "⚡ fast (indexing disabled)"
                self.cli_interface.print_status(
                    f"🚀 Starting {mode_msg} agent orchestration pipeline...",
                    "processing",
                )
                self.cli_interface.display_processing_stages(0, enable_indexing)

            result = await execute_multi_agent_research_pipeline(
                input_source=input_source,
                logger=self.logger,
                progress_callback=progress_callback,
                enable_indexing=enable_indexing,
            )

            if self.cli_interface:
                final_stage = (
                    self._FULL_FINAL_STAGE
                    if enable_indexing
                    else self._FAST_FINAL_STAGE
                )
                self.cli_interface.display_processing_stages(
                    final_stage, enable_indexing
                )
                self.cli_interface.print_status(
                    "🎉 Agent orchestration pipeline completed successfully!",
                    "complete",
                )

            return {
                "status": "success",
                "result": result,
                "pipeline_mode": pipeline_mode,
            }

        except Exception as e:
            error_msg = f"Pipeline execution failed: {str(e)}"
            if self.cli_interface:
                self.cli_interface.print_status(error_msg, "error")

            return {
                "status": "error",
                "error": error_msg,
                "pipeline_mode": pipeline_mode,
            }

    async def execute_requirement_analysis_workflow(
        self, user_input: str, analysis_mode: str, user_answers: Dict[str, str] = None
    ) -> Dict[str, Any]:
        """
        Run the requirement analysis workflow and report its outcome.

        Args:
            user_input: User's initial requirements or description
            analysis_mode: Analysis mode ("generate_questions" or "summarize_requirements")
            user_answers: Dictionary of user answers to guiding questions (for summarize mode)

        Returns:
            The value returned by the underlying workflow, unchanged, or
            ``{"status": "error", "error": ...}`` when the workflow raised.
        """
        try:
            # Imported lazily so an import failure is reported as a workflow error.
            from workflows.agent_orchestration_engine import (
                execute_requirement_analysis_workflow,
            )

            def analysis_progress_callback(progress: int, message: str):
                if self.cli_interface:
                    self.cli_interface.print_status(message, "processing")

            generating_questions = analysis_mode == "generate_questions"

            if self.cli_interface:
                if generating_questions:
                    self.cli_interface.print_status(
                        "🤖 Generating guiding questions for your requirements...",
                        "processing",
                    )
                else:
                    self.cli_interface.print_status(
                        "📄 Analyzing and summarizing your detailed requirements...",
                        "processing",
                    )

            result = await execute_requirement_analysis_workflow(
                user_input=user_input,
                analysis_mode=analysis_mode,
                user_answers=user_answers,
                logger=self.logger,
                progress_callback=analysis_progress_callback,
            )

            if self.cli_interface:
                # Read the outcome defensively: reporting must not turn a
                # returned result into an error just because a CLI interface
                # is attached and the result lacks a "status" key.
                result_is_dict = isinstance(result, dict)
                status = result.get("status") if result_is_dict else None
                if status == "success":
                    if generating_questions:
                        self.cli_interface.print_status(
                            "✅ Guiding questions generated successfully!", "success"
                        )
                    else:
                        self.cli_interface.print_status(
                            "✅ Requirements analysis completed successfully!",
                            "success",
                        )
                else:
                    error_detail = (
                        result.get("error", "Unknown error")
                        if result_is_dict
                        else "Unknown error"
                    )
                    self.cli_interface.print_status(
                        f"❌ Analysis failed: {error_detail}",
                        "error",
                    )

            return result

        except Exception as e:
            error_msg = f"Requirement analysis workflow failed: {str(e)}"
            if self.cli_interface:
                self.cli_interface.print_status(error_msg, "error")

            return {"status": "error", "error": error_msg}

    async def execute_chat_pipeline(
        self, user_input: str, enable_indexing: bool = False
    ) -> Dict[str, Any]:
        """
        Run the chat-based planning and implementation pipeline.

        Args:
            user_input: User's coding requirements and description
            enable_indexing: Forwarded to the pipeline unchanged (default: False)

        Returns:
            dict: ``{"status": "success", "result": ..., "pipeline_mode": "chat"}``
            or ``{"status": "error", "error": ..., "pipeline_mode": "chat"}``.
        """
        try:
            # Imported lazily so an import failure is reported as a pipeline error.
            from workflows.agent_orchestration_engine import (
                execute_chat_based_planning_pipeline,
            )

            def chat_progress_callback(progress: int, message: str):
                if not self.cli_interface:
                    return

                stage = self._stage_for_progress(
                    progress, self._CHAT_STAGE_BOUNDS, self._CHAT_FINAL_STAGE
                )
                self.cli_interface.display_processing_stages(stage, chat_mode=True)
                self.cli_interface.print_status(message, "processing")

            if self.cli_interface:
                indexing_note = (
                    " (with indexing)" if enable_indexing else " (fast mode)"
                )
                self.cli_interface.print_status(
                    f"🚀 Starting chat-based planning pipeline{indexing_note}...",
                    "processing",
                )
                self.cli_interface.display_processing_stages(0, chat_mode=True)

            result = await execute_chat_based_planning_pipeline(
                user_input=user_input,
                logger=self.logger,
                progress_callback=chat_progress_callback,
                enable_indexing=enable_indexing,
            )

            if self.cli_interface:
                self.cli_interface.display_processing_stages(
                    self._CHAT_FINAL_STAGE, chat_mode=True
                )
                self.cli_interface.print_status(
                    "🎉 Chat-based planning pipeline completed successfully!",
                    "complete",
                )

            return {"status": "success", "result": result, "pipeline_mode": "chat"}

        except Exception as e:
            error_msg = f"Chat pipeline execution failed: {str(e)}"
            if self.cli_interface:
                self.cli_interface.print_status(error_msg, "error")

            return {"status": "error", "error": error_msg, "pipeline_mode": "chat"}

    async def process_input_with_orchestration(
        self, input_source: str, input_type: str, enable_indexing: bool = False
    ) -> Dict[str, Any]:
        """
        Initialize the MCP app, run the pipeline for the input, then clean up.

        Args:
            input_source: Input source (file path, URL, or chat input)
            input_type: Type of input ('file', 'url', or 'chat')
            enable_indexing: Forwarded to the selected pipeline (default: False)

        Returns:
            dict: On a completed run, a dict with "status", "analysis_result",
            "download_result", "repo_result", "pipeline_mode" and "error".
            When initialization fails, the initialization result is returned
            as-is (it carries "status" and "message").
        """
        try:
            init_result = await self.initialize_mcp_app()
            if init_result["status"] != "success":
                return init_result

            # Turn file:// URLs into plain paths. Chat input is free text and
            # must reach the chat pipeline untouched, even when it happens to
            # start with "file://".
            if input_type != "chat" and input_source.startswith("file://"):
                file_path = input_source[7:]
                # On Windows "file:///C:/x" leaves "/C:/x"; drop the leading slashes.
                if os.name == "nt" and file_path.startswith("/"):
                    file_path = file_path.lstrip("/")
                input_source = file_path

            if input_type == "chat":
                pipeline_result = await self.execute_chat_pipeline(
                    input_source, enable_indexing=enable_indexing
                )
            else:
                pipeline_result = await self.execute_full_pipeline(
                    input_source, enable_indexing=enable_indexing
                )

            return {
                "status": pipeline_result["status"],
                "analysis_result": "Integrated into agent orchestration pipeline",
                "download_result": "Integrated into agent orchestration pipeline",
                "repo_result": pipeline_result.get("result", ""),
                "pipeline_mode": pipeline_result.get("pipeline_mode", "comprehensive"),
                "error": pipeline_result.get("error"),
            }

        except Exception as e:
            error_msg = f"Error during orchestrated processing: {str(e)}"
            if self.cli_interface:
                self.cli_interface.print_status(error_msg, "error")

            return {
                "status": "error",
                "error": error_msg,
                "analysis_result": "",
                "download_result": "",
                "repo_result": "",
                "pipeline_mode": "comprehensive" if enable_indexing else "optimized",
            }

        finally:
            # Always release the MCP application, on success, error or early return.
            await self.cleanup_mcp_app()


================================================
FILE: config/mcp_tool_definitions.py
================================================
"""
MCP工具定义配置模块
MCP Tool Definitions Configuration Module

将工具定义从主程序逻辑中分离，提供标准化的工具定义格式
Separate tool definitions from main program logic, providing standardized tool definition format

支持的工具类型：
- 文件操作工具 (File Operations)
- 代码执行工具 (Code Execution)
- 搜索工具 (Search Tools)
- 项目结构工具 (Project Structure Tools)
"""

from typing import Dict, List, Any


class MCPToolDefinitions:
    """Registry of MCP tool definitions, exposed as static builder methods."""

    @staticmethod
    def _prop(kind: str, description: str, **extra: Any) -> Dict[str, Any]:
        """Build one schema property: type, description, then any extra keys in the order given."""
        return {"type": kind, "description": description, **extra}

    @staticmethod
    def _tool(
        name: str,
        description: str,
        properties: Dict[str, Any],
        required: List[str] = None,
    ) -> Dict[str, Any]:
        """Build a tool definition; the "required" key is emitted only when a list is given."""
        schema: Dict[str, Any] = {"type": "object", "properties": properties}
        if required is not None:
            schema["required"] = required
        return {"name": name, "description": description, "input_schema": schema}

    @staticmethod
    def get_code_implementation_tools() -> List[Dict[str, Any]]:
        """
        Get tool definitions for code implementation.

        Only the write_file tool is enabled at the moment.
        """
        # Builders that exist on this class but are left out of the set:
        #   _get_read_file_tool, _get_read_multiple_files_tool,
        #   _get_read_code_mem_tool, _get_write_multiple_files_tool,
        #   _get_execute_python_tool, _get_execute_bash_tool
        enabled_builders = (MCPToolDefinitions._get_write_file_tool,)
        return [build() for build in enabled_builders]

    @staticmethod
    def _get_read_file_tool() -> Dict[str, Any]:
        """Definition of the read_file tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "read_file",
            "Read file content, supports specifying line number range",
            {
                "file_path": prop("string", "File path, relative to workspace"),
                "start_line": prop(
                    "integer", "Start line number (starting from 1, optional)"
                ),
                "end_line": prop(
                    "integer", "End line number (starting from 1, optional)"
                ),
            },
            ["file_path"],
        )

    @staticmethod
    def _get_read_multiple_files_tool() -> Dict[str, Any]:
        """Definition of the read_multiple_files (batch read) tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "read_multiple_files",
            "Read multiple files in a single operation (for batch reading)",
            {
                "file_requests": prop(
                    "string",
                    'JSON string with file requests, e.g., \'{"file1.py": {}, "file2.py": {"start_line": 1, "end_line": 10}}\' or simple array \'["file1.py", "file2.py"]\'',
                ),
                "max_files": prop(
                    "integer",
                    "Maximum number of files to read in one operation",
                    default=5,
                    minimum=1,
                    maximum=10,
                ),
            },
            ["file_requests"],
        )

    @staticmethod
    def _get_read_code_mem_tool() -> Dict[str, Any]:
        """Definition of the read_code_mem tool (reads from implement_code_summary.md)."""
        # Written out literally: "items" sits between "type" and "description".
        file_paths = {
            "type": "array",
            "items": {"type": "string"},
            "description": "List of file paths to check for summary information in implement_code_summary.md",
        }
        return MCPToolDefinitions._tool(
            "read_code_mem",
            "Check if file summaries exist in implement_code_summary.md for multiple files in a single call. Returns summaries for all requested files if available.",
            {"file_paths": file_paths},
            ["file_paths"],
        )

    @staticmethod
    def _get_write_file_tool() -> Dict[str, Any]:
        """Definition of the write_file tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "write_file",
            "Write content to file",
            {
                "file_path": prop("string", "File path, relative to workspace"),
                "content": prop("string", "Content to write to file"),
                "create_dirs": prop(
                    "boolean",
                    "Whether to create directories if they don't exist",
                    default=True,
                ),
                "create_backup": prop(
                    "boolean",
                    "Whether to create backup file if file already exists",
                    default=False,
                ),
            },
            ["file_path", "content"],
        )

    @staticmethod
    def _get_write_multiple_files_tool() -> Dict[str, Any]:
        """Definition of the write_multiple_files (batch write) tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "write_multiple_files",
            "Write multiple files in a single operation (for batch implementation)",
            {
                "file_implementations": prop(
                    "string",
                    'JSON string mapping file paths to content, e.g., \'{"file1.py": "content1", "file2.py": "content2"}\'',
                ),
                "create_dirs": prop(
                    "boolean",
                    "Whether to create directories if they don't exist",
                    default=True,
                ),
                "create_backup": prop(
                    "boolean",
                    "Whether to create backup files if they already exist",
                    default=False,
                ),
                "max_files": prop(
                    "integer",
                    "Maximum number of files to write in one operation",
                    default=5,
                    minimum=1,
                    maximum=10,
                ),
            },
            ["file_implementations"],
        )

    @staticmethod
    def _get_execute_python_tool() -> Dict[str, Any]:
        """Definition of the execute_python tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "execute_python",
            "Execute Python code and return output",
            {
                "code": prop("string", "Python code to execute"),
                "timeout": prop("integer", "Timeout in seconds", default=30),
            },
            ["code"],
        )

    @staticmethod
    def _get_execute_bash_tool() -> Dict[str, Any]:
        """Definition of the execute_bash tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "execute_bash",
            "Execute bash command",
            {
                "command": prop("string", "Bash command to execute"),
                "timeout": prop("integer", "Timeout in seconds", default=30),
            },
            ["command"],
        )

    @staticmethod
    def _get_file_structure_tool() -> Dict[str, Any]:
        """Definition of the get_file_structure tool (it declares no required fields)."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "get_file_structure",
            "Get directory file structure",
            {
                "directory": prop(
                    "string", "Directory path, relative to workspace", default="."
                ),
                "max_depth": prop("integer", "Maximum traversal depth", default=5),
            },
        )

    @staticmethod
    def _get_search_code_references_tool() -> Dict[str, Any]:
        """Definition of the unified search_code_references tool (three former steps merged into one)."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "search_code_references",
            "UNIFIED TOOL: Search relevant reference code from index files. Combines directory setup, index loading, and searching in a single call.",
            {
                "indexes_path": prop(
                    "string",
                    "Path to the indexes directory containing JSON index files",
                ),
                "target_file": prop("string", "Target file path to be implemented"),
                "keywords": prop(
                    "string", "Search keywords, comma-separated", default=""
                ),
                "max_results": prop(
                    "integer", "Maximum number of results to return", default=10
                ),
            },
            ["indexes_path", "target_file"],
        )

    @staticmethod
    def _get_get_indexes_overview_tool() -> Dict[str, Any]:
        """Definition of the get_indexes_overview tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "get_indexes_overview",
            "Get overview of all available reference code index information from specified directory",
            {
                "indexes_path": prop(
                    "string",
                    "Path to the indexes directory containing JSON index files",
                )
            },
            ["indexes_path"],
        )

    @staticmethod
    def _get_set_workspace_tool() -> Dict[str, Any]:
        """Definition of the set_workspace tool."""
        prop = MCPToolDefinitions._prop
        return MCPToolDefinitions._tool(
            "set_workspace",
            "Set the workspace directory for file operations",
            {"workspace_path": prop("string", "Directory path for the workspace")},
            ["workspace_path"],
        )

    # NOTE: a former set_indexes_directory tool definition was deprecated in
    # favour of the unified search_code_references tool and is no longer
    # defined here.

    @staticmethod
    def get_available_tool_sets() -> Dict[str, str]:
        """
        Get available tool sets.

        Returns:
            Mapping of tool set name to its human-readable description.
        """
        # More tool sets (e.g. "data_analysis", "web_scraping") can be added here.
        available = {
            "code_implementation": "代码实现相关工具集 / Code implementation tool set",
        }
        return available

    @staticmethod
    def get_tool_set(tool_set_name: str) -> List[Dict[str, Any]]:
        """
        Get a specific tool set by name.

        Returns:
            The tool definitions of the named set, or an empty list when the
            name is unknown.
        """
        builders = {
            "code_implementation": MCPToolDefinitions.get_code_implementation_tools,
        }
        builder = builders.get(tool_set_name)
        if builder is None:
            return []
        return builder()

    @staticmethod
    def get_all_tools() -> List[Dict[str, Any]]:
        """
        Get all available tools.

        Returns:
            The tools of every available tool set, concatenated in set order.
        """
        return [
            tool
            for set_name in MCPToolDefinitions.get_available_tool_sets()
            for tool in MCPToolDefinitions.get_tool_set(set_name)
        ]


# Convenience accessor
def get_mcp_tools(tool_set: str = "code_implementation") -> List[Dict[str, Any]]:
    """
    Convenience function: get the MCP tool definitions of one tool set.

    Args:
        tool_set: Name of the tool set (default: "code_implementation")

    Returns:
        Whatever ``MCPToolDefinitions.get_tool_set`` returns for that name.
    """
    definitions = MCPToolDefinitions.get_tool_set(tool_set)
    return definitions


================================================
FILE: config/mcp_tool_definitions_index.py
================================================
"""
MCP工具定义配置模块
MCP Tool Definitions Configuration Module

将工具定义从主程序逻辑中分离，提供标准化的工具定义格式
Separate tool definitions from main program logic, providing standardized tool definition format

支持的工具类型：
- 文件操作工具 (File Operations)
- 代码执行工具 (Code Execution)
- 搜索工具 (Search Tools)
- 项目结构工具 (Project Structure Tools)
"""

from typing import Dict, List, Any


class MCPToolDefinitions:
    """
    Registry of MCP tool definitions.

    Every ``_get_*_tool`` static method returns one tool definition: a dict
    with a ``name``, a ``description`` and a JSON-Schema style
    ``input_schema``. The public methods group those definitions into named
    tool sets.
    """

    @staticmethod
    def get_code_implementation_tools() -> List[Dict[str, Any]]:
        """
        Return the tool definitions of the code implementation tool set.

        Only the uncommented entries are part of the set; the commented
        entries are definitions that exist in this class but are currently
        not exposed.
        """
        return [
            # MCPToolDefinitions._get_read_file_tool(),
            # MCPToolDefinitions._get_read_multiple_files_tool(),
            # MCPToolDefinitions._get_read_code_mem_tool(),
            MCPToolDefinitions._get_write_file_tool(),
            # MCPToolDefinitions._get_write_multiple_files_tool(),
            # MCPToolDefinitions._get_execute_python_tool(),
            # MCPToolDefinitions._get_execute_bash_tool(),
            MCPToolDefinitions._get_search_code_references_tool(),
            # MCPToolDefinitions._get_search_code_tool(),
            # MCPToolDefinitions._get_file_structure_tool(),
            # MCPToolDefinitions._get_set_workspace_tool(),
            # MCPToolDefinitions._get_operation_history_tool(),
        ]

    @staticmethod
    def get_code_evaluation_tools() -> List[Dict[str, Any]]:
        """Return the tool definitions of the code evaluation tool set."""
        return [
            MCPToolDefinitions._get_analyze_repo_structure_tool(),
            MCPToolDefinitions._get_detect_dependencies_tool(),
            MCPToolDefinitions._get_assess_code_quality_tool(),
            MCPToolDefinitions._get_evaluate_documentation_tool(),
            MCPToolDefinitions._get_check_reproduction_readiness_tool(),
            MCPToolDefinitions._get_generate_evaluation_summary_tool(),
            MCPToolDefinitions._get_detect_empty_files_tool(),
            MCPToolDefinitions._get_detect_missing_files_tool(),
            MCPToolDefinitions._get_generate_code_revision_report_tool(),
        ]

    @staticmethod
    def _get_read_file_tool() -> Dict[str, Any]:
        """Definition of the ``read_file`` tool (optional line range)."""
        return {
            "name": "read_file",
            "description": "Read file content, supports specifying line number range",
            "input_schema": {
                "type": "object",
                "properties": {
                    "file_path": {
                        "type": "string",
                        "description": "File path, relative to workspace",
                    },
                    "start_line": {
                        "type": "integer",
                        "description": "Start line number (starting from 1, optional)",
                    },
                    "end_line": {
                        "type": "integer",
                        "description": "End line number (starting from 1, optional)",
                    },
                },
                "required": ["file_path"],
            },
        }

    @staticmethod
    def _get_read_multiple_files_tool() -> Dict[str, Any]:
        """Definition of the ``read_multiple_files`` batch-read tool."""
        return {
            "name": "read_multiple_files",
            "description": "Read multiple files in a single operation (for batch reading)",
            "input_schema": {
                "type": "object",
                "properties": {
                    "file_requests": {
                        "type": "string",
                        "description": 'JSON string with file requests, e.g., \'{"file1.py": {}, "file2.py": {"start_line": 1, "end_line": 10}}\' or simple array \'["file1.py", "file2.py"]\'',
                    },
                    "max_files": {
                        "type": "integer",
                        "description": "Maximum number of files to read in one operation",
                        "default": 5,
                        "minimum": 1,
                        "maximum": 10,
                    },
                },
                "required": ["file_requests"],
            },
        }

    @staticmethod
    def _get_read_code_mem_tool() -> Dict[str, Any]:
        """Definition of the ``read_code_mem`` tool (summaries from implement_code_summary.md)."""
        return {
            "name": "read_code_mem",
            "description": "Check if file summaries exist in implement_code_summary.md for multiple files in a single call. Returns summaries for all requested files if available.",
            "input_schema": {
                "type": "object",
                "properties": {
                    "file_paths": {
                        "type": "array",
                        "items": {"type": "string"},
                        "description": "List of file paths to check for summary information in implement_code_summary.md",
                    }
                },
                "required": ["file_paths"],
            },
        }

    @staticmethod
    def _get_write_file_tool() -> Dict[str, Any]:
        """Definition of the ``write_file`` tool."""
        return {
            "name": "write_file",
            "description": "Write content to file",
            "input_schema": {
                "type": "object",
                "properties": {
                    "file_path": {
                        "type": "string",
                        "description": "File path, relative to workspace",
                    },
                    "content": {
                        "type": "string",
                        "description": "Content to write to file",
                    },
                    "create_dirs": {
                        "type": "boolean",
                        "description": "Whether to create directories if they don't exist",
                        "default": True,
                    },
                    "create_backup": {
                        "type": "boolean",
                        "description": "Whether to create backup file if file already exists",
                        "default": False,
                    },
                },
                "required": ["file_path", "content"],
            },
        }

    @staticmethod
    def _get_write_multiple_files_tool() -> Dict[str, Any]:
        """Definition of the ``write_multiple_files`` batch-write tool."""
        return {
            "name": "write_multiple_files",
            "description": "Write multiple files in a single operation (for batch implementation)",
            "input_schema": {
                "type": "object",
                "properties": {
                    "file_implementations": {
                        "type": "string",
                        "description": 'JSON string mapping file paths to content, e.g., \'{"file1.py": "content1", "file2.py": "content2"}\'',
                    },
                    "create_dirs": {
                        "type": "boolean",
                        "description": "Whether to create directories if they don't exist",
                        "default": True,
                    },
                    "create_backup": {
                        "type": "boolean",
                        "description": "Whether to create backup files if they already exist",
                        "default": False,
                    },
                    "max_files": {
                        "type": "integer",
                        "description": "Maximum number of files to write in one operation",
                        "default": 5,
                        "minimum": 1,
                        "maximum": 10,
                    },
                },
                "required": ["file_implementations"],
            },
        }

    @staticmethod
    def _get_execute_python_tool() -> Dict[str, Any]:
        """Definition of the ``execute_python`` tool."""
        return {
            "name": "execute_python",
            "description": "Execute Python code and return output",
            "input_schema": {
                "type": "object",
                "properties": {
                    "code": {"type": "string", "description": "Python code to execute"},
                    "timeout": {
                        "type": "integer",
                        "description": "Timeout in seconds",
                        "default": 30,
                    },
                },
                "required": ["code"],
            },
        }

    @staticmethod
    def _get_execute_bash_tool() -> Dict[str, Any]:
        """Definition of the ``execute_bash`` tool."""
        return {
            "name": "execute_bash",
            "description": "Execute bash command",
            "input_schema": {
                "type": "object",
                "properties": {
                    "command": {
                        "type": "string",
                        "description": "Bash command to execute",
                    },
                    "timeout": {
                        "type": "integer",
                        "description": "Timeout in seconds",
                        "default": 30,
                    },
                },
                "required": ["command"],
            },
        }

    @staticmethod
    def _get_file_structure_tool() -> Dict[str, Any]:
        """Definition of the ``get_file_structure`` tool (no required inputs)."""
        return {
            "name": "get_file_structure",
            "description": "Get directory file structure",
            "input_schema": {
                "type": "object",
                "properties": {
                    "directory": {
                        "type": "string",
                        "description": "Directory path, relative to workspace",
                        "default": ".",
                    },
                    "max_depth": {
                        "type": "integer",
                        "description": "Maximum traversal depth",
                        "default": 5,
                    },
                },
            },
        }

    @staticmethod
    def _get_search_code_references_tool() -> Dict[str, Any]:
        """Definition of the unified ``search_code_references`` tool (three former steps merged into one)."""
        return {
            "name": "search_code_references",
            "description": "UNIFIED TOOL: Search relevant reference code from index files. Combines directory setup, index loading, and searching in a single call.",
            "input_schema": {
                "type": "object",
                "properties": {
                    "indexes_path": {
                        "type": "string",
                        "description": "Path to the indexes directory containing JSON index files",
                    },
                    "target_file": {
                        "type": "string",
                        "description": "Target file path to be implemented",
                    },
                    "keywords": {
                        "type": "string",
                        "description": "Search keywords, comma-separated",
                        "default": "",
                    },
                    "max_results": {
                        "type": "integer",
                        "description": "Maximum number of results to return",
                        "default": 10,
                    },
                },
                "required": ["indexes_path", "target_file"],
            },
        }

    @staticmethod
    def _get_search_code_tool() -> Dict[str, Any]:
        """Definition of the ``search_code`` tool (pattern search in the current repository)."""
        return {
            "name": "search_code",
            "description": "Search patterns in code files within the current repository",
            "input_schema": {
                "type": "object",
                "properties": {
                    "pattern": {
                        "type": "string",
                        "description": "Search pattern",
                    },
                    "file_pattern": {
                        "type": "string",
                        "description": "File pattern (e.g., '*.py')",
                        "default": "*.py",
                    },
                    "use_regex": {
                        "type": "boolean",
                        "description": "Whether to use regular expressions",
                        "default": False,
                    },
                    "search_directory": {
                        "type": "string",
                        "description": "Specify search directory (optional)",
                    },
                },
                "required": ["pattern"],
            },
        }

    @staticmethod
    def _get_operation_history_tool() -> Dict[str, Any]:
        """Definition of the ``get_operation_history`` tool (no required inputs)."""
        return {
            "name": "get_operation_history",
            "description": "Get operation history",
            "input_schema": {
                "type": "object",
                "properties": {
                    "last_n": {
                        "type": "integer",
                        "description": "Return the last N operations",
                        "default": 10,
                    },
                },
            },
        }

    @staticmethod
    def _get_get_indexes_overview_tool() -> Dict[str, Any]:
        """Definition of the ``get_indexes_overview`` tool."""
        return {
            "name": "get_indexes_overview",
            "description": "Get overview of all available reference code index information from specified directory",
            "input_schema": {
                "type": "object",
                "properties": {
                    "indexes_path": {
                        "type": "string",
                        "description": "Path to the indexes directory containing JSON index files",
                    }
                },
                "required": ["indexes_path"],
            },
        }

    @staticmethod
    def _get_set_workspace_tool() -> Dict[str, Any]:
        """Definition of the ``set_workspace`` tool."""
        return {
            "name": "set_workspace",
            "description": "Set the workspace directory for file operations",
            "input_schema": {
                "type": "object",
                "properties": {
                    "workspace_path": {
                        "type": "string",
                        "description": "Directory path for the workspace",
                    }
                },
                "required": ["workspace_path"],
            },
        }

    # @staticmethod
    # def _get_set_indexes_directory_tool() -> Dict[str, Any]:
    #     """Set indexes directory tool definition - DEPRECATED: Use unified search_code_references instead"""
    #     return {
    #         "name": "set_indexes_directory",
    #         "description": "Set the directory path for code reference indexes",
    #         "input_schema": {
    #             "type": "object",
    #             "properties": {
    #                 "indexes_path": {
    #                     "type": "string",
    #                     "description": "Directory path containing index JSON files"
    #                 }
    #             },
    #             "required": ["indexes_path"]
    #         }
    #     }

    # Code evaluation tool definitions
    @staticmethod
    def _get_analyze_repo_structure_tool() -> Dict[str, Any]:
        """Definition of the ``analyze_repo_structure`` tool."""
        return {
            "name": "analyze_repo_structure",
            "description": "Perform comprehensive repository structure analysis",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository to analyze",
                    }
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_detect_dependencies_tool() -> Dict[str, Any]:
        """Definition of the ``detect_dependencies`` tool."""
        return {
            "name": "detect_dependencies",
            "description": "Detect and analyze project dependencies across multiple languages",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository",
                    }
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_assess_code_quality_tool() -> Dict[str, Any]:
        """Definition of the ``assess_code_quality`` tool."""
        return {
            "name": "assess_code_quality",
            "description": "Assess code quality metrics and identify potential issues",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository",
                    }
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_evaluate_documentation_tool() -> Dict[str, Any]:
        """Definition of the ``evaluate_documentation`` tool (optional ``docs_path``)."""
        return {
            "name": "evaluate_documentation",
            "description": "Evaluate documentation completeness and quality",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository",
                    },
                    "docs_path": {
                        "type": "string",
                        "description": "Optional path to external documentation",
                    },
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_check_reproduction_readiness_tool() -> Dict[str, Any]:
        """Definition of the ``check_reproduction_readiness`` tool (optional ``docs_path``)."""
        return {
            "name": "check_reproduction_readiness",
            "description": "Assess repository readiness for reproduction and validation",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository",
                    },
                    "docs_path": {
                        "type": "string",
                        "description": "Optional path to reproduction documentation",
                    },
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_generate_evaluation_summary_tool() -> Dict[str, Any]:
        """Definition of the ``generate_evaluation_summary`` tool (optional ``docs_path``)."""
        return {
            "name": "generate_evaluation_summary",
            "description": "Generate comprehensive evaluation summary combining all analysis results",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository",
                    },
                    "docs_path": {
                        "type": "string",
                        "description": "Optional path to reproduction documentation",
                    },
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_detect_empty_files_tool() -> Dict[str, Any]:
        """Definition of the ``detect_empty_files`` tool."""
        return {
            "name": "detect_empty_files",
            "description": "Detect empty files in the repository that may need implementation",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository to analyze",
                    }
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_detect_missing_files_tool() -> Dict[str, Any]:
        """Definition of the ``detect_missing_files`` tool."""
        return {
            "name": "detect_missing_files",
            "description": "Detect missing essential files like main programs, tests, requirements, etc.",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository to analyze",
                    }
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def _get_generate_code_revision_report_tool() -> Dict[str, Any]:
        """Definition of the ``generate_code_revision_report`` tool (optional ``docs_path``)."""
        return {
            "name": "generate_code_revision_report",
            "description": "Generate comprehensive code revision report combining empty files, missing files, and quality analysis",
            "input_schema": {
                "type": "object",
                "properties": {
                    "repo_path": {
                        "type": "string",
                        "description": "Path to the repository to analyze",
                    },
                    "docs_path": {
                        "type": "string",
                        "description": "Optional path to documentation",
                    },
                },
                "required": ["repo_path"],
            },
        }

    @staticmethod
    def get_available_tool_sets() -> Dict[str, str]:
        """
        Describe the tool sets this class can provide.

        Returns:
            Mapping of tool-set name to a bilingual (Chinese / English)
            human-readable description.
        """
        return {
            "code_implementation": "代码实现相关工具集 / Code implementation tool set",
            "code_evaluation": "代码评估相关工具集 / Code evaluation tool set",
            # More tool sets can be added here, for example:
            # "data_analysis": "数据分析工具集 / Data analysis tool set",
            # "web_scraping": "网页爬取工具集 / Web scraping tool set",
        }

    @staticmethod
    def get_tool_set(tool_set_name: str) -> List[Dict[str, Any]]:
        """
        Return the tool definitions of one tool set.

        Args:
            tool_set_name: Name of the tool set, e.g. "code_implementation"
                or "code_evaluation".

        Returns:
            A freshly built list of tool definitions, or an empty list when
            the name is unknown.
        """
        # Map names to builder callables instead of built lists, so only the
        # requested set is constructed (and nothing for unknown names).
        builders = {
            "code_implementation": MCPToolDefinitions.get_code_implementation_tools,
            "code_evaluation": MCPToolDefinitions.get_code_evaluation_tools,
        }

        builder = builders.get(tool_set_name)
        return builder() if builder is not None else []

    @staticmethod
    def get_all_tools() -> List[Dict[str, Any]]:
        """
        Return the tools of every available tool set in one list.

        Returns:
            Tool definitions of all sets, concatenated in the order in which
            ``get_available_tool_sets`` lists the sets.
        """
        all_tools: List[Dict[str, Any]] = []
        for tool_set_name in MCPToolDefinitions.get_available_tool_sets():
            all_tools.extend(MCPToolDefinitions.get_tool_set(tool_set_name))
        return all_tools


# 便捷访问函数
def get_mcp_tools(tool_set: str = "code_implementation") -> List[Dict[str, Any]]:
    """
    Shortcut for fetching the MCP tool definitions of a single tool set.

    Args:
        tool_set: Tool set name (default: "code_implementation").

    Returns:
        The list of tool definitions that
        ``MCPToolDefinitions.get_tool_set`` returns for that name.
    """
    selected_tools = MCPToolDefinitions.get_tool_set(tool_set)
    return selected_tools


================================================
FILE: deepcode.py
================================================
#!/usr/bin/env python3
"""
DeepCode - AI Research Engine Launcher

🧬 Next-Generation AI Research Automation Platform
⚡ Transform research papers into working code automatically

Cross-platform support: Windows, macOS, Linux
"""

import os
import sys
import subprocess
import signal
import platform
import socket
import time
from pathlib import Path


# Global process references for cleanup: start_backend() / start_frontend()
# store the Popen handle of the service they launch here, and
# cleanup_processes() reads both to stop whatever is still running.
# None means the corresponding service has not been started.
_backend_process = None
_frontend_process = None


def get_platform():
    """
    Return a normalized name for the current operating system.

    Returns:
        "macos" when ``platform.system()`` reports Darwin, "windows" when it
        reports Windows, and "linux" for every other value.
    """
    known_systems = {"darwin": "macos", "windows": "windows"}
    return known_systems.get(platform.system().lower(), "linux")


def check_dependencies():
    """
    Check that everything needed to run the new UI is installed.

    Looks for the Python packages used by the backend (FastAPI, Uvicorn,
    PyYAML, pydantic-settings) and for the system tools used by the frontend
    (Node.js and npm). A status line is printed for each check, followed by
    installation hints for whatever is missing.

    Returns:
        True when every dependency is available, False otherwise.
    """
    import importlib.util
    import shutil

    print("🔍 Checking dependencies...")

    missing_deps = []
    missing_system_deps = []

    # (importable module, label printed on success, pip requirement if missing)
    python_packages = [
        ("fastapi", "FastAPI", "fastapi>=0.104.0"),
        ("uvicorn", "Uvicorn", "uvicorn>=0.24.0"),
        ("yaml", "PyYAML", "pyyaml>=6.0"),
        ("pydantic_settings", "Pydantic-settings", "pydantic-settings>=2.0.0"),
    ]
    for module_name, label, requirement in python_packages:
        if importlib.util.find_spec(module_name) is not None:
            print(f"✅ {label} is installed")
        else:
            missing_deps.append(requirement)

    on_windows = get_platform() == "windows"

    # Check Node.js availability (for frontend)
    node_cmd = "node.exe" if on_windows else "node"
    if shutil.which(node_cmd) or shutil.which("node"):
        try:
            result = subprocess.run(
                ["node", "--version"],
                capture_output=True,
                text=True,
                timeout=5,
                shell=on_windows,
            )
        except Exception:
            # Covers a hung or unlaunchable binary (timeout, OS error).
            node_ok = False
        else:
            node_ok = result.returncode == 0

        if node_ok:
            print(f"✅ Node.js is installed ({result.stdout.strip()})")
        else:
            # A `node` on PATH that cannot report its version is unusable, so
            # it must count as missing instead of being silently accepted.
            missing_system_deps.append("Node.js")
            print(
                "❌ Node.js was found but `node --version` failed "
                "(required for frontend)"
            )
    else:
        missing_system_deps.append("Node.js")
        print("❌ Node.js not found (required for frontend)")

    # Check npm availability
    npm_cmd = "npm.cmd" if on_windows else "npm"
    if shutil.which(npm_cmd) or shutil.which("npm"):
        print("✅ npm is available")
    else:
        missing_system_deps.append("npm")
        print("❌ npm not found (required for frontend)")

    if not missing_deps and not missing_system_deps:
        print("✅ All dependencies satisfied")
        return True

    # Something is missing: summarize it and explain how to install it.
    print("\n📋 Dependency Status:")

    if missing_deps:
        print("❌ Missing Python dependencies:")
        for dep in missing_deps:
            print(f"   - {dep}")
        print(f"\nInstall with: pip install {' '.join(missing_deps)}")

    if missing_system_deps:
        print("\n❌ Missing system dependencies:")
        for dep in missing_system_deps:
            print(f"   - {dep}")
        print("\nInstall Node.js:")
        print("   - Windows/macOS: https://nodejs.org/")
        print("   - macOS: brew install node")
        print("   - Ubuntu/Debian: sudo apt-get install nodejs npm")

    return False


def is_port_in_use(port: int) -> bool:
    """
    Report whether something accepts TCP connections on a local port.

    Args:
        port: TCP port number to probe on ``localhost``.

    Returns:
        True when the connection attempt succeeds, False otherwise.
    """
    probe = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
    with probe:
        status = probe.connect_ex(("localhost", port))
    return status == 0


def kill_process_on_port(port: int):
    """
    Force-kill the processes that own a local TCP port (cross-platform).

    On Windows the owning PIDs are read from ``netstat -ano`` and terminated
    with ``taskkill /F``; on macOS/Linux they are read from ``lsof`` and sent
    ``SIGKILL``. Only processes whose *local* socket uses ``port`` are
    targeted, so clients that are merely connected to the port (for example
    a browser tab) and longer ports containing the same digits (``:80001``)
    are left alone. Failures are reported on stdout and never raised.

    Args:
        port: TCP port number whose owning processes should be killed.
    """
    current_platform = get_platform()

    try:
        if current_platform == "windows":
            # Windows: use netstat and taskkill
            result = subprocess.run(
                f"netstat -ano | findstr :{port}",
                capture_output=True,
                text=True,
                shell=True,
            )
            pids = []
            for line in (result.stdout or "").splitlines():
                parts = line.split()
                # TCP rows read: proto, local address, foreign address,
                # state, PID. Shorter rows are not TCP rows.
                if len(parts) < 5:
                    continue
                local_address, pid = parts[1], parts[-1]
                # findstr also matches foreign addresses and longer ports;
                # keep only rows whose local endpoint is exactly this port.
                if not local_address.endswith(f":{port}"):
                    continue
                # PID 0 (shown for TIME_WAIT rows) is not a killable process.
                if pid.isdigit() and pid != "0" and pid not in pids:
                    pids.append(pid)

            for pid in pids:
                outcome = subprocess.run(
                    f"taskkill /F /PID {pid}",
                    shell=True,
                    capture_output=True,
                )
                if outcome.returncode == 0:
                    print(f"  ✓ Killed process on port {port} (PID: {pid})")
                else:
                    print(
                        f"  ⚠️ Could not kill process on port {port} (PID: {pid})"
                    )
        else:
            # macOS/Linux: use lsof. -sTCP:LISTEN restricts the result to
            # listeners; a bare `-i :PORT` would also list every client
            # connected to the port.
            result = subprocess.run(
                f"lsof -t -iTCP:{port} -sTCP:LISTEN",
                capture_output=True,
                text=True,
                shell=True,
            )
            for pid in (result.stdout or "").split():
                if not pid.isdigit():
                    continue
                try:
                    os.kill(int(pid), signal.SIGKILL)
                except ProcessLookupError:
                    # Already gone (e.g. a child that died with its parent);
                    # keep going so the remaining PIDs are still handled.
                    continue
                print(f"  ✓ Killed process on port {port} (PID: {pid})")
    except Exception as e:
        print(f"  ⚠️ Could not kill process on port {port}: {e}")


def cleanup_ports():
    """
    Free ports 8000 and 5173 when something is listening on them.

    For each busy port the owning process is killed, followed by a one
    second pause before the next port is examined.
    """
    service_ports = (8000, 5173)
    for port in service_ports:
        if not is_port_in_use(port):
            continue
        print(f"⚠️ Port {port} is in use, cleaning up...")
        kill_process_on_port(port)
        time.sleep(1)


def install_backend_deps():
    """
    Install the backend's Python packages with pip when FastAPI is absent.

    FastAPI is the only package probed; when it cannot be found the whole
    backend package list is installed through the running interpreter.

    Raises:
        subprocess.CalledProcessError: if pip exits with a non-zero status.
    """
    import importlib.util

    if importlib.util.find_spec("fastapi") is not None:
        return

    print("📦 Installing backend dependencies...")
    packages = (
        "fastapi",
        "uvicorn",
        "pydantic-settings",
        "python-multipart",
        "aiofiles",
        "websockets",
        "pyyaml",
    )
    pip_command = [sys.executable, "-m", "pip", "install", "-q", *packages]
    subprocess.run(pip_command, check=True)
    print("✅ Backend dependencies installed")


def install_frontend_deps(frontend_dir: Path):
    """
    Run ``npm install`` in the frontend directory on first use.

    Nothing happens when ``frontend_dir/node_modules`` already exists.

    Args:
        frontend_dir: Directory of the frontend project.

    Raises:
        subprocess.CalledProcessError: if ``npm install`` exits with a
            non-zero status.
    """
    if (frontend_dir / "node_modules").exists():
        return

    print("📦 Installing frontend dependencies (first run)...")
    on_windows = get_platform() == "windows"
    npm_executable = "npm.cmd" if on_windows else "npm"
    install_command = [npm_executable, "install"]
    subprocess.run(
        install_command,
        cwd=frontend_dir,
        check=True,
        shell=(get_platform() == "windows"),
    )
    print("✅ Frontend dependencies installed")


def start_backend(backend_dir: Path):
    """
    Launch the backend with ``uvicorn main:app --reload`` on 0.0.0.0:8000.

    The child process is started in its own process group (Windows) or
    session (other platforms) and its handle is stored in the module-level
    ``_backend_process``.

    Args:
        backend_dir: Working directory for the uvicorn process.

    Returns:
        True when the process is still running two seconds after launch,
        False when it has already exited.
    """
    global _backend_process

    print("🔧 Starting backend server...")

    if get_platform() != "windows":
        uvicorn_args = [
            sys.executable,
            "-m",
            "uvicorn",
            "main:app",
            "--host",
            "0.0.0.0",
            "--port",
            "8000",
            "--reload",
        ]
        _backend_process = subprocess.Popen(
            uvicorn_args,
            cwd=backend_dir,
            start_new_session=True,  # detach into a new process group
        )
    else:
        # On Windows the command is handed to the shell as a single string.
        command_line = f'"{sys.executable}" -m uvicorn main:app --host 0.0.0.0 --port 8000 --reload'
        _backend_process = subprocess.Popen(
            command_line,
            cwd=backend_dir,
            shell=True,
            creationflags=subprocess.CREATE_NEW_PROCESS_GROUP,
        )

    # Give the server a moment to come up (or to fail) before checking it.
    time.sleep(2)

    still_running = _backend_process.poll() is None
    if still_running:
        print("✅ Backend started: http://localhost:8000")
    else:
        print("❌ Backend failed to start")
    return still_running


def start_frontend(frontend_dir: Path):
    """
    Launch the frontend dev server with ``npm run dev``.

    The child process is started in its own process group (Windows) or
    session (other platforms) and its handle is stored in the module-level
    ``_frontend_process``.

    Args:
        frontend_dir: Working directory for the npm process.

    Returns:
        True when the process is still running three seconds after launch,
        False when it has already exited.
    """
    global _frontend_process

    print("🎨 Starting frontend server...")

    on_windows = get_platform() == "windows"
    npm_cmd = "npm.cmd" if on_windows else "npm"

    if get_platform() != "windows":
        _frontend_process = subprocess.Popen(
            [npm_cmd, "run", "dev"],
            cwd=frontend_dir,
            start_new_session=True,  # detach into a new process group
        )
    else:
        # On Windows the command is handed to the shell as a single string.
        _frontend_process = subprocess.Popen(
            f"{npm_cmd} run dev",
            cwd=frontend_dir,
            shell=True,
            creationflags=subprocess.CREATE_NEW_PROCESS_GROUP,
        )

    # Give the dev server a moment to come up (or to fail) before checking it.
    time.sleep(3)

    still_running = _frontend_process.poll() is None
    if still_running:
        print("✅ Frontend started: http://localhost:5173")
    else:
        print("❌ Frontend failed to start")
    return still_running


def cleanup_processes():
    """Stop the backend and frontend child processes and free their ports.

    For each tracked process that is still running:

    * Windows: ``taskkill /F /T`` terminates the whole process tree.
    * Unix: the process group receives SIGTERM; if the process has not exited
      within five seconds (or signalling fails) the group receives SIGKILL and
      the child is then reaped so it does not linger as a zombie.

    If the platform-specific path raises, the function falls back to
    ``terminate()`` and finally ``kill()`` on the process itself. Afterwards
    any process still listening on ports 8000 or 5173 is killed.
    """
    global _backend_process, _frontend_process

    print("\n🛑 Stopping services...")

    for name, proc in [("Backend", _backend_process), ("Frontend", _frontend_process)]:
        if proc and proc.poll() is None:
            try:
                if get_platform() == "windows":
                    # Windows: use taskkill with /T to kill tree.
                    # An argument list avoids spawning an intermediate shell.
                    subprocess.run(
                        ["taskkill", "/F", "/T", "/PID", str(proc.pid)],
                        capture_output=True,
                    )
                else:
                    # Unix: kill the process group
                    try:
                        os.killpg(os.getpgid(proc.pid), signal.SIGTERM)
                        proc.wait(timeout=5)
                    except Exception:
                        os.killpg(os.getpgid(proc.pid), signal.SIGKILL)
                        # Reap the child so it is really gone (and its port
                        # released) before reporting success.
                        proc.wait(timeout=5)
                print(f"  ✓ {name} stopped")
            except Exception:
                # Fallback: try direct terminate
                try:
                    proc.terminate()
                    proc.wait(timeout=3)
                    print(f"  ✓ {name} stopped")
                except Exception:
                    try:
                        proc.kill()
                        print(f"  ✓ {name} killed")
                    except Exception:
                        print(f"  ⚠️ Could not stop {name}")

    # Also clean up any orphaned processes on ports
    time.sleep(0.5)
    for port in [8000, 5173]:
        if is_port_in_use(port):
            kill_process_on_port(port)

    print("✅ All services stopped")


def cleanup_cache():
    """Remove Python bytecode caches below the current working directory.

    Deletes every ``__pycache__`` directory and every ``*.pyc`` file found
    under ``.``. The walk uses the standard library instead of shelling out to
    ``find``/``rm`` so that it also works on Windows, where those commands and
    ``/dev/null`` are not available. Entries that cannot be removed are
    skipped (best effort), mirroring the previous ``2>/dev/null`` behaviour.
    """
    import shutil

    try:
        print("🧹 Cleaning up cache files...")
        for root, dirnames, filenames in os.walk("."):
            # Iterate over a copy: pruning ``dirnames`` in place keeps os.walk
            # from descending into directories that were just deleted.
            for dirname in list(dirnames):
                if dirname != "__pycache__":
                    continue
                target = os.path.join(root, dirname)
                # Only real directories are removed, never symlinks to them.
                if not os.path.islink(target):
                    shutil.rmtree(target, ignore_errors=True)
                dirnames.remove(dirname)

            for filename in filenames:
                if filename.endswith(".pyc"):
                    try:
                        os.remove(os.path.join(root, filename))
                    except OSError:
                        # Best effort: a locked or vanished file is not fatal.
                        pass
        print("✅ Cache cleanup completed")
    except Exception as e:
        print(f"⚠️  Cache cleanup failed: {e}")


def print_banner():
    """Print the boxed DeepCode startup banner to standard output."""
    print("""
╔══════════════════════════════════════════════════════════════╗
║                                                              ║
║    🧬 DeepCode - AI Research Engine                          ║
║                                                              ║
║    ⚡ NEURAL • AUTONOMOUS • REVOLUTIONARY ⚡                ║
║                                                              ║
║    Transform research papers into working code               ║
║    Next-generation AI automation platform                   ║
║                                                              ║
╚══════════════════════════════════════════════════════════════╝
""")


def launch_classic_ui():
    """Run the classic Streamlit UI in the foreground on localhost:8501.

    Exits with status 1 when Streamlit is not importable, when
    ``ui/streamlit_app.py`` is missing next to this file, or when the
    Streamlit process fails. Ctrl+C stops the server without an error exit.
    """
    from importlib.util import find_spec

    print("🌐 Launching Classic Streamlit UI...")

    # Streamlit must be importable in the current interpreter
    streamlit_missing = find_spec("streamlit") is None
    if streamlit_missing:
        print("❌ Streamlit is not installed.")
        print("Install with: pip install streamlit")
        sys.exit(1)

    streamlit_app_path = Path(__file__).parent.joinpath("ui", "streamlit_app.py")
    if not streamlit_app_path.exists():
        print(f"❌ Streamlit app not found: {streamlit_app_path}")
        sys.exit(1)

    print(f"📁 UI App: {streamlit_app_path}")
    print("🚀 Launching on http://localhost:8501")
    print("=" * 70)

    # Option/value pairs appended after `streamlit run <app>`
    server_options = {
        "--server.port": "8501",
        "--server.address": "localhost",
        "--browser.gatherUsageStats": "false",
    }
    cmd = [sys.executable, "-m", "streamlit", "run", str(streamlit_app_path)]
    for option, value in server_options.items():
        cmd.extend((option, value))

    try:
        subprocess.run(cmd, check=True)
    except KeyboardInterrupt:
        print("\n\n🛑 Streamlit server stopped by user")
    except Exception as e:
        print(f"\n❌ Error: {e}")
        sys.exit(1)


def _check_docker_prerequisites():
    """Validate the Docker setup and project files needed for a Docker launch.

    Checks, in order: the compose file exists, the ``docker`` executable is on
    PATH, ``docker info`` succeeds, the secrets file exists (it is created
    from the ``.example`` template if possible, after which the program exits
    with status 0 so the user can fill it in) and the config file exists.
    Every other failed check exits with status 1.

    On success the data directories are created, the working directory is
    changed to the directory containing this file, and a tuple
    ``(current_dir, compose_file, compose_args)`` is returned.
    """
    import shutil

    def _abort(*messages, code=1):
        # Print each message on its own line, then terminate the program.
        for message in messages:
            print(message)
        sys.exit(code)

    current_dir = Path(__file__).parent
    compose_file = current_dir / "deepcode_docker" / "docker-compose.yml"

    if not compose_file.exists():
        _abort(
            "❌ deepcode_docker/docker-compose.yml not found",
            "   Make sure you are running from the DeepCode project root.",
        )

    # Docker CLI must be installed
    if shutil.which("docker") is None:
        _abort(
            "❌ Docker not found. Please install Docker Desktop first.",
            "   https://www.docker.com/products/docker-desktop",
        )

    # Docker daemon must be reachable
    daemon_probe = subprocess.run(["docker", "info"], capture_output=True, text=True)
    if daemon_probe.returncode != 0:
        _abort(
            "❌ Docker is installed but not running.",
            "   Please start Docker Desktop and try again.",
        )

    # Secrets file: bootstrap it from the template when it is missing
    secrets_file = current_dir / "mcp_agent.secrets.yaml"
    if not secrets_file.exists():
        example = current_dir / "mcp_agent.secrets.yaml.example"
        if not example.exists():
            _abort(
                "❌ mcp_agent.secrets.yaml not found. Please create it with your API keys."
            )

        print("⚠️  mcp_agent.secrets.yaml not found.")
        print("   Creating from template...")
        shutil.copy2(example, secrets_file)
        _abort(
            f"   ✅ Created {secrets_file}",
            "",
            "   ⚠️  Please edit mcp_agent.secrets.yaml and fill in your API keys:",
            f"      {secrets_file}",
            "",
            "   At least ONE LLM provider key is required (OpenAI/Anthropic/Google).",
            "   Then run 'deepcode' again.",
            code=0,
        )

    # Main config file
    if not (current_dir / "mcp_agent.config.yaml").exists():
        _abort(
            "❌ mcp_agent.config.yaml not found.",
            "   This file should be in the project root.",
        )

    # Data directories that the compose file bind-mounts
    for dir_name in ("deepcode_lab", "uploads", "logs"):
        current_dir.joinpath(dir_name).mkdir(exist_ok=True)

    os.chdir(current_dir)
    return current_dir, compose_file, ["docker", "compose", "-f", str(compose_file)]


def launch_docker():
    """Start the DeepCode services in the background with ``docker compose``.

    Builds the image first when ``docker compose images -q`` prints nothing,
    then runs ``up -d`` and prints the URLs plus log/stop hints. A failing
    docker command exits with status 1; Ctrl+C only prints a notice.
    """
    _project_dir, _compose_path, compose_args = _check_docker_prerequisites()

    print("🐳 Starting DeepCode with Docker...")
    print("=" * 50)

    try:
        # An empty image listing is treated as "first run" and triggers a build
        listing = subprocess.run(
            [*compose_args, "images", "-q"], capture_output=True, text=True
        )
        image_missing = not listing.stdout.strip()
        if image_missing:
            print(
                "📦 First run detected — building Docker image (may take a few minutes)..."
            )
            subprocess.run([*compose_args, "build"], check=True)

        # Start (if already running, docker compose will detect and skip)
        subprocess.run([*compose_args, "up", "-d"], check=True)

        divider = "=" * 50
        summary_lines = (
            "",
            divider,
            "✅ DeepCode is running!",
            "",
            "   🌐 Open: http://localhost:8000",
            "   📚 Docs: http://localhost:8000/docs",
            "",
            "   📋 View logs:  docker logs deepcode -f",
            "   🛑 Stop:       docker compose -f deepcode_docker/docker-compose.yml down",
            divider,
        )
        for line in summary_lines:
            print(line)

    except subprocess.CalledProcessError as e:
        print(f"\n❌ Docker failed: {e}")
        sys.exit(1)
    except KeyboardInterrupt:
        print("\n🛑 Cancelled")


def launch_docker_cli():
    """Run the interactive DeepCode CLI in a throwaway Docker container.

    Builds the image first when ``docker compose images -q`` prints nothing,
    then runs ``docker compose run --rm -it deepcode cli``. A failing docker
    command exits with status 1; Ctrl+C only prints a notice.
    """
    _project_dir, _compose_path, compose_args = _check_docker_prerequisites()

    print("🖥️  Starting DeepCode CLI in Docker...")
    print("=" * 50)

    try:
        # An empty image listing is treated as "first run" and triggers a build
        listing = subprocess.run(
            [*compose_args, "images", "-q"], capture_output=True, text=True
        )
        image_missing = not listing.stdout.strip()
        if image_missing:
            print(
                "📦 First run detected — building Docker image (may take a few minutes)..."
            )
            subprocess.run([*compose_args, "build"], check=True)

        # Attach a TTY and remove the container once the CLI exits
        cli_command = [*compose_args, "run", "--rm", "-it", "deepcode", "cli"]
        subprocess.run(cli_command, check=True)

    except subprocess.CalledProcessError as e:
        print(f"\n❌ Docker failed: {e}")
        sys.exit(1)
    except KeyboardInterrupt:
        print("\n🛑 Cancelled")


def launch_paper_test(paper_name: str, fast_mode: bool = False):
    """Run ``test_paper.py`` for one paper and print follow-up instructions.

    Args:
        paper_name: Paper identifier passed to ``test_paper.py``.
        fast_mode: When true, ``--fast`` is appended to the setup command and
            to the suggested pipeline command.

    Exits with status 1 if the setup script fails or any other error occurs.
    """
    try:
        fast_label = "enabled" if fast_mode else "disabled"
        print("\n🧪 Launching Paper Test Mode")
        print(f"📄 Paper: {paper_name}")
        print(f"⚡ Fast mode: {fast_label}")
        print("=" * 60)

        # Run the test setup (script path is relative to the working directory)
        optional_flags = ["--fast"] if fast_mode else []
        setup_cmd = [sys.executable, "test_paper.py", paper_name, *optional_flags]
        result = subprocess.run(setup_cmd, check=True)

        if result.returncode != 0:
            return

        pipeline_cmd = f"python -m workflows.paper_test_engine --paper {paper_name}"
        if fast_mode:
            pipeline_cmd += " --fast"

        print("\n✅ Paper test setup completed successfully!")
        print("📁 Files are ready in deepcode_lab/papers/")
        print("\n💡 Next steps:")
        print("   1. Install MCP dependencies: pip install -r requirements.txt")
        print(f"   2. Run full pipeline: {pipeline_cmd}")

    except subprocess.CalledProcessError as e:
        print(f"\n❌ Paper test setup failed: {e}")
        sys.exit(1)
    except Exception as e:
        print(f"\n❌ Unexpected error: {e}")
        sys.exit(1)


def main():
    """Command-line entry point: dispatch on ``sys.argv`` to a launch mode.

    Modes:
        (no arguments) or ``--docker``: start the Docker deployment.
        ``--cli``: run the interactive CLI inside the Docker container.
        ``--classic``: run the classic Streamlit UI.
        ``test <paper> [--fast|-f]``: run the paper test setup.
        ``--help`` / ``-h`` / ``help``: print usage and the papers found in
            ``./papers``.
        ``--local``: start the backend and frontend dev servers locally and
            supervise them until one exits or Ctrl+C is pressed; child
            processes and bytecode caches are cleaned up on the way out.

    Any other first argument, or ``test`` without a paper name, prints a hint
    and exits with status 1.
    """
    # Parse command line arguments
    if len(sys.argv) > 1:
        if sys.argv[1] == "test":
            if len(sys.argv) < 3:
                # `test` is a documented command: report the missing argument
                # instead of falling through to "Unknown option: test".
                print("❌ Missing paper name.")
                print("Usage: deepcode test <paper> [--fast]")
                print("Run 'deepcode --help' for usage information.")
                sys.exit(1)

            # Paper testing mode: python deepcode.py test rice [--fast]
            paper_name = sys.argv[2]
            fast_mode = "--fast" in sys.argv or "-f" in sys.argv

            print_banner()
            launch_paper_test(paper_name, fast_mode)
            return
        elif sys.argv[1] == "--local":
            # Launch locally (without Docker) — fall through to local launch below
            print_banner()
        elif sys.argv[1] == "--docker":
            # Explicit Docker launch (same as default)
            print_banner()
            launch_docker()
            return
        elif sys.argv[1] == "--cli":
            # Launch CLI inside Docker container
            print_banner()
            launch_docker_cli()
            return
        elif sys.argv[1] == "--classic":
            # Launch classic Streamlit UI
            print_banner()
            launch_classic_ui()
            return
        elif sys.argv[1] in ["--help", "-h", "help"]:
            print_banner()
            print("""
🔧 Usage:
   deepcode                              - Launch via Docker (default, recommended)
   deepcode --docker                     - Same as above (launch via Docker)
   deepcode --cli                        - Launch interactive CLI in Docker
   deepcode --local                      - Launch locally (requires Python + Node.js)
   deepcode test <paper>                 - Test paper reproduction
   deepcode test <paper> --fast          - Test paper (fast mode)
   deepcode --classic                    - Launch classic Streamlit UI

📄 Examples:
   deepcode                              - Start with Docker (one command)
   deepcode --cli                        - Interactive CLI in Docker
   deepcode --local                      - Start the new UI locally
   deepcode test rice                    - Test RICE paper reproduction
   deepcode test rice --fast             - Test RICE paper (fast mode)

🌐 New UI Features:
   • User-in-Loop interaction
   • Real-time progress tracking
   • Inline chat interaction
   • Modern React-based interface

📁 Available papers:""")

            # List available papers (looked up relative to the working directory)
            papers_dir = "papers"
            if os.path.exists(papers_dir):
                for item in os.listdir(papers_dir):
                    item_path = os.path.join(papers_dir, item)
                    if os.path.isdir(item_path):
                        paper_md = os.path.join(item_path, "paper.md")
                        addendum_md = os.path.join(item_path, "addendum.md")
                        status = "✅" if os.path.exists(paper_md) else "❌"
                        addendum_status = "📄" if os.path.exists(addendum_md) else "➖"
                        print(f"   {status} {item} {addendum_status}")
            print(
                "\n   Legend: ✅ = paper.md exists, 📄 = addendum.md exists, ➖ = no addendum"
            )
            return
        else:
            # Unknown argument — show help hint
            print(f"Unknown option: {sys.argv[1]}")
            print("Run 'deepcode --help' for usage information.")
            sys.exit(1)
    else:
        # Default (no arguments) → Docker
        print_banner()
        launch_docker()
        return

    # --- Local launch (only reached via --local) ---

    # Show platform info
    current_platform = get_platform()
    print(f"🖥️  Platform: {current_platform.capitalize()}")

    # Check dependencies
    if not check_dependencies():
        print("\n🚨 Please install missing dependencies and try again.")
        sys.exit(1)

    # Get paths
    current_dir = Path(__file__).parent
    new_ui_dir = current_dir / "new_ui"
    backend_dir = new_ui_dir / "backend"
    frontend_dir = new_ui_dir / "frontend"

    # Check if new_ui directory exists
    if not new_ui_dir.exists():
        print(f"❌ New UI directory not found: {new_ui_dir}")
        sys.exit(1)

    print("\n🚀 Starting DeepCode New UI...")
    print("=" * 70)
    print("🎨 Frontend:  http://localhost:5173")
    print("🔧 Backend:   http://localhost:8000")
    print("📚 API Docs:  http://localhost:8000/docs")
    print("=" * 70)
    print("💡 Tip: Keep this terminal open while using the application")
    print("🛑 Press Ctrl+C to stop all services")
    print("=" * 70)

    try:
        # Clean up ports if in use
        cleanup_ports()

        # Install dependencies if needed
        install_backend_deps()
        install_frontend_deps(frontend_dir)

        # Start services (sys.exit inside this try still runs the finally
        # block below, so already-started children are cleaned up)
        if not start_backend(backend_dir):
            print("❌ Failed to start backend")
            sys.exit(1)

        if not start_frontend(frontend_dir):
            print("❌ Failed to start frontend")
            cleanup_processes()
            sys.exit(1)

        print("\n" + "=" * 70)
        print("╔════════════════════════════════════════╗")
        print("║  🎉 DeepCode New UI is running!        ║")
        print("╠════════════════════════════════════════╣")
        print("║                                        ║")
        print("║  🌐 Frontend: http://localhost:5173    ║")
        print("║  🔧 Backend:  http://localhost:8000    ║")
        print("║  📚 API Docs: http://localhost:8000/docs║")
        print("║                                        ║")
        print("║  Press Ctrl+C to stop all services     ║")
        print("╚════════════════════════════════════════╝")
        print("=" * 70 + "\n")

        # Wait for processes: poll once per second until either child exits
        while True:
            # Check if processes are still running
            if _backend_process and _backend_process.poll() is not None:
                print("⚠️ Backend process exited unexpectedly")
                break
            if _frontend_process and _frontend_process.poll() is not None:
                print("⚠️ Frontend process exited unexpectedly")
                break
            time.sleep(1)

    except KeyboardInterrupt:
        print("\n")
    except Exception as e:
        print(f"\n❌ Unexpected error: {e}")
    finally:
        cleanup_processes()
        cleanup_cache()
        print("Thank you for using DeepCode! 🧬")


# Run the launcher only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()


================================================
FILE: deepcode_docker/.dockerignore
================================================
# Git
.git
.gitignore

# Node
new_ui/frontend/node_modules
new_ui/frontend/dist

# Python
__pycache__
*.pyc
*.pyo
*.egg-info
.eggs
dist
build

# Virtual environments
.venv
venv
env

# IDE
.vscode
.idea
.cursor
*.swp
*.swo

# Runtime data
deepcode_lab
uploads
logs
*.log

# Docker
deepcode_docker/Dockerfile
deepcode_docker/docker-compose.yml
deepcode_docker/.dockerignore
deepcode_docker/run_docker.sh

# Documentation
assets
*.md
LICENSE


================================================
FILE: deepcode_docker/Dockerfile
================================================
# =============================================================
# DeepCode - Docker Build
# Multi-stage: Frontend build → Final image with Python + Node
# Build context is the project root (see docker-compose.yml).
# =============================================================

# ------ Stage 1: Build frontend static assets ------
FROM node:18-alpine AS frontend-builder

WORKDIR /build
# Copy the manifests first so the dependency layer is cached across source edits
COPY new_ui/frontend/package*.json ./
RUN npm ci --no-audit --no-fund
COPY new_ui/frontend/ ./
RUN npm run build


# ------ Stage 2: Final image ------
FROM python:3.10-slim

# Metadata
LABEL maintainer="DeepCode Team"
LABEL description="DeepCode - AI Research Engine"
LABEL version="1.0"

# Environment
ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    DEEPCODE_ENV=docker \
    DEEPCODE_HOST=0.0.0.0 \
    DEEPCODE_PORT=8000

# Install system dependencies:
#   - git: for git clone operations in workflows
#   - curl: for health checks and for downloading the Node.js tarball below
#   - ca-certificates: needed for the HTTPS download
#   - Node.js (node/npm/npx): for npx-based MCP servers (brave-search, filesystem);
#     installed from the official binary tarball, not from apt
#   - uv: Python package installer, used by mcp-server-fetch
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        git \
        curl \
        ca-certificates && \
    # Install Node.js 18 via official binary (includes npm + npx)
    ARCH=$(dpkg --print-architecture) && \
    if [ "$ARCH" = "arm64" ]; then NODE_ARCH="arm64"; else NODE_ARCH="x64"; fi && \
    curl -fsSL https://nodejs.org/dist/v18.20.8/node-v18.20.8-linux-${NODE_ARCH}.tar.gz \
        | tar -xz -C /usr/local --strip-components=1 && \
    # Install uv (Python package installer, used by mcp-server-fetch)
    pip install --no-cache-dir uv && \
    # Cleanup
    apt-get clean && \
    rm -rf /var/lib/apt/lists/* && \
    # Verify
    node --version && npm --version && npx --version

WORKDIR /app

# Install Python dependencies first (cache layer)
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Pre-install npx MCP server packages (avoid download at runtime).
# Failures are tolerated (`|| true`) so a download problem does not break the build.
RUN npx -y @modelcontextprotocol/server-brave-search --help 2>/dev/null || true && \
    npx -y @modelcontextprotocol/server-filesystem --help 2>/dev/null || true

# Copy project source code
COPY __init__.py setup.py deepcode.py ./
COPY config/ ./config/
COPY prompts/ ./prompts/
COPY schema/ ./schema/
COPY tools/ ./tools/
COPY utils/ ./utils/
COPY workflows/ ./workflows/
COPY cli/ ./cli/
COPY ui/ ./ui/
COPY new_ui/backend/ ./new_ui/backend/

# Copy frontend build output from Stage 1
COPY --from=frontend-builder /build/dist ./new_ui/frontend/dist

# Create runtime directories
RUN mkdir -p deepcode_lab uploads logs

# Copy entrypoint script
COPY deepcode_docker/docker-entrypoint.sh /docker-entrypoint.sh
RUN chmod +x /docker-entrypoint.sh

EXPOSE 8000

# Probe the port the entrypoint actually listens on: it starts uvicorn on
# ${DEEPCODE_PORT:-8000}, so a hard-coded 8000 would report "unhealthy"
# whenever DEEPCODE_PORT is overridden at runtime. The shell form of CMD is
# run through /bin/sh, which expands the variable inside the container.
HEALTHCHECK --interval=30s --timeout=10s --start-period=15s --retries=3 \
    CMD curl -f "http://localhost:${DEEPCODE_PORT:-8000}/health" || exit 1

ENTRYPOINT ["/docker-entrypoint.sh"]


================================================
FILE: deepcode_docker/docker-compose.yml
================================================
services:
  deepcode:
    build:
      context: ..
      dockerfile: deepcode_docker/Dockerfile
    container_name: deepcode
    ports:
      - "8000:8000"
    volumes:
      # Configuration (required)
      - ../mcp_agent.config.yaml:/app/mcp_agent.config.yaml:ro
      - ../mcp_agent.secrets.yaml:/app/mcp_agent.secrets.yaml:ro

      # Persistent data
      - ../deepcode_lab:/app/deepcode_lab
      - ../uploads:/app/uploads
      - ../logs:/app/logs
    environment:
      - DEEPCODE_ENV=docker
      - DEEPCODE_PORT=8000
    restart: unless-stopped

  nanobot:
    build:
      context: ..
      dockerfile: nanobot/Dockerfile
    container_name: nanobot
    ports:
      - "18790:18790"
    volumes:
      # nanobot configuration (Feishu/Telegram tokens, etc.)
      - ../nanobot_config.json:/root/.nanobot/config.json:ro

      # Persistent workspace data
      - nanobot-workspace:/root/.nanobot/workspace
      - nanobot-sessions:/root/.nanobot/sessions

      # Shared with DeepCode: nanobot can access generated code
      - ../deepcode_lab:/app/deepcode_lab
    environment:
      - NANOBOT_ENV=docker
      # Internal API URL for nanobot -> DeepCode communication
      - DEEPCODE_API_URL=http://deepcode:8000
    depends_on:
      - deepcode
    restart: unless-stopped

volumes:
  nanobot-workspace:
  nanobot-sessions:


================================================
FILE: deepcode_docker/docker-entrypoint.sh
================================================
#!/bin/bash
# Container entrypoint for DeepCode.
# Validates the configuration files in the working directory, then launches
# either the interactive CLI (first argument "cli") or the web server (default).
set -e

printf '%s\n' \
    "============================================" \
    "  DeepCode - AI Research Engine (Docker)" \
    "============================================"

# ------ Validate configuration ------
# A missing config file is only a warning; a missing secrets file is fatal.
[[ -f "mcp_agent.config.yaml" ]] \
    || echo "⚠️  mcp_agent.config.yaml not found, using default config"

if [[ ! -f "mcp_agent.secrets.yaml" ]]; then
    printf '%s\n' \
        "" \
        "❌ ERROR: mcp_agent.secrets.yaml not found!" \
        "" \
        "Please mount your secrets file:" \
        "  docker run -v ./mcp_agent.secrets.yaml:/app/mcp_agent.secrets.yaml ..." \
        "" \
        "Or use docker-compose with the provided template." \
        ""
    exit 1
fi

# ------ Ensure directories exist ------
mkdir -p deepcode_lab uploads logs

# ------ CLI mode: launch interactive CLI ------
# Arguments after "cli" are forwarded to the CLI; exec replaces this shell.
case "${1:-}" in
    cli)
        shift
        printf '%s\n' \
            "" \
            "🖥️  Starting DeepCode CLI..." \
            "============================================" \
            ""
        exec python cli/main_cli.py "$@"
        ;;
esac

# ------ Web mode (default): start backend + frontend ------
listen_port="${DEEPCODE_PORT:-8000}"
printf '%s\n' \
    "" \
    "🚀 Starting DeepCode..." \
    "   API:  http://localhost:${listen_port}" \
    "   Docs: http://localhost:${listen_port}/docs" \
    "============================================" \
    ""

exec python -m uvicorn new_ui.backend.main:app \
    --host "${DEEPCODE_HOST:-0.0.0.0}" \
    --port "${listen_port}" \
    --workers 1 \
    --log-level info


================================================
FILE: deepcode_docker/run_docker.sh
================================================
#!/bin/bash
# DeepCode Docker one-click launcher script

# Abort on the first command that fails
set -e

# Resolve paths relative to this script so it can be run from any directory
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_ROOT="$(cd "$SCRIPT_DIR/.." && pwd)"
COMPOSE_FILE="$SCRIPT_DIR/docker-compose.yml"

# Color definitions (ANSI escape sequences, rendered by `echo -e`)
RED='\033[0;31m'
GREEN='\033[0;32m'
BLUE='\033[0;34m'
YELLOW='\033[1;33m'
CYAN='\033[0;36m'
NC='\033[0m'

# Wrapper around `docker compose` that pins every call to this project's
# compose file and forwards all remaining arguments unchanged.
dc() {
    docker compose --file "$COMPOSE_FILE" "$@"
}

# Startup banner
printf '%s\n' \
    "" \
    "╔════════════════════════════════════════╗" \
    "║   DeepCode - Docker 启动脚本          ║" \
    "╚════════════════════════════════════════╝" \
    ""

# ============ Check the Docker environment ============
# Exits with status 1 unless the docker CLI is installed and `docker info`
# succeeds (i.e. the daemon is reachable).
check_docker() {
    command -v docker > /dev/null 2>&1 || {
        echo -e "${RED}❌ 未检测到 Docker，请先安装 Docker Desktop${NC}"
        echo "   下载地址: https://www.docker.com/products/docker-desktop"
        exit 1
    }

    docker info > /dev/null 2>&1 || {
        echo -e "${RED}❌ Docker 服务未运行，请先启动 Docker Desktop${NC}"
        exit 1
    }

    echo -e "${GREEN}✓ Docker 环境正常${NC}"
}

# ============ Check configuration files ============
# Requires mcp_agent.config.yaml and mcp_agent.secrets.yaml in the project
# root. A missing secrets file is created from the .example template when one
# exists; the script then exits with status 1 so the keys can be filled in.
check_config() {
    local config_file="$PROJECT_ROOT/mcp_agent.config.yaml"
    local secrets_file="$PROJECT_ROOT/mcp_agent.secrets.yaml"
    local secrets_template="${secrets_file}.example"

    if [[ ! -f "$config_file" ]]; then
        echo -e "${RED}❌ 缺少 mcp_agent.config.yaml 配置文件${NC}"
        exit 1
    fi
    echo -e "${GREEN}✓ mcp_agent.config.yaml 已找到${NC}"

    if [[ ! -f "$secrets_file" ]]; then
        if [[ ! -f "$secrets_template" ]]; then
            echo -e "${RED}❌ 缺少 mcp_agent.secrets.yaml，且未找到模板文件${NC}"
            exit 1
        fi

        echo -e "${YELLOW}⚠ 未找到 mcp_agent.secrets.yaml${NC}"
        echo -e "${YELLOW}  正在从模板创建...${NC}"
        cp "$secrets_template" "$secrets_file"
        echo -e "${YELLOW}  ⚡ 请编辑 mcp_agent.secrets.yaml 填入你的 API Key，然后重新运行此脚本${NC}"
        exit 1
    fi
    echo -e "${GREEN}✓ mcp_agent.secrets.yaml 已找到${NC}"
}

# ============ Create required directories ============
# Creates the data directories in the project root that the compose file
# bind-mounts into the container.
ensure_dirs() {
    mkdir -p "$PROJECT_ROOT"/{deepcode_lab,uploads,logs}
    echo -e "${GREEN}✓ 数据目录已就绪 (deepcode_lab/, uploads/, logs/)${NC}"
}

# ============ Parse command-line arguments ============
# Defaults: start the stack in the foreground without forcing a rebuild.
ACTION="up"
BUILD_FLAG=""
DETACH_FLAG=""

# Print the help text (options and examples) to standard output.
usage() {
    printf '%s\n' \
        "用法: $0 [选项]" \
        "" \
        "选项:" \
        "  --build       强制重新构建镜像" \
        "  -d, --detach  后台运行（不占用终端）" \
        "  stop          停止容器" \
        "  restart       重启容器" \
        "  logs          查看容器日志" \
        "  status        查看容器状态" \
        "  cli           在 Docker 容器内启动交互式 CLI" \
        "  clean         停止并删除容器和镜像" \
        "  -h, --help    显示帮助信息" \
        "" \
        "示例:" \
        "  $0                  # 构建并启动（首次会自动构建）" \
        "  $0 --build          # 强制重新构建后启动" \
        "  $0 -d               # 后台启动" \
        "  $0 stop             # 停止服务" \
        "  $0 logs             # 查看实时日志" \
        "  $0 cli              # 启动交互式 CLI" \
        "  $0 clean            # 完全清理"
}

# Consume flags and action words one at a time. Parsing stops at `cli`, so
# everything after it stays in "$@" and is forwarded to the CLI.
while (( $# > 0 )); do
    case "$1" in
        --build)
            BUILD_FLAG="--build"
            ;;
        -d|--detach)
            DETACH_FLAG="-d"
            ;;
        stop|restart|logs|status|clean)
            # The action word is used verbatim as the action name
            ACTION="$1"
            ;;
        cli)
            ACTION="cli"
            shift
            break  # Remaining args passed to CLI
            ;;
        -h|--help)
            usage
            exit 0
            ;;
        *)
            echo -e "${RED}未知参数: $1${NC}"
            usage
            exit 1
            ;;
    esac
    shift
done

# ============ Execute the selected action ============
case $ACTION in
    up)
        check_docker
        check_config
        ensure_dirs

        echo ""
        echo -e "${BLUE}🐳 启动 DeepCode Docker 容器...${NC}"

        # Check whether an image exists; build automatically on first run.
        # NOTE(review): this matches any `docker images` line containing
        # "deepcode", not only this project's image.
        if [ -z "$BUILD_FLAG" ]; then
            if ! docker images | grep -q "deepcode"; then
                echo -e "${YELLOW}⚡ 首次运行，自动构建镜像（可能需要几分钟）...${NC}"
                BUILD_FLAG="--build"
            fi
        fi

        # Flags are intentionally unquoted so empty ones expand to nothing
        dc up $BUILD_FLAG $DETACH_FLAG

        if [ -n "$DETACH_FLAG" ]; then
            # Detached mode: wait for the service to come up, then show info.
            # Polls /health up to 30 times, 2 seconds apart.
            echo ""
            echo -e "${YELLOW}⏳ 等待服务启动...${NC}"
            for i in $(seq 1 30); do
                if curl -sf http://localhost:8000/health > /dev/null 2>&1; then
                    echo ""
                    echo "╔════════════════════════════════════════╗"
                    echo -e "║  ${GREEN}DeepCode 已启动! (Docker)${NC}             ║"
                    echo "╠════════════════════════════════════════╣"
                    echo "║                                        ║"
                    echo "║  🌐 访问: http://localhost:8000        ║"
                    echo "║  📚 API:  http://localhost:8000/docs   ║"
                    echo "║                                        ║"
                    echo "║  查看日志: $0 logs                     ║"
                    echo "║  停止服务: $0 stop                     ║"
                    echo "╚════════════════════════════════════════╝"
                    echo ""
                    exit 0
                fi
                sleep 2
            done
            echo -e "${YELLOW}⚠ 服务仍在启动中，请稍后访问 http://localhost:8000${NC}"
            echo -e "   使用 ${CYAN}$0 logs${NC} 查看启动日志"
        fi
        ;;

    stop)
        check_docker
        echo -e "${BLUE}🛑 停止 DeepCode 容器...${NC}"
        dc down
        echo -e "${GREEN}✓ 服务已停止${NC}"
        ;;

    restart)
        check_docker
        echo -e "${BLUE}🔄 重启 DeepCode 容器...${NC}"
        # Restart always brings the stack back up detached
        dc down
        dc up -d $BUILD_FLAG
        echo -e "${GREEN}✓ 服务已重启${NC}"
        echo -e "   访问: http://localhost:8000"
        ;;

    logs)
        check_docker
        echo -e "${BLUE}📋 DeepCode 容器日志 (Ctrl+C 退出):${NC}"
        echo ""
        dc logs -f
        ;;

    status)
        check_docker
        echo -e "${BLUE}📊 DeepCode 容器状态:${NC}"
        echo ""
        dc ps
        echo ""
        # Check health status via the /health endpoint
        if curl -sf http://localhost:8000/health > /dev/null 2>&1; then
            echo -e "${GREEN}✓ 服务运行正常 (http://localhost:8000)${NC}"
        else
            echo -e "${YELLOW}⚠ 服务未响应或未启动${NC}"
        fi
        ;;

    cli)
        check_docker
        check_config
        ensure_dirs
        echo ""
        echo -e "${BLUE}🖥️  启动 DeepCode CLI (Docker)...${NC}"
        echo ""
        # "$@" holds the arguments that followed `cli` on the command line
        dc run --rm -it deepcode cli "$@"
        ;;

    clean)
        check_docker
        echo -e "${YELLOW}⚠ 即将停止并删除 DeepCode 容器和镜像${NC}"
        echo -e "${YELLOW}  (数据目录 deepcode_lab/, uploads/, logs/ 不会被删除)${NC}"
        # Only an explicit y/Y confirms; anything else cancels
        read -p "确认? [y/N] " confirm
        if [[ "$confirm" =~ ^[Yy]$ ]]; then
            dc down --rmi local --remove-orphans
            echo -e "${GREEN}✓ 已清理完成${NC}"
        else
            echo "已取消"
        fi
        ;;
esac


================================================
FILE: mcp_agent.config.yaml
================================================
$schema: ./schema/mcp-agent.config.schema.json
# NOTE: the `anthropic` provider settings are defined once, in the provider
# section near the end of this file. A second top-level `anthropic` key here
# would be a duplicate mapping key: strict YAML loaders reject it and lenient
# ones silently keep only the last occurrence.
default_search_server: filesystem
document_segmentation:
  enabled: false
  size_threshold_chars: 50000
execution_engine: asyncio
logger:
  level: info
  path_settings:
    path_pattern: logs/mcp-agent-{unique_id}.jsonl
    timestamp_format: '%Y%m%d_%H%M%S'
    unique_id: timestamp
  progress_display: false
  transports:
  - console
  - file
mcp:
  servers:
    bocha-mcp:
      args:
      - tools/bocha_search_server.py
      command: python
      env:
        BOCHA_API_KEY: ''
        PYTHONPATH: .
    brave:
      # macos and linux should use this
      args:
      - -y
      - '@modelcontextprotocol/server-brave-search'
      command: npx

      # windows should use this
      # args:
      # # please use the correct path for your system
      # - C:/Users/LEGION/AppData/Roaming/npm/node_modules/@modelcontextprotocol/server-brave-search/dist/index.js
      # command: node
      env:
        BRAVE_API_KEY: ''
    filesystem:
      # macos and linux should use this
      # Note: "No valid root directories" warning is harmless - connection still works
      args:
      - -y
      - '@modelcontextprotocol/server-filesystem'
      - .
      - ./deepcode_lab
      command: npx

      # windows should use this
      # args:
      # # please use the correct path for your system
      # - C:/Users/LEGION/AppData/Roaming/npm/node_modules/@modelcontextprotocol/server-filesystem/dist/index.js
      # - .
      # command: node


    code-implementation:
      args:
      - tools/code_implementation_server.py
      command: python
      description: Paper code reproduction tool server - provides file operations,
        code execution, search and other functions
      env:
        PYTHONPATH: .
    code-reference-indexer:
      args:
      - tools/code_reference_indexer.py
      command: python
      description: Code reference indexer server - Provides intelligent code reference
        search from indexed repositories
      env:
        PYTHONPATH: .
    command-executor:
      args:
      - tools/command_executor.py
      command: python
      env:
        PYTHONPATH: .
    document-segmentation:
      args:
      - tools/document_segmentation_server.py
      command: python
      description: Document segmentation server - Provides intelligent document analysis
        and segmented reading to optimize token usage
      env:
        PYTHONPATH: .
    fetch:
      args:
      - mcp-server-fetch
      command: uvx
    file-downloader:
      args:
      - tools/pdf_downloader.py
      command: python
      env:
        PYTHONPATH: .
    github-downloader:
      args:
      - tools/git_command.py
      command: python
      env:
        PYTHONPATH: .
# LLM provider priority: choose which LLM provider to use.
# Options: "anthropic", "google", "openai"
# If not set, or if the chosen provider is unavailable, the first available provider is used.
llm_provider: "openai"  # set to "google", "anthropic", or "openai"

# This section works with a regular OpenAI API key or with OpenRouter
# (for OpenRouter, set base_url in mcp_agent.secrets.yaml).
openai:
  base_max_tokens: 40000
  default_model: "google/gemini-3-flash-preview"
  planning_model: "google/gemini-3-flash-preview"
  implementation_model: "google/gemini-3-flash-preview"
  reasoning_effort: low  # Only for thinking models
  max_tokens_policy: adaptive
  retry_max_tokens: 32768

# Provider configurations
# default_model is used by mcp_agent for planning/analysis phases
# implementation_model is used by code_implementation_workflow for code generation
google:
  default_model: "gemini-3-pro-preview"
  planning_model: "gemini-3-pro-preview"
  implementation_model: "gemini-2.5-flash"

anthropic:
  default_model: "claude-sonnet-4.5"
  planning_model: "claude-sonnet-4.5"
  implementation_model: "claude-sonnet-3.5"


planning_mode: traditional


================================================
FILE: mcp_agent.secrets.yaml.example
================================================
# =============================================================
# DeepCode - API Keys Configuration
# =============================================================
# Copy this file to mcp_agent.secrets.yaml and fill in your keys.
#
# At least ONE LLM provider API key is required.
# Config file takes priority over environment variables.
# =============================================================

# OpenAI / OpenRouter
openai:
  api_key: ""
  # For OpenRouter (recommended - access multiple models via one key):
  # base_url: "https://openrouter.ai/api/v1"

# Anthropic (Claude)
anthropic:
  api_key: ""

# Google (Gemini)
google:
  api_key: ""


================================================
FILE: nanobot/.dockerignore
================================================
__pycache__
*.pyc
*.pyo
*.pyd
*.egg-info
dist/
build/
.git
.env
.assets
node_modules/
bridge/dist/
workspace/


================================================
FILE: nanobot/.gitignore
================================================
.assets
.env
*.pyc
dist/
build/
docs/
*.egg-info/
*.egg
*.pyc
*.pyo
*.pyd
*.pyw
*.pyz
*.pywz
*.pyzz
.venv/
__pycache__/
poetry.lock
.pytest_cache/
tests/
botpy.log


================================================
FILE: nanobot/COMMUNICATION.md
================================================
We provide QR codes for joining the HKUDS discussion groups on **WeChat** and **Feishu**.

You can join by scanning the QR codes below:

<img src="https://github.com/HKUDS/.github/blob/main/profile/QR.png" alt="WeChat QR Code" width="400"/>


================================================
FILE: nanobot/Dockerfile
================================================
# Image for the nanobot gateway: Python 3.12 (with uv) plus Node.js 20 for the WhatsApp bridge.
FROM ghcr.io/astral-sh/uv:python3.12-bookworm-slim

# Install Node.js 20 for the WhatsApp bridge
# gnupg is only needed to dearmor the NodeSource signing key, so it is purged again
# in the same layer; the apt lists are removed at the end of the layer as well.
RUN apt-get update && \
    apt-get install -y --no-install-recommends curl ca-certificates gnupg git && \
    mkdir -p /etc/apt/keyrings && \
    curl -fsSL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg && \
    echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_20.x nodistro main" > /etc/apt/sources.list.d/nodesource.list && \
    apt-get update && \
    apt-get install -y --no-install-recommends nodejs && \
    apt-get purge -y gnupg && \
    apt-get autoremove -y && \
    rm -rf /var/lib/apt/lists/*

WORKDIR /app

# Install Python dependencies first (cached layer)
# Note: build context is DeepCode root, so paths start with nanobot/
COPY nanobot/pyproject.toml nanobot/README.md nanobot/LICENSE ./
# A placeholder package (empty nanobot/__init__.py, empty bridge/) is created so the
# project can be installed before the real sources are copied; the placeholders are
# removed afterwards so the COPY steps below start from a clean tree.
RUN mkdir -p nanobot bridge && touch nanobot/__init__.py && \
    uv pip install --system --no-cache . && \
    rm -rf nanobot bridge

# Copy the full source and install
COPY nanobot/nanobot/ nanobot/
COPY nanobot/bridge/ bridge/
RUN uv pip install --system --no-cache .

# Build the WhatsApp bridge
WORKDIR /app/bridge
RUN npm install && npm run build
WORKDIR /app

# Create config directory
# (the README mounts the host's ~/.nanobot at this path)
RUN mkdir -p /root/.nanobot

# Gateway default port
EXPOSE 18790

# "nanobot gateway" is the default; arguments given to `docker run` replace CMD only.
ENTRYPOINT ["nanobot"]
CMD ["gateway"]


================================================
FILE: nanobot/LICENSE
================================================
MIT License

Copyright (c) 2025 nanobot contributors

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.


================================================
FILE: nanobot/README.md
================================================
<div align="center">
  <img src="nanobot_logo.png" alt="nanobot" width="500">
  <h1>nanobot: Ultra-Lightweight Personal AI Assistant</h1>
  <p>
    <a href="https://pypi.org/project/nanobot-ai/"><img src="https://img.shields.io/pypi/v/nanobot-ai" alt="PyPI"></a>
    <a href="https://pepy.tech/project/nanobot-ai"><img src="https://static.pepy.tech/badge/nanobot-ai" alt="Downloads"></a>
    <img src="https://img.shields.io/badge/python-≥3.11-blue" alt="Python">
    <img src="https://img.shields.io/badge/license-MIT-green" alt="License">
    <a href="./COMMUNICATION.md"><img src="https://img.shields.io/badge/Feishu-Group-E9DBFC?style=flat&logo=feishu&logoColor=white" alt="Feishu"></a>
    <a href="./COMMUNICATION.md"><img src="https://img.shields.io/badge/WeChat-Group-C5EAB4?style=flat&logo=wechat&logoColor=white" alt="WeChat"></a>
    <a href="https://discord.gg/MnCvHqpUGB"><img src="https://img.shields.io/badge/Discord-Community-5865F2?style=flat&logo=discord&logoColor=white" alt="Discord"></a>
  </p>
</div>

🐈 **nanobot** is an **ultra-lightweight** personal AI assistant inspired by [Clawdbot](https://github.com/openclaw/openclaw)

⚡️ Delivers core agent functionality in just **~4,000** lines of code — **99% smaller** than Clawdbot's 430k+ lines.

📏 Real-time line count: **3,510 lines** (run `bash core_agent_lines.sh` to verify anytime)

## 📢 News

- **2026-02-09** 💬 Added Slack, Email, and QQ support — nanobot now supports multiple chat platforms!
- **2026-02-08** 🔧 Refactored Providers—adding a new LLM provider now takes just 2 simple steps! Check [here](#providers).
- **2026-02-07** 🚀 Released v0.1.3.post5 with Qwen support & several key improvements! Check [here](https://github.com/HKUDS/nanobot/releases/tag/v0.1.3.post5) for details.
- **2026-02-06** ✨ Added Moonshot/Kimi provider, Discord integration, and enhanced security hardening!
- **2026-02-05** ✨ Added Feishu channel, DeepSeek provider, and enhanced scheduled tasks support!
- **2026-02-04** 🚀 Released v0.1.3.post4 with multi-provider & Docker support! Check [here](https://github.com/HKUDS/nanobot/releases/tag/v0.1.3.post4) for details.
- **2026-02-03** ⚡ Integrated vLLM for local LLM support and improved natural language task scheduling!
- **2026-02-02** 🎉 nanobot officially launched! Welcome to try 🐈 nanobot!

## Key Features of nanobot:

🪶 **Ultra-Lightweight**: Just ~4,000 lines of core agent code — 99% smaller than Clawdbot.

🔬 **Research-Ready**: Clean, readable code that's easy to understand, modify, and extend for research.

⚡️ **Lightning Fast**: Minimal footprint means faster startup, lower resource usage, and quicker iterations.

💎 **Easy-to-Use**: One-click to deploy and you're ready to go.

## 🏗️ Architecture

<p align="center">
  <img src="nanobot_arch.png" alt="nanobot architecture" width="800">
</p>

## ✨ Features

<table align="center">
  <tr align="center">
    <th><p align="center">📈 24/7 Real-Time Market Analysis</p></th>
    <th><p align="center">🚀 Full-Stack Software Engineer</p></th>
    <th><p align="center">📅 Smart Daily Routine Manager</p></th>
    <th><p align="center">📚 Personal Knowledge Assistant</p></th>
  </tr>
  <tr>
    <td align="center"><p align="center"><img src="case/search.gif" width="180" height="400"></p></td>
    <td align="center"><p align="center"><img src="case/code.gif" width="180" height="400"></p></td>
    <td align="center"><p align="center"><img src="case/scedule.gif" width="180" height="400"></p></td>
    <td align="center"><p align="center"><img src="case/memory.gif" width="180" height="400"></p></td>
  </tr>
  <tr>
    <td align="center">Discovery • Insights • Trends</td>
    <td align="center">Develop • Deploy • Scale</td>
    <td align="center">Schedule • Automate • Organize</td>
    <td align="center">Learn • Memory • Reasoning</td>
  </tr>
</table>

## 📦 Install

**Install from source** (latest features, recommended for development)

```bash
git clone https://github.com/HKUDS/nanobot.git
cd nanobot
pip install -e .
```

**Install with [uv](https://github.com/astral-sh/uv)** (stable, fast)

```bash
uv tool install nanobot-ai
```

**Install from PyPI** (stable)

```bash
pip install nanobot-ai
```

## 🚀 Quick Start

> [!TIP]
> Set your API key in `~/.nanobot/config.json`.
> Get API keys: [OpenRouter](https://openrouter.ai/keys) (Global) · [DashScope](https://dashscope.console.aliyun.com) (Qwen) · [Brave Search](https://brave.com/search/api/) (optional, for web search)

**1. Initialize**

```bash
nanobot onboard
```

**2. Configure** (`~/.nanobot/config.json`)

For OpenRouter - recommended for global users:
```json
{
  "providers": {
    "openrouter": {
      "apiKey": "sk-or-v1-xxx"
    }
  },
  "agents": {
    "defaults": {
      "model": "anthropic/claude-opus-4-5"
    }
  }
}
```

**3. Chat**

```bash
nanobot agent -m "What is 2+2?"
```

That's it! You have a working AI assistant in 2 minutes.

## 🖥️ Local Models (vLLM)

Run nanobot with your own local models using vLLM or any OpenAI-compatible server.

**1. Start your vLLM server**

```bash
vllm serve meta-llama/Llama-3.1-8B-Instruct --port 8000
```

**2. Configure** (`~/.nanobot/config.json`)

```json
{
  "providers": {
    "vllm": {
      "apiKey": "dummy",
      "apiBase": "http://localhost:8000/v1"
    }
  },
  "agents": {
    "defaults": {
      "model": "meta-llama/Llama-3.1-8B-Instruct"
    }
  }
}
```

**3. Chat**

```bash
nanobot agent -m "Hello from my local LLM!"
```

> [!TIP]
> The `apiKey` can be any non-empty string for local servers that don't require authentication.

## 💬 Chat Apps

Talk to your nanobot through Telegram, Discord, WhatsApp, Feishu, DingTalk, Slack, Email, or QQ — anytime, anywhere.

| Channel | Setup |
|---------|-------|
| **Telegram** | Easy (just a token) |
| **Discord** | Easy (bot token + intents) |
| **WhatsApp** | Medium (scan QR) |
| **Feishu** | Medium (app credentials) |
| **DingTalk** | Medium (app credentials) |
| **Slack** | Medium (bot + app tokens) |
| **Email** | Medium (IMAP/SMTP credentials) |
| **QQ** | Easy (app credentials) |

<details>
<summary><b>Telegram</b> (Recommended)</summary>

**1. Create a bot**
- Open Telegram, search `@BotFather`
- Send `/newbot`, follow prompts
- Copy the token

**2. Configure**

```json
{
  "channels": {
    "telegram": {
      "enabled": true,
      "token": "YOUR_BOT_TOKEN",
      "allowFrom": ["YOUR_USER_ID"]
    }
  }
}
```

> You can find your **User ID** in Telegram settings. It is shown as `@yourUserId`.
> Copy this value **without the `@` symbol** and paste it into the config file.


**3. Run**

```bash
nanobot gateway
```

</details>

<details>
<summary><b>Discord</b></summary>

**1. Create a bot**
- Go to https://discord.com/developers/applications
- Create an application → Bot → Add Bot
- Copy the bot token

**2. Enable intents**
- In the Bot settings, enable **MESSAGE CONTENT INTENT**
- (Optional) Enable **SERVER MEMBERS INTENT** if you plan to use allow lists based on member data

**3. Get your User ID**
- Discord Settings → Advanced → enable **Developer Mode**
- Right-click your avatar → **Copy User ID**

**4. Configure**

```json
{
  "channels": {
    "discord": {
      "enabled": true,
      "token": "YOUR_BOT_TOKEN",
      "allowFrom": ["YOUR_USER_ID"]
    }
  }
}
```

**5. Invite the bot**
- OAuth2 → URL Generator
- Scopes: `bot`
- Bot Permissions: `Send Messages`, `Read Message History`
- Open the generated invite URL and add the bot to your server

**6. Run**

```bash
nanobot gateway
```

</details>

<details>
<summary><b>WhatsApp</b></summary>

Requires **Node.js ≥20**.

**1. Link device**

```bash
nanobot channels login
# Scan QR with WhatsApp → Settings → Linked Devices
```

**2. Configure**

```json
{
  "channels": {
    "whatsapp": {
      "enabled": true,
      "allowFrom": ["+1234567890"]
    }
  }
}
```

**3. Run** (two terminals)

```bash
# Terminal 1
nanobot channels login

# Terminal 2
nanobot gateway
```

</details>

<details>
<summary><b>Feishu (飞书)</b></summary>

Uses **WebSocket** long connection — no public IP required.

**1. Create a Feishu bot**
- Visit [Feishu Open Platform](https://open.feishu.cn/app)
- Create a new app → Enable **Bot** capability
- **Permissions**: Add `im:message` (send messages)
- **Events**: Add `im.message.receive_v1` (receive messages)
  - Select **Long Connection** mode (requires running nanobot first to establish connection)
- Get **App ID** and **App Secret** from "Credentials & Basic Info"
- Publish the app

**2. Configure**

```json
{
  "channels": {
    "feishu": {
      "enabled": true,
      "appId": "cli_xxx",
      "appSecret": "xxx",
      "encryptKey": "",
      "verificationToken": "",
      "allowFrom": []
    }
  }
}
```

> `encryptKey` and `verificationToken` are optional for Long Connection mode.
> `allowFrom`: Leave empty to allow all users, or add `["ou_xxx"]` to restrict access.

**3. Run**

```bash
nanobot gateway
```

> [!TIP]
> Feishu uses WebSocket to receive messages — no webhook or public IP needed!

</details>

<details>
<summary><b>QQ (QQ私聊)</b></summary>

Uses **botpy SDK** with WebSocket — no public IP required.

**1. Create a QQ bot**
- Visit [QQ Open Platform](https://q.qq.com)
- Create a new bot application
- Get **AppID** and **Secret** from "Developer Settings"

**2. Configure**

```json
{
  "channels": {
    "qq": {
      "enabled": true,
      "appId": "YOUR_APP_ID",
      "secret": "YOUR_APP_SECRET",
      "allowFrom": []
    }
  }
}
```

> `allowFrom`: Leave empty for public access, or add user openids to restrict access.
> Example: `"allowFrom": ["user_openid_1", "user_openid_2"]`

**3. Run**

```bash
nanobot gateway
```

> [!TIP]
> QQ bot currently supports **private messages only**. Group chat support coming soon!

</details>

<details>
<summary><b>DingTalk (钉钉)</b></summary>

Uses **Stream Mode** — no public IP required.

**1. Create a DingTalk bot**
- Visit [DingTalk Open Platform](https://open-dev.dingtalk.com/)
- Create a new app -> Add **Robot** capability
- **Configuration**:
  - Toggle **Stream Mode** ON
- **Permissions**: Add necessary permissions for sending messages
- Get **AppKey** (Client ID) and **AppSecret** (Client Secret) from "Credentials"
- Publish the app

**2. Configure**

```json
{
  "channels": {
    "dingtalk": {
      "enabled": true,
      "clientId": "YOUR_APP_KEY",
      "clientSecret": "YOUR_APP_SECRET",
      "allowFrom": []
    }
  }
}
```

> `allowFrom`: Leave empty to allow all users, or add `["staffId"]` to restrict access.

**3. Run**

```bash
nanobot gateway
```

</details>

<details>
<summary><b>Slack</b></summary>

Uses **Socket Mode** — no public URL required.

**1. Create a Slack app**
- Go to [Slack API](https://api.slack.com/apps) → Create New App
- **OAuth & Permissions**: Add bot scopes: `chat:write`, `reactions:write`, `app_mentions:read`
- Install to your workspace and copy the **Bot Token** (`xoxb-...`)
- **Socket Mode**: Enable it and generate an **App-Level Token** (`xapp-...`) with `connections:write` scope
- **Event Subscriptions**: Subscribe to `message.im`, `message.channels`, `app_mention`

**2. Configure**

```json
{
  "channels": {
    "slack": {
      "enabled": true,
      "botToken": "xoxb-...",
      "appToken": "xapp-...",
      "groupPolicy": "mention"
    }
  }
}
```

> `groupPolicy`: `"mention"` (respond only when @mentioned), `"open"` (respond to all messages), or `"allowlist"` (restrict to specific channels).
> DM policy defaults to open. Set `"dm": {"enabled": false}` to disable DMs.

**3. Run**

```bash
nanobot gateway
```

</details>

<details>
<summary><b>Email</b></summary>

Give nanobot its own email account. It polls **IMAP** for incoming mail and replies via **SMTP** — like a personal email assistant.

**1. Get credentials (Gmail example)**
- Create a dedicated Gmail account for your bot (e.g. `my-nanobot@gmail.com`)
- Enable 2-Step Verification → Create an [App Password](https://myaccount.google.com/apppasswords)
- Use this app password for both IMAP and SMTP

**2. Configure**

> - `consentGranted` must be `true` to allow mailbox access. This is a safety gate — set `false` to fully disable.
> - `allowFrom`: Leave empty to accept emails from anyone, or restrict to specific senders.
> - `smtpUseTls` and `smtpUseSsl` default to `true` / `false` respectively, which is correct for Gmail (port 587 + STARTTLS). No need to set them explicitly.
> - Set `"autoReplyEnabled": false` if you only want to read/analyze emails without sending automatic replies.

```json
{
  "channels": {
    "email": {
      "enabled": true,
      "consentGranted": true,
      "imapHost": "imap.gmail.com",
      "imapPort": 993,
      "imapUsername": "my-nanobot@gmail.com",
      "imapPassword": "your-app-password",
      "smtpHost": "smtp.gmail.com",
      "smtpPort": 587,
      "smtpUsername": "my-nanobot@gmail.com",
      "smtpPassword": "your-app-password",
      "fromAddress": "my-nanobot@gmail.com",
      "allowFrom": ["your-real-email@gmail.com"]
    }
  }
}
```


**3. Run**

```bash
nanobot gateway
```

</details>

## ⚙️ Configuration

Config file: `~/.nanobot/config.json`

### Providers

> [!TIP]
> - **Groq** provides free voice transcription via Whisper. If configured, Telegram voice messages will be automatically transcribed.
> - **Zhipu Coding Plan**: If you're on Zhipu's coding plan, set `"apiBase": "https://open.bigmodel.cn/api/coding/paas/v4"` in your zhipu provider config.

| Provider | Purpose | Get API Key |
|----------|---------|-------------|
| `openrouter` | LLM (recommended, access to all models) | [openrouter.ai](https://openrouter.ai) |
| `anthropic` | LLM (Claude direct) | [console.anthropic.com](https://console.anthropic.com) |
| `openai` | LLM (GPT direct) | [platform.openai.com](https://platform.openai.com) |
| `deepseek` | LLM (DeepSeek direct) | [platform.deepseek.com](https://platform.deepseek.com) |
| `groq` | LLM + **Voice transcription** (Whisper) | [console.groq.com](https://console.groq.com) |
| `gemini` | LLM (Gemini direct) | [aistudio.google.com](https://aistudio.google.com) |
| `aihubmix` | LLM (API gateway, access to all models) | [aihubmix.com](https://aihubmix.com) |
| `dashscope` | LLM (Qwen) | [dashscope.console.aliyun.com](https://dashscope.console.aliyun.com) |
| `moonshot` | LLM (Moonshot/Kimi) | [platform.moonshot.cn](https://platform.moonshot.cn) |
| `zhipu` | LLM (Zhipu GLM) | [open.bigmodel.cn](https://open.bigmodel.cn) |
| `vllm` | LLM (local, any OpenAI-compatible server) | — |

<details>
<summary><b>Adding a New Provider (Developer Guide)</b></summary>

nanobot uses a **Provider Registry** (`nanobot/providers/registry.py`) as the single source of truth.
Adding a new provider only takes **2 steps** — no if-elif chains to touch.

**Step 1.** Add a `ProviderSpec` entry to `PROVIDERS` in `nanobot/providers/registry.py`:

```python
ProviderSpec(
    name="myprovider",                   # config field name
    keywords=("myprovider", "mymodel"),  # model-name keywords for auto-matching
    env_key="MYPROVIDER_API_KEY",        # env var for LiteLLM
    display_name="My Provider",          # shown in `nanobot status`
    litellm_prefix="myprovider",         # auto-prefix: model → myprovider/model
    skip_prefixes=("myprovider/",),      # don't double-prefix
)
```

**Step 2.** Add a field to `ProvidersConfig` in `nanobot/config/schema.py`:

```python
class ProvidersConfig(BaseModel):
    ...
    myprovider: ProviderConfig = ProviderConfig()
```

That's it! Environment variables, model prefixing, config matching, and `nanobot status` display will all work automatically.

**Common `ProviderSpec` options:**

| Field | Description | Example |
|-------|-------------|---------|
| `litellm_prefix` | Auto-prefix model names for LiteLLM | `"dashscope"` → `dashscope/qwen-max` |
| `skip_prefixes` | Don't prefix if model already starts with these | `("dashscope/", "openrouter/")` |
| `env_extras` | Additional env vars to set | `(("ZHIPUAI_API_KEY", "{api_key}"),)` |
| `model_overrides` | Per-model parameter overrides | `(("kimi-k2.5", {"temperature": 1.0}),)` |
| `is_gateway` | Can route any model (like OpenRouter) | `True` |
| `detect_by_key_prefix` | Detect gateway by API key prefix | `"sk-or-"` |
| `detect_by_base_keyword` | Detect gateway by API base URL | `"openrouter"` |
| `strip_model_prefix` | Strip existing prefix before re-prefixing | `True` (for AiHubMix) |

</details>


### Security

> For production deployments, set `"restrictToWorkspace": true` in your config to sandbox the agent.

| Option | Default | Description |
|--------|---------|-------------|
| `tools.restrictToWorkspace` | `false` | When `true`, restricts **all** agent tools (shell, file read/write/edit, list) to the workspace directory. Prevents path traversal and out-of-scope access. |
| `channels.*.allowFrom` | `[]` (allow all) | Whitelist of user IDs. Empty = allow everyone; non-empty = only listed users can interact. |


## CLI Reference

| Command | Description |
|---------|-------------|
| `nanobot onboard` | Initialize config & workspace |
| `nanobot agent -m "..."` | Chat with the agent |
| `nanobot agent` | Interactive chat mode |
| `nanobot agent --no-markdown` | Show plain-text replies |
| `nanobot agent --logs` | Show runtime logs during chat |
| `nanobot gateway` | Start the gateway |
| `nanobot status` | Show status |
| `nanobot channels login` | Link WhatsApp (scan QR) |
| `nanobot channels status` | Show channel status |

Interactive mode exits: `exit`, `quit`, `/exit`, `/quit`, `:q`, or `Ctrl+D`.

<details>
<summary><b>Scheduled Tasks (Cron)</b></summary>

```bash
# Add a job
nanobot cron add --name "daily" --message "Good morning!" --cron "0 9 * * *"
nanobot cron add --name "hourly" --message "Check status" --every 3600

# List jobs
nanobot cron list

# Remove a job
nanobot cron remove <job_id>
```

</details>

## 🐳 Docker

> [!TIP]
> The `-v ~/.nanobot:/root/.nanobot` flag mounts your local config directory into the container, so your config and workspace persist across container restarts.

Build and run nanobot in a container:

```bash
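# Build the image (run from the DeepCode repository root; the Dockerfile
# expects that build context and copies paths prefixed with nanobot/)
docker build -f nanobot/Dockerfile -t nanobot .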

# Initialize config (first time only)
docker run -v ~/.nanobot:/root/.nanobot --rm nanobot onboard

# Edit config on host to add API keys
vim ~/.nanobot/config.json

# Run gateway (connects to Telegram/WhatsApp)
docker run -v ~/.nanobot:/root/.nanobot -p 18790:18790 nanobot gateway

# Or run a single command
docker run -v ~/.nanobot:/root/.nanobot --rm nanobot agent -m "Hello!"
docker run -v ~/.nanobot:/root/.nanobot --rm nanobot status
```

## 📁 Project Structure

```
nanobot/
├── agent/          # 🧠 Core agent logic
│   ├── loop.py     #    Agent loop (LLM ↔ tool execution)
│   ├── context.py  #    Prompt builder
│   ├── memory.py   #    Persistent memory
│   ├── skills.py   #    Skills loader
│   ├── subagent.py #    Background task execution
│   └── tools/      #    Built-in tools (incl. spawn)
├── skills/         # 🎯 Bundled skills (github, weather, tmux...)
├── channels/       # 📱 Chat channel integrations (Telegram, WhatsApp, ...)
├── bus/            # 🚌 Message routing
├── cron/           # ⏰ Scheduled tasks
├── heartbeat/      # 💓 Proactive wake-up
├── providers/      # 🤖 LLM providers (OpenRouter, etc.)
├── session/        # 💬 Conversation sessions
├── config/         # ⚙️ Configuration
└── cli/            # 🖥️ Commands
```

## 🤝 Contribute & Roadmap

PRs welcome! The codebase is intentionally small and readable. 🤗

**Roadmap** — Pick an item and [open a PR](https://github.com/HKUDS/nanobot/pulls)!

- [x] **Voice Transcription** — Support for Groq Whisper (Issue #13)
- [ ] **Multi-modal** — See and hear (images, voice, video)
- [ ] **Long-term memory** — Never forget important context
- [ ] **Better reasoning** — Multi-step planning and reflection
- [ ] **More integrations** — Calendar and more
- [ ] **Self-improvement** — Learn from feedback and mistakes

### Contributors

<a href="https://github.com/HKUDS/nanobot/graphs/contributors">
  <img src="https://contrib.rocks/image?repo=HKUDS/nanobot&max=100&columns=12" />
</a>


## ⭐ Star History

<div align="center">
  <a href="https://star-history.com/#HKUDS/nanobot&Date">
    <picture>
      <source media="(prefers-color-scheme: dark)" srcset="https://api.star-history.com/svg?repos=HKUDS/nanobot&type=Date&theme=dark" />
      <source media="(prefers-color-scheme: light)" srcset="https://api.star-history.com/svg?repos=HKUDS/nanobot&type=Date" />
      <img alt="Star History Chart" src="https://api.star-history.com/svg?repos=HKUDS/nanobot&type=Date" style="border-radius: 15px; box-shadow: 0 0 30px rgba(0, 217, 255, 0.3);" />
    </picture>
  </a>
</div>

<p align="center">
  <em> Thanks for visiting ✨ nanobot!</em><br><br>
  <img src="https://visitor-badge.laobi.icu/badge?page_id=HKUDS.nanobot&style=for-the-badge&color=00d4ff" alt="Views">
</p>


<p align="center">
  <sub>nanobot is for educational, research, and technical exchange purposes only</sub>
</p>


================================================
FILE: nanobot/SECURITY.md
================================================
# Security Policy

## Reporting a Vulnerability

If you discover a security vulnerability in nanobot, please report it by:

1. **DO NOT** open a public GitHub issue
2. Create a private security advisory on GitHub or contact the repository maintainers
3. Include:
   - Description of the vulnerability
   - Steps to reproduce
   - Potential impact
   - Suggested fix (if any)

We aim to respond to security reports within 48 hours.

## Security Best Practices

### 1. API Key Management

**CRITICAL**: Never commit API keys to version control.

```bash
# ✅ Good: Store in config file with restricted permissions
chmod 600 ~/.nanobot/config.json

# ❌ Bad: Hardcoding keys in code or committing them
```

**Recommendations:**
- Store API keys in `~/.nanobot/config.json` with file permissions set to `0600`
- Consider using environment variables for sensitive keys
- Use OS keyring/credential manager for production deployments
- Rotate API keys regularly
- Use separate API keys for development and production

### 2. Channel Access Control

**IMPORTANT**: Always configure `allowFrom` lists for production use.

```json
{
  "channels": {
    "telegram": {
      "enabled": true,
      "token": "YOUR_BOT_TOKEN",
      "allowFrom": ["123456789", "987654321"]
    },
    "whatsapp": {
      "enabled": true,
      "allowFrom": ["+1234567890"]
    }
  }
}
```

**Security Notes:**
- Empty `allowFrom` list will **ALLOW ALL** users (open by default for personal use)
- Get your Telegram user ID from `@userinfobot`
- Use full phone numbers with country code for WhatsApp
- Review access logs regularly for unauthorized access attempts

### 3. Shell Command Execution

The `exec` tool can execute shell commands. While dangerous command patterns are blocked, you should:

- ✅ Review all tool usage in agent logs
- ✅ Understand what commands the agent is running
- ✅ Use a dedicated user account with limited privileges
- ✅ Never run nanobot as root
- ❌ Don't disable security checks
- ❌ Don't run on systems with sensitive data without careful review

**Blocked patterns:**
- `rm -rf /` - Root filesystem deletion
- Fork bombs
- Filesystem formatting (`mkfs.*`)
- Raw disk writes
- Other destructive operations

### 4. File System Access

File operations have path traversal protection, but:

- ✅ Run nanobot with a dedicated user account
- ✅ Use filesystem permissions to protect sensitive directories
- ✅ Regularly audit file operations in logs
- ❌ Don't give unrestricted access to sensitive files

### 5. Network Security

**API Calls:**
- All external API calls use HTTPS by default
- Timeouts are configured to prevent hanging requests
- Consider using a firewall to restrict outbound connections if needed

**WhatsApp Bridge:**
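- The bridge listens on port `3001` by default; the WebSocket server is created with a port only (no explicit host), so block that port with a firewall if the machine is reachable from other hosts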
- If exposing to network, use proper authentication and TLS
- Keep authentication data in `~/.nanobot/whatsapp-auth` secure (mode 0700)

### 6. Dependency Security

**Critical**: Keep dependencies updated!

```bash
# Check for vulnerable dependencies
pip install pip-audit
pip-audit

# Update to latest secure versions
pip install --upgrade nanobot-ai
```

For Node.js dependencies (WhatsApp bridge):
```bash
cd bridge
npm audit
npm audit fix
```

**Important Notes:**
- Keep `litellm` updated to the latest version for security fixes
- We've updated `ws` to `>=8.17.1` to fix a DoS vulnerability
- Run `pip-audit` or `npm audit` regularly
- Subscribe to security advisories for nanobot and its dependencies

### 7. Production Deployment

For production use:

1. **Isolate the Environment**
   ```bash
   # Run in a container or VM
   docker run --rm -it python:3.11
   pip install nanobot-ai
   ```

2. **Use a Dedicated User**
   ```bash
   sudo useradd -m -s /bin/bash nanobot
   sudo -u nanobot nanobot gateway
   ```

3. **Set Proper Permissions**
   ```bash
   chmod 700 ~/.nanobot
   chmod 600 ~/.nanobot/config.json
   chmod 700 ~/.nanobot/whatsapp-auth
   ```

4. **Enable Logging**
   ```bash
   # Configure log monitoring
   tail -f ~/.nanobot/logs/nanobot.log
   ```

5. **Use Rate Limiting**
   - Configure rate limits on your API providers
   - Monitor usage for anomalies
   - Set spending limits on LLM APIs

6. **Regular Updates**
   ```bash
   # Check for updates weekly
   pip install --upgrade nanobot-ai
   ```

### 8. Development vs Production

**Development:**
- Use separate API keys
- Test with non-sensitive data
- Enable verbose logging
- Use a test Telegram bot

**Production:**
- Use dedicated API keys with spending limits
- Restrict file system access
- Enable audit logging
- Regular security reviews
- Monitor for unusual activity

### 9. Data Privacy

- **Logs may contain sensitive information** - secure log files appropriately
- **LLM providers see your prompts** - review their privacy policies
- **Chat history is stored locally** - protect the `~/.nanobot` directory
- **API keys are in plain text** - use OS keyring for production

### 10. Incident Response

If you suspect a security breach:

1. **Immediately revoke compromised API keys**
2. **Review logs for unauthorized access**
   ```bash
   grep "Access denied" ~/.nanobot/logs/nanobot.log
   ```
3. **Check for unexpected file modifications**
4. **Rotate all credentials**
5. **Update to latest version**
6. **Report the incident** to maintainers

## Security Features

### Built-in Security Controls

✅ **Input Validation**
- Path traversal protection on file operations
- Dangerous command pattern detection
- Input length limits on HTTP requests

✅ **Authentication**
- Allow-list based access control
- Failed authentication attempt logging
- Open by default (configure allowFrom for production use)

✅ **Resource Protection**
- Command execution timeouts (60s default)
- Output truncation (10KB limit)
- HTTP request timeouts (10-30s)

✅ **Secure Communication**
- HTTPS for all external API calls
- TLS for Telegram API
- WebSocket security for WhatsApp bridge

## Known Limitations

⚠️ **Current Security Limitations:**

1. **No Rate Limiting** - Users can send unlimited messages (add your own if needed)
2. **Plain Text Config** - API keys stored in plain text (use keyring for production)
3. **No Session Management** - No automatic session expiry
4. **Limited Command Filtering** - Only blocks obvious dangerous patterns
5. **No Audit Trail** - Limited security event logging (enhance as needed)

## Security Checklist

Before deploying nanobot:

- [ ] API keys stored securely (not in code)
- [ ] Config file permissions set to 0600
- [ ] `allowFrom` lists configured for all channels
- [ ] Running as non-root user
- [ ] File system permissions properly restricted
- [ ] Dependencies updated to latest secure versions
- [ ] Logs monitored for security events
- [ ] Rate limits configured on API providers
- [ ] Backup and disaster recovery plan in place
- [ ] Security review of custom skills/tools

## Updates

**Last Updated**: 2026-02-03

For the latest security updates and announcements, check:
- GitHub Security Advisories: https://github.com/HKUDS/nanobot/security/advisories
- Release Notes: https://github.com/HKUDS/nanobot/releases

## License

See LICENSE file for details.


================================================
FILE: nanobot/bridge/package.json
================================================
{
  "name": "nanobot-whatsapp-bridge",
  "version": "0.1.0",
  "description": "WhatsApp bridge for nanobot using Baileys",
  "type": "module",
  "main": "dist/index.js",
  "scripts": {
    "build": "tsc",
    "start": "node dist/index.js",
    "dev": "tsc && node dist/index.js"
  },
  "dependencies": {
    "@whiskeysockets/baileys": "7.0.0-rc.9",
    "ws": "^8.17.1",
    "qrcode-terminal": "^0.12.0",
    "pino": "^9.0.0"
  },
  "devDependencies": {
    "@types/node": "^20.14.0",
    "@types/ws": "^8.5.10",
    "typescript": "^5.4.0"
  },
  "engines": {
    "node": ">=20.0.0"
  }
}


================================================
FILE: nanobot/bridge/src/index.ts
================================================
#!/usr/bin/env node
/**
 * nanobot WhatsApp Bridge
 *
 * This bridge connects WhatsApp Web to nanobot's Python backend
 * via WebSocket. It handles authentication, message forwarding,
 * and reconnection logic.
 *
 * Usage:
 *   npm run build && npm start
 *
 * Or with custom settings:
 *   BRIDGE_PORT=3001 AUTH_DIR=~/.nanobot/whatsapp npm start
 */

// Polyfill crypto for Baileys in ESM
import { webcrypto } from 'crypto';
if (!globalThis.crypto) {
  (globalThis as any).crypto = webcrypto;
}

import { BridgeServer } from './server.js';
import { homedir } from 'os';
import { join } from 'path';

// Runtime configuration: both values can be overridden through the environment.
const PORT = Number.parseInt(process.env.BRIDGE_PORT || '3001', 10);
const AUTH_DIR = process.env.AUTH_DIR || join(homedir(), '.nanobot', 'whatsapp-auth');

console.log('🐈 nanobot WhatsApp Bridge');
console.log('========================\n');

const server = new BridgeServer(PORT, AUTH_DIR);

/**
 * Stop the bridge and terminate the process with exit code 0.
 *
 * @param banner Optional text printed before shutdown begins.
 */
async function shutdown(banner?: string): Promise<void> {
  if (banner !== undefined) {
    console.log(banner);
  }
  await server.stop();
  process.exit(0);
}

// Graceful shutdown: only the interactive Ctrl-C path prints a banner.
process.on('SIGINT', () => shutdown('\n\nShutting down...'));
process.on('SIGTERM', () => shutdown());

// Boot the bridge; a startup failure is fatal.
server.start().catch((startupError) => {
  console.error('Failed to start bridge:', startupError);
  process.exit(1);
});


================================================
FILE: nanobot/bridge/src/server.ts
================================================
/**
 * WebSocket server for Python-Node.js bridge communication.
 */

import { WebSocketServer, WebSocket } from 'ws';
import { WhatsAppClient, InboundMessage } from './whatsapp.js';

/**
 * Command a connected WebSocket client sends to the bridge.
 * The server forwards `text` to the WhatsApp chat identified by `to`.
 */
interface SendCommand {
  // Discriminator; 'send' is the only command type the server acts on.
  type: 'send';
  // Destination passed as the first argument to WhatsAppClient.sendMessage.
  to: string;
  // Message body passed as the second argument to WhatsAppClient.sendMessage.
  text: string;
}

/**
 * Event the bridge broadcasts to every connected WebSocket client.
 * `type` identifies the event; the remaining keys carry its payload.
 */
interface BridgeMessage {
  type: 'message' | 'status' | 'qr' | 'error';
  // Payload fields vary by event type, hence the open index signature.
  [key: string]: unknown;
}

/**
 * WebSocket server that relays traffic between connected clients and WhatsApp.
 *
 * Inbound WhatsApp events (messages, QR codes, status changes) are broadcast
 * to every connected client; `send` commands received from a client are
 * forwarded to WhatsApp and acknowledged on the same socket.
 */
export class BridgeServer {
  private wss: WebSocketServer | null = null;
  private wa: WhatsAppClient | null = null;
  private clients: Set<WebSocket> = new Set();

  /**
   * @param port    TCP port the WebSocket server listens on.
   * @param authDir Directory handed to the WhatsApp client for its auth state.
   */
  constructor(private port: number, private authDir: string) {}

  /**
   * Start listening for clients and connect to WhatsApp.
   * Resolves once the initial WhatsApp connect call has returned.
   */
  async start(): Promise<void> {
    // NOTE(review): no `host` option is passed, so the library's default bind
    // address applies even though the log line below says "localhost". The
    // socket accepts unauthenticated `send` commands - confirm the port is not
    // reachable from untrusted networks.
    this.wss = new WebSocketServer({ port: this.port });
    console.log(`🌉 Bridge server listening on ws://localhost:${this.port}`);

    // Initialize WhatsApp client; every callback fans out to all clients.
    this.wa = new WhatsAppClient({
      authDir: this.authDir,
      onMessage: (msg) => this.broadcast({ type: 'message', ...msg }),
      onQR: (qr) => this.broadcast({ type: 'qr', qr }),
      onStatus: (status) => this.broadcast({ type: 'status', status }),
    });

    // Handle WebSocket connections
    this.wss.on('connection', (ws) => {
      console.log('🔗 Python client connected');
      this.clients.add(ws);

      ws.on('message', async (data) => {
        try {
          const cmd = JSON.parse(data.toString()) as SendCommand;
          // handleCommand throws when nothing was sent, so the 'sent'
          // acknowledgement below is only emitted for a real delivery attempt.
          await this.handleCommand(cmd);
          ws.send(JSON.stringify({ type: 'sent', to: cmd.to }));
        } catch (error) {
          console.error('Error handling command:', error);
          ws.send(JSON.stringify({ type: 'error', error: String(error) }));
        }
      });

      ws.on('close', () => {
        console.log('🔌 Python client disconnected');
        this.clients.delete(ws);
      });

      ws.on('error', (error) => {
        console.error('WebSocket error:', error);
        this.clients.delete(ws);
      });
    });

    // Connect to WhatsApp
    await this.wa.connect();
  }

  /**
   * Execute a command received from a client.
   *
   * @throws Error if the payload is not a well-formed `send` command or the
   *         WhatsApp client is unavailable. Previously these cases were
   *         silently ignored and the caller still reported the message as sent.
   */
  private async handleCommand(cmd: SendCommand): Promise<void> {
    // The value comes straight from JSON.parse, so the static type is not a
    // guarantee; validate the shape before using it.
    const payload = cmd as unknown as { type?: unknown; to?: unknown; text?: unknown } | null;

    if (!payload || payload.type !== 'send') {
      throw new Error(`Unsupported command type: ${String(payload?.type)}`);
    }
    if (typeof payload.to !== 'string' || typeof payload.text !== 'string') {
      throw new Error("'send' command requires string 'to' and 'text' fields");
    }
    if (!this.wa) {
      throw new Error('WhatsApp client not initialized');
    }

    await this.wa.sendMessage(payload.to, payload.text);
  }

  /** Serialize `msg` once and send it to every client whose socket is open. */
  private broadcast(msg: BridgeMessage): void {
    const data = JSON.stringify(msg);
    for (const client of this.clients) {
      if (client.readyState === WebSocket.OPEN) {
        client.send(data);
      }
    }
  }

  /** Close all client sockets, the server, and the WhatsApp connection. */
  async stop(): Promise<void> {
    // Close all client connections
    for (const client of this.clients) {
      client.close();
    }
    this.clients.clear();

    // Close WebSocket server
    if (this.wss) {
      this.wss.close();
      this.wss = null;
    }

    // Disconnect WhatsApp
    if (this.wa) {
      await this.wa.disconnect();
      this.wa = null;
    }
  }
}


================================================
FILE: nanobot/bridge/src/types.d.ts
================================================
// Ambient type declaration for the `qrcode-terminal` package.
// Only `generate` is declared here.
declare module 'qrcode-terminal' {
  // Takes the text to encode and an optional `small` flag; returns nothing.
  export function generate(text: string, options?: { small?: boolean }): void;
}


================================================
FILE: nanobot/bridge/src/whatsapp.ts
================================================
/**
 * WhatsApp client wrapper using Baileys.
 * Based on OpenClaw's working implementation.
 */

/* eslint-disable @typescript-eslint/no-explicit-any */
import makeWASocket, {
  DisconnectReason,
  useMultiFileAuthState,
  fetchLatestBaileysVersion,
  makeCacheableSignalKeyStore,
} from '@whiskeysockets/baileys';

import { Boom } from '@hapi/boom';
import qrcode from 'qrcode-terminal';
import pino from 'pino';

const VERSION = '0.1.0';

/** Normalized form of a received WhatsApp message, as passed to `onMessage`. */
export interface InboundMessage {
  // Message key id ('' when the key carries none).
  id: string;
  // The message key's remoteJid ('' when absent).
  sender: string;
  // The message key's remoteJidAlt ('' when absent).
  // NOTE(review): presumably the phone-number JID - confirm against Baileys.
  pn: string;
  // Extracted text; media captions are prefixed with a tag such as "[Image]".
  content: string;
  // The raw messageTimestamp from the Baileys message.
  timestamp: number;
  // True when remoteJid ends with '@g.us'.
  isGroup: boolean;
}

/** Construction options and event callbacks for WhatsAppClient. */
export interface WhatsAppClientOptions {
  // Directory passed to useMultiFileAuthState for the auth state.
  authDir: string;
  // Invoked once per inbound message that has extractable content.
  onMessage: (msg: InboundMessage) => void;
  // Invoked with the raw QR string whenever a connection update carries one.
  onQR: (qr: string) => void;
  // Invoked with 'connected' or 'disconnected' on connection state changes.
  onStatus: (status: string) => void;
}

/**
 * Thin wrapper around a Baileys socket.
 *
 * Handles QR display, automatic reconnection, and conversion of incoming
 * Baileys messages into `InboundMessage` objects delivered via callbacks.
 */
export class WhatsAppClient {
  private sock: any = null;
  private options: WhatsAppClientOptions;
  private reconnecting = false;
  // Handle of the pending reconnect timer, kept so disconnect() can cancel it.
  private reconnectTimer: ReturnType<typeof setTimeout> | null = null;
  // Set by disconnect(); suppresses automatic reconnects after an explicit stop.
  private stopped = false;

  constructor(options: WhatsAppClientOptions) {
    this.options = options;
  }

  /**
   * Open a socket to WhatsApp and register all event handlers.
   * Rejects if loading the auth state or fetching the Baileys version fails.
   */
  async connect(): Promise<void> {
    // An explicit connect() re-enables automatic reconnects.
    this.stopped = false;

    const logger = pino({ level: 'silent' });
    const { state, saveCreds } = await useMultiFileAuthState(this.options.authDir);
    const { version } = await fetchLatestBaileysVersion();

    // disconnect() may have been called while the awaits above were pending;
    // do not open a socket the owner has already asked to close.
    if (this.stopped) return;

    console.log(`Using Baileys version: ${version.join('.')}`);

    // Create socket following OpenClaw's pattern
    this.sock = makeWASocket({
      auth: {
        creds: state.creds,
        keys: makeCacheableSignalKeyStore(state.keys, logger),
      },
      version,
      logger,
      printQRInTerminal: false,
      browser: ['nanobot', 'cli', VERSION],
      syncFullHistory: false,
      markOnlineOnConnect: false,
    });

    // Handle WebSocket errors
    if (this.sock.ws && typeof this.sock.ws.on === 'function') {
      this.sock.ws.on('error', (err: Error) => {
        console.error('WebSocket error:', err.message);
      });
    }

    // Handle connection updates
    this.sock.ev.on('connection.update', async (update: any) => {
      const { connection, lastDisconnect, qr } = update;

      if (qr) {
        // Display QR code in terminal
        console.log('\n📱 Scan this QR code with WhatsApp (Linked Devices):\n');
        qrcode.generate(qr, { small: true });
        this.options.onQR(qr);
      }

      if (connection === 'close') {
        const statusCode = (lastDisconnect?.error as Boom)?.output?.statusCode;
        // Reconnect unless WhatsApp logged us out or disconnect() was called.
        const shouldReconnect = statusCode !== DisconnectReason.loggedOut && !this.stopped;

        console.log(`Connection closed. Status: ${statusCode}, Will reconnect: ${shouldReconnect}`);
        this.options.onStatus('disconnected');

        if (shouldReconnect) {
          this.scheduleReconnect();
        }
      } else if (connection === 'open') {
        console.log('✅ Connected to WhatsApp');
        this.options.onStatus('connected');
      }
    });

    // Save credentials on update
    this.sock.ev.on('creds.update', saveCreds);

    // Handle incoming messages
    this.sock.ev.on('messages.upsert', async ({ messages, type }: { messages: any[]; type: string }) => {
      if (type !== 'notify') return;

      for (const msg of messages) {
        // Skip own messages
        if (msg.key.fromMe) continue;

        // Skip status updates
        if (msg.key.remoteJid === 'status@broadcast') continue;

        const content = this.extractMessageContent(msg);
        if (!content) continue;

        const isGroup = msg.key.remoteJid?.endsWith('@g.us') || false;

        this.options.onMessage({
          id: msg.key.id || '',
          sender: msg.key.remoteJid || '',
          pn: msg.key.remoteJidAlt || '',
          content,
          timestamp: msg.messageTimestamp as number,
          isGroup,
        });
      }
    });
  }

  /**
   * Schedule a single reconnect attempt in 5 seconds.
   *
   * At most one attempt is pending at a time. If the attempt itself fails
   * (for example the version fetch rejects), the failure is logged and another
   * attempt is scheduled instead of surfacing as an unhandled rejection.
   */
  private scheduleReconnect(): void {
    if (this.stopped || this.reconnecting) return;

    this.reconnecting = true;
    console.log('Reconnecting in 5 seconds...');
    this.reconnectTimer = setTimeout(() => {
      this.reconnectTimer = null;
      this.reconnecting = false;
      this.connect().catch((err) => {
        console.error('Reconnect failed:', err);
        this.scheduleReconnect();
      });
    }, 5000);
  }

  /**
   * Reduce a Baileys message to a text string.
   *
   * @returns The text (captions are prefixed with a media tag), or null when
   *          the message has no supported textual content.
   */
  private extractMessageContent(msg: any): string | null {
    const message = msg.message;
    if (!message) return null;

    // Text message
    if (message.conversation) {
      return message.conversation;
    }

    // Extended text (reply, link preview)
    if (message.extendedTextMessage?.text) {
      return message.extendedTextMessage.text;
    }

    // Image with caption
    if (message.imageMessage?.caption) {
      return `[Image] ${message.imageMessage.caption}`;
    }

    // Video with caption
    if (message.videoMessage?.caption) {
      return `[Video] ${message.videoMessage.caption}`;
    }

    // Document with caption
    if (message.documentMessage?.caption) {
      return `[Document] ${message.documentMessage.caption}`;
    }

    // Voice/Audio message
    if (message.audioMessage) {
      return `[Voice Message]`;
    }

    return null;
  }

  /**
   * Send a plain-text message.
   *
   * @throws Error('Not connected') when no socket is available.
   */
  async sendMessage(to: string, text: string): Promise<void> {
    if (!this.sock) {
      throw new Error('Not connected');
    }

    await this.sock.sendMessage(to, { text });
  }

  /**
   * Close the socket and cancel any pending reconnect so the client stays
   * down until connect() is called again.
   */
  async disconnect(): Promise<void> {
    this.stopped = true;

    if (this.reconnectTimer) {
      clearTimeout(this.reconnectTimer);
      this.reconnectTimer = null;
    }
    this.reconnecting = false;

    if (this.sock) {
      this.sock.end(undefined);
      this.sock = null;
    }
  }
}


================================================
FILE: nanobot/bridge/tsconfig.json
================================================
{
  "compilerOptions": {
    "target": "ES2022",
    "module": "ESNext",
    "moduleResolution": "node",
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
    "outDir": "./dist",
    "rootDir": "./src",
    "declaration": true,
    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "dist"]
}


================================================
FILE: nanobot/core_agent_lines.sh
================================================
#!/bin/bash
# Count core agent lines (excluding channels/, cli/, providers/ adapters)
#
# Prints a per-directory line count for the core packages, the line count of
# the package root files, and a grand total over every .py file outside the
# excluded adapter directories.

# Run relative to the script's own directory so the nanobot/ paths resolve.
cd "$(dirname "$0")" || exit 1

echo "nanobot core agent line count"
echo "================================"
echo ""

# -maxdepth 1 keeps each count limited to files directly inside the directory,
# so agent/ does not also include agent/tools/.
for dir in agent agent/tools bus config cron heartbeat session utils; do
  count=$(find "nanobot/$dir" -maxdepth 1 -name "*.py" -exec cat {} + | wc -l)
  printf "  %-16s %5s lines\n" "$dir/" "$count"
done

root=$(cat nanobot/__init__.py nanobot/__main__.py | wc -l)
printf "  %-16s %5s lines\n" "(root)" "$root"

echo ""
# Use -exec ... + (as in the loop above) rather than piping to xargs, which
# would split paths containing whitespace into separate arguments.
total=$(find nanobot -name "*.py" ! -path "*/channels/*" ! -path "*/cli/*" ! -path "*/providers/*" -exec cat {} + | wc -l)
echo "  Core total:     $total lines"
echo ""
echo "  (excludes: channels/, cli/, providers/)"


================================================
FILE: nanobot/nanobot/__init__.py
================================================
"""
nanobot - A lightweight AI agent framework
"""

__version__ = "0.1.0"
__logo__ = "🐈"


================================================
FILE: nanobot/nanobot/__main__.py
================================================
"""
Entry point for running nanobot as a module: python -m nanobot
"""

from nanobot.cli.commands import app

if __name__ == "__main__":
    app()


================================================
FILE: nanobot/nanobot/agent/__init__.py
================================================
"""Agent core module."""

from nanobot.agent.context import ContextBuilder
from nanobot.agent.loop import AgentLoop
from nanobot.agent.memory import MemoryStore
from nanobot.agent.skills import SkillsLoader

__all__ = ["AgentLoop", "ContextBuilder", "MemoryStore", "SkillsLoader"]


================================================
FILE: nanobot/nanobot/agent/context.py
================================================
"""Context builder for assembling agent prompts."""

import base64
import mimetypes
import platform
from pathlib import Path
from typing import Any

from nanobot.agent.memory import MemoryStore
from nanobot.agent.skills import SkillsLoader


class ContextBuilder:
    """
    Builds the context (system prompt + messages) for the agent.

    Assembles bootstrap files, memory, skills, and conversation history
    into a coherent prompt for the LLM.
    """

    BOOTSTRAP_FILES = ["AGENTS.md", "SOUL.md", "USER.md", "TOOLS.md", "IDENTITY.md"]

    def __init__(self, workspace: Path):
        self.workspace = workspace
        self.memory = MemoryStore(workspace)
        self.skills = SkillsLoader(workspace)

    def build_system_prompt(self, skill_names: list[str] | None = None) -> str:
        """
        Build the system prompt from bootstrap files, memory, and skills.

        Args:
            skill_names: Optional list of skills to include.

        Returns:
            Complete system prompt.
        """
        parts = []

        # Core identity
        parts.append(self._get_identity())

        # Bootstrap files
        bootstrap = self._load_bootstrap_files()
        if bootstrap:
            parts.append(bootstrap)

        # Memory context
        memory = self.memory.get_memory_context()
        if memory:
            parts.append(f"# Memory\n\n{memory}")

        # Skills - progressive loading
        # 1. Always-loaded skills: include full content
        always_skills = self.skills.get_always_skills()
        if always_skills:
            always_content = self.skills.load_skills_for_context(always_skills)
            if always_content:
                parts.append(f"# Active Skills\n\n{always_content}")

        # 2. Available skills: only show summary (agent uses read_file to load)
        skills_summary = self.skills.build_skills_summary()
        if skills_summary:
            parts.append(f"""# Skills

The following skills extend your capabilities. To use a skill, read its SKILL.md file using the read_file tool.
Skills with available="false" need dependencies installed first - you can try installing them with apt/brew.

{skills_summary}""")

        return "\n\n---\n\n".join(parts)

    def _get_identity(self) -> str:
        """Get the core identity section."""
        from datetime import datetime

        now = datetime.now().strftime("%Y-%m-%d %H:%M (%A)")
        workspace_path = str(self.workspace.expanduser().resolve())
        system = platform.system()
        runtime = f"{'macOS' if system == 'Darwin' else system} {platform.machine()}, Python {platform.python_version()}"

        return f"""# nanobot 🐈

You are nanobot, a helpful AI assistant. You have access to tools that allow you to:
- Read, write, and edit files
- Execute shell commands
- Search the web and fetch web pages
- Send messages to users on chat channels
- Spawn subagents for complex background tasks

## Current Time
{now}

## Runtime
{runtime}

## Workspace
Your workspace is at: {workspace_path}
- Memory files: {workspace_path}/memory/MEMORY.md
- Daily notes: {workspace_path}/memory/YYYY-MM-DD.md
- Custom skills: {workspace_path}/skills/{{skill-name}}/SKILL.md

IMPORTANT: When responding to direct questions or conversations, reply directly with your text response.
Only use the 'message' tool when you need to send a message to a specific chat channel (like WhatsApp).
For normal conversation, just respond with text - do not call the message tool.

Always be helpful, accurate, and concise. When using tools, explain what you're doing.
When remembering something, write to {workspace_path}/memory/MEMORY.md"""

    def _load_bootstrap_files(self) -> str:
        """Load all bootstrap files from workspace."""
        parts = []

        for filename in self.BOOTSTRAP_FILES:
            file_path = self.workspace / filename
            if file_path.exists():
                content = file_path.read_text(encoding="utf-8")
                parts.append(f"## {filename}\n\n{content}")

        return "\n\n".join(parts) if parts else ""

    def build_messages(
        self,
        history: list[dict[str, Any]],
        current_message: str,
        skill_names: list[str] | None = None,
        media: list[str] | None = None,
        channel: str | None = None,
        chat_id: str | None = None,
    ) -> list[dict[str, Any]]:
        """
        Build the complete message list for an LLM call.

        Args:
            history: Previous conversation messages.
            current_message: The new user message.
            skill_names: Optional skills to include.
            media: Optional list of local file paths for images/media.
            channel: Current channel (telegram, feishu, etc.).
            chat_id: Current chat/user ID.

        Returns:
            List of messages including system prompt.
        """
        messages = []

        # System prompt
        system_prompt = self.build_system_prompt(skill_names)
        if channel and chat_id:
            system_prompt += f"\n\n## Current Session\nChannel: {channel}\nChat ID: {chat_id}"
        messages.append({"role": "system", "content": system_prompt})

        # History
        messages.extend(history)

        # Current message (with optional image attachments)
        user_content = self._build_user_content(current_message, media)
        messages.append({"role": "user", "content": user_content})

        return messages

    def _build_user_content(self, text: str, media: list[str] | None) -> str | list[dict[str, Any]]:
        """Build user message content with optional base64-encoded images."""
        if not media:
            return text

        images = []
        for path in media:
            p = Path(path)
            mime, _ = mimetypes.guess_type(path)
            if not p.is_file() or not mime or not mime.startswith("image/"):
                continue
            b64 = base64.b64encode(p.read_bytes()).decode()
            images.append({"type": "image_url", "image_url": {"url": f"data:{mime};base64,{b64}"}})

        if not images:
            return text
        return images + [{"type": "text", "text": text}]

    def add_tool_result(
        self, messages: list[dict[str, Any]], tool_call_id: str, tool_name: str, result: str
    ) -> list[dict[str, Any]]:
        """
        Add a tool result to the message list.

        Args:
            messages: Current message list.
            tool_call_id: ID of the tool call.
            tool_name: Name of the tool.
            result: Tool execution result.

        Returns:
            Updated message list.
        """
        messages.append(
            {"role": "tool", "tool_call_id": tool_call_id, "name": tool_name, "content": result}
        )
        return messages

    def add_assistant_message(
        self,
        messages: list[dict[str, Any]],
        content: str | None,
        tool_calls: list[dict[str, Any]] | None = None,
        reasoning_content: str | None = None,
    ) -> list[dict[str, Any]]:
        """
        Add an assistant message to the message list.

        Args:
            messages: Current message list.
            content: Message content.
            tool_calls: Optional tool calls.
            reasoning_content: Thinking output (Kimi, DeepSeek-R1, etc.).

        Returns:
            Updated message list.
        """
        msg: dict[str, Any] = {"role": "assistant", "content": content or ""}

        if tool_calls:
            msg["tool_calls"] = tool_calls

        # Thinking models reject history without this
        if reasoning_content:
            msg["reasoning_content"] = reasoning_content

        messages.append(msg)
        return messages


================================================
FILE: nanobot/nanobot/agent/loop.py
================================================
"""Agent loop: the core processing engine."""

from __future__ import annotations

import asyncio
import json
import os
from pathlib import Path
from typing import TYPE_CHECKING

from loguru import logger

from nanobot.agent.context import ContextBuilder
from nanobot.agent.subagent import SubagentManager
from nanobot.agent.tools.cron import CronTool
from nanobot.agent.tools.filesystem import EditFileTool, ListDirTool, ReadFileTool, WriteFileTool
from nanobot.agent.tools.message import MessageTool
from nanobot.agent.tools.registry import ToolRegistry
from nanobot.agent.tools.shell import ExecTool
from nanobot.agent.tools.spawn import SpawnTool
from nanobot.agent.tools.web import WebFetchTool, WebSearchTool
from nanobot.bus.events import InboundMessage, OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.providers.base import LLMProvider
from nanobot.session.manager import SessionManager

if TYPE_CHECKING:
    from nanobot.config.schema import ExecToolConfig
    from nanobot.cron.service import CronService


class AgentLoop:
    """
    The agent loop is the core processing engine.

    It:
    1. Receives messages from the bus
    2. Builds context with history, memory, skills
    3. Calls the LLM
    4. Executes tool calls
    5. Sends responses back
    """

    def __init__(
        self,
        bus: MessageBus,
        provider: LLMProvider,
        workspace: Path,
        model: str | None = None,
        max_iterations: int = 20,
        brave_api_key: str | None = None,
        exec_config: ExecToolConfig | None = None,
        cron_service: CronService | None = None,
        restrict_to_workspace: bool = False,
        session_manager: SessionManager | None = None,
    ):
        """
        Wire up the loop's collaborators and register the default tools.

        Args:
            bus: Message bus to consume inbound and publish outbound messages.
            provider: LLM provider used for chat completions.
            workspace: Workspace directory for context, sessions and tools.
            model: Model name; defaults to the provider's default model.
            max_iterations: Upper bound on LLM calls per processed message.
            brave_api_key: API key passed to the web search tool.
            exec_config: Shell tool configuration; a default is created if None.
            cron_service: When given, the cron tool is registered.
            restrict_to_workspace: Confine file and shell tools to the workspace.
            session_manager: Session store; one is created if None.
        """
        # Imported here because the module-level import is type-checking only.
        from nanobot.config.schema import ExecToolConfig

        self.bus = bus
        self.provider = provider
        self.workspace = workspace
        self.model = model or provider.get_default_model()
        self.max_iterations = max_iterations
        self.brave_api_key = brave_api_key
        self.exec_config = exec_config or ExecToolConfig()
        self.cron_service = cron_service
        self.restrict_to_workspace = restrict_to_workspace

        self.context = ContextBuilder(workspace)
        self.sessions = session_manager or SessionManager(workspace)
        self.tools = ToolRegistry()
        self.subagents = SubagentManager(
            provider=provider,
            workspace=workspace,
            bus=bus,
            model=self.model,
            brave_api_key=brave_api_key,
            exec_config=self.exec_config,
            restrict_to_workspace=restrict_to_workspace,
        )

        self._running = False
        self._register_default_tools()

    def _register_default_tools(self) -> None:
        """Register the default set of tools."""
        # File tools (restrict to workspace if configured)
        allowed_dir = self.workspace if self.restrict_to_workspace else None
        self.tools.register(ReadFileTool(allowed_dir=allowed_dir))
        self.tools.register(WriteFileTool(allowed_dir=allowed_dir))
        self.tools.register(EditFileTool(allowed_dir=allowed_dir))
        self.tools.register(ListDirTool(allowed_dir=allowed_dir))

        # Shell tool
        self.tools.register(
            ExecTool(
                working_dir=str(self.workspace),
                timeout=self.exec_config.timeout,
                restrict_to_workspace=self.restrict_to_workspace,
            )
        )

        # Web tools
        self.tools.register(WebSearchTool(api_key=self.brave_api_key))
        self.tools.register(WebFetchTool())

        # Message tool
        message_tool = MessageTool(send_callback=self.bus.publish_outbound)
        self.tools.register(message_tool)

        # Spawn tool (for subagents)
        spawn_tool = SpawnTool(manager=self.subagents)
        self.tools.register(spawn_tool)

        # Cron tool (for scheduling)
        if self.cron_service:
            self.tools.register(CronTool(self.cron_service))

        # DeepCode tools (conditionally loaded when DEEPCODE_API_URL is set)
        deepcode_url = os.environ.get("DEEPCODE_API_URL")
        if deepcode_url:
            from nanobot.agent.tools.deepcode import create_all_tools

            for tool in create_all_tools(api_url=deepcode_url):
                self.tools.register(tool)
            logger.info(f"DeepCode tools registered (API: {deepcode_url})")

    async def run(self) -> None:
        """Run the agent loop, processing messages from the bus."""
        self._running = True
        logger.info("Agent loop started")

        while self._running:
            try:
                # The 1s timeout lets the loop re-check _running after stop().
                msg = await asyncio.wait_for(self.bus.consume_inbound(), timeout=1.0)

                # Process it
                try:
                    response = await self._process_message(msg)
                    if response:
                        await self.bus.publish_outbound(response)
                except Exception as e:
                    logger.error(f"Error processing message: {e}")
                    # Send error response
                    await self.bus.publish_outbound(
                        OutboundMessage(
                            channel=msg.channel,
                            chat_id=msg.chat_id,
                            content=f"Sorry, I encountered an error: {str(e)}",
                        )
                    )
            except asyncio.TimeoutError:
                continue

    def stop(self) -> None:
        """Stop the agent loop."""
        self._running = False
        logger.info("Agent loop stopping")

    def _set_tool_context(self, channel: str, chat_id: str) -> None:
        """Point the context-aware tools (message, spawn, cron) at a chat."""
        for name, tool_type in (
            ("message", MessageTool),
            ("spawn", SpawnTool),
            ("cron", CronTool),
        ):
            tool = self.tools.get(name)
            # The isinstance check skips tools that are absent or were replaced.
            if isinstance(tool, tool_type):
                tool.set_context(channel, chat_id)

    async def _run_agent_loop(self, messages: list[dict]) -> str | None:
        """
        Call the LLM repeatedly, executing requested tools between calls.

        ``messages`` is extended in place with the assistant and tool
        messages produced along the way.

        Returns:
            The content of the first response without tool calls, or None if
            that content is None or max_iterations is reached first.
        """
        for _ in range(self.max_iterations):
            response = await self.provider.chat(
                messages=messages, tools=self.tools.get_definitions(), model=self.model
            )

            if not response.has_tool_calls:
                # No tool calls, we're done
                return response.content

            # Add assistant message with tool calls
            tool_call_dicts = [
                {
                    "id": tc.id,
                    "type": "function",
                    "function": {
                        "name": tc.name,
                        "arguments": json.dumps(tc.arguments),  # Must be JSON string
                    },
                }
                for tc in response.tool_calls
            ]
            messages = self.context.add_assistant_message(
                messages,
                response.content,
                tool_call_dicts,
                reasoning_content=response.reasoning_content,
            )

            # Execute tools
            for tool_call in response.tool_calls:
                args_str = json.dumps(tool_call.arguments, ensure_ascii=False)
                logger.info(f"Tool call: {tool_call.name}({args_str[:200]})")
                result = await self.tools.execute(tool_call.name, tool_call.arguments)
                messages = self.context.add_tool_result(
                    messages, tool_call.id, tool_call.name, result
                )

        return None

    async def _process_message(
        self, msg: InboundMessage, session_key: str | None = None
    ) -> OutboundMessage | None:
        """
        Process a single inbound message.

        Args:
            msg: The inbound message to process.
            session_key: Session to load and save history under. When omitted,
                the message's own session key is used.

        Returns:
            The response message, or None if no response needed.
        """
        # Handle system messages (subagent announces)
        # The chat_id contains the original "channel:chat_id" to route back to
        if msg.channel == "system":
            return await self._process_system_message(msg)

        preview = msg.content[:80] + "..." if len(msg.content) > 80 else msg.content
        logger.info(f"Processing message from {msg.channel}:{msg.sender_id}: {preview}")

        # Get or create session
        session = self.sessions.get_or_create(session_key or msg.session_key)

        # Update tool contexts
        self._set_tool_context(msg.channel, msg.chat_id)

        # Build initial messages (use get_history for LLM-formatted messages)
        messages = self.context.build_messages(
            history=session.get_history(),
            current_message=msg.content,
            media=msg.media if msg.media else None,
            channel=msg.channel,
            chat_id=msg.chat_id,
        )

        final_content = await self._run_agent_loop(messages)
        if final_content is None:
            final_content = "I've completed processing but have no response to give."

        # Log response preview
        preview = final_content[:120] + "..." if len(final_content) > 120 else final_content
        logger.info(f"Response to {msg.channel}:{msg.sender_id}: {preview}")

        # Save to session
        session.add_message("user", msg.content)
        session.add_message("assistant", final_content)
        self.sessions.save(session)

        return OutboundMessage(
            channel=msg.channel,
            chat_id=msg.chat_id,
            content=final_content,
            # Pass through for channel-specific needs (e.g. Slack thread_ts)
            metadata=msg.metadata or {},
        )

    async def _process_system_message(self, msg: InboundMessage) -> OutboundMessage | None:
        """
        Process a system message (e.g., subagent announce).

        The chat_id field contains "original_channel:original_chat_id" to route
        the response back to the correct destination.
        """
        logger.info(f"Processing system message from {msg.sender_id}")

        # Parse origin from chat_id (format: "channel:chat_id")
        if ":" in msg.chat_id:
            origin_channel, origin_chat_id = msg.chat_id.split(":", 1)
        else:
            # Fallback
            origin_channel = "cli"
            origin_chat_id = msg.chat_id

        # Use the origin session for context
        session_key = f"{origin_channel}:{origin_chat_id}"
        session = self.sessions.get_or_create(session_key)

        # Update tool contexts
        self._set_tool_context(origin_channel, origin_chat_id)

        # Build messages with the announce content
        messages = self.context.build_messages(
            history=session.get_history(),
            current_message=msg.content,
            channel=origin_channel,
            chat_id=origin_chat_id,
        )

        final_content = await self._run_agent_loop(messages)
        if final_content is None:
            final_content = "Background task completed."

        # Save to session (mark as system message in history)
        session.add_message("user", f"[System: {msg.sender_id}] {msg.content}")
        session.add_message("assistant", final_content)
        self.sessions.save(session)

        return OutboundMessage(
            channel=origin_channel, chat_id=origin_chat_id, content=final_content
        )

    async def process_direct(
        self,
        content: str,
        session_key: str = "cli:direct",
        channel: str = "cli",
        chat_id: str = "direct",
    ) -> str:
        """
        Process a message directly (for CLI or cron usage).

        Args:
            content: The message content.
            session_key: Session identifier the conversation is stored under.
            channel: Source channel (for context).
            chat_id: Source chat ID (for context).

        Returns:
            The agent's response.
        """
        msg = InboundMessage(channel=channel, sender_id="user", chat_id=chat_id, content=content)

        # Forward session_key explicitly; it was previously accepted but ignored,
        # so the session was always derived from channel and chat_id.
        response = await self._process_message(msg, session_key=session_key)
        return response.content if response else ""


================================================
FILE: nanobot/nanobot/agent/memory.py
================================================
"""Memory system for persistent agent memory."""

from datetime import datetime
from pathlib import Path

from nanobot.utils.helpers import ensure_dir, today_date


class MemoryStore:
    """
    File-backed memory for the agent.

    Everything lives under ``<workspace>/memory``: one markdown file per day
    (``YYYY-MM-DD.md``) for daily notes, plus a single ``MEMORY.md`` holding
    long-term memory.
    """

    def __init__(self, workspace: Path):
        self.workspace = workspace
        self.memory_dir = ensure_dir(workspace / "memory")
        self.memory_file = self.memory_dir / "MEMORY.md"

    def get_today_file(self) -> Path:
        """Return the path of the daily note file for the current date."""
        filename = f"{today_date()}.md"
        return self.memory_dir / filename

    def read_today(self) -> str:
        """Return today's notes, or an empty string if none exist yet."""
        path = self.get_today_file()
        return path.read_text(encoding="utf-8") if path.exists() else ""

    def append_today(self, content: str) -> None:
        """
        Add ``content`` to the end of today's notes.

        An existing file is re-written with the new content after a newline;
        a new file starts with a ``# <date>`` heading.
        """
        path = self.get_today_file()

        if path.exists():
            body = path.read_text(encoding="utf-8") + "\n" + content
        else:
            # First note of the day: start the file with a date heading.
            body = f"# {today_date()}\n\n" + content

        path.write_text(body, encoding="utf-8")

    def read_long_term(self) -> str:
        """Return the contents of MEMORY.md, or an empty string if absent."""
        path = self.memory_file
        return path.read_text(encoding="utf-8") if path.exists() else ""

    def write_long_term(self, content: str) -> None:
        """Replace the contents of MEMORY.md with ``content``."""
        self.memory_file.write_text(content, encoding="utf-8")

    def get_recent_memories(self, days: int = 7) -> str:
        """
        Collect the daily notes of the last ``days`` days.

        Args:
            days: How many days to look back, counting today as the first.

        Returns:
            The existing daily files, newest first, joined by a markdown
            horizontal rule. Days without a file are skipped.
        """
        from datetime import timedelta

        newest = datetime.now().date()
        collected = []

        for offset in range(days):
            stamp = (newest - timedelta(days=offset)).strftime("%Y-%m-%d")
            candidate = self.memory_dir / f"{stamp}.md"
            if not candidate.exists():
                continue
            collected.append(candidate.read_text(encoding="utf-8"))

        return "\n\n---\n\n".join(collected)

    def list_memory_files(self) -> list[Path]:
        """Return the daily note files, newest first (by file name)."""
        if not self.memory_dir.exists():
            return []

        # The glob only picks up files shaped like YYYY-MM-DD.md, so
        # MEMORY.md is never part of the listing.
        return sorted(self.memory_dir.glob("????-??-??.md"), reverse=True)

    def get_memory_context(self) -> str:
        """
        Build the memory section handed to the agent.

        Returns:
            Long-term memory followed by today's notes, each under its own
            heading; sections with no content are left out. Empty string
            when there is nothing to report.
        """
        sections = (
            ("## Long-term Memory\n", self.read_long_term()),
            ("## Today's Notes\n", self.read_today()),
        )
        return "\n\n".join(heading + text for heading, text in sections if text)


================================================
FILE: nanobot/nanobot/agent/skills.py
================================================
"""Skills loader for agent capabilities."""

import json
import os
import re
import shutil
from pathlib import Path

# Default builtin skills directory, resolved relative to this file:
# <directory containing this module>/../skills. Used by SkillsLoader when no
# explicit builtin_skills_dir is passed.
BUILTIN_SKILLS_DIR = Path(__file__).parent.parent / "skills"


class SkillsLoader:
    """
    Loader for agent skills.

    Skills are markdown files (SKILL.md) that teach the agent how to use
    specific tools or perform certain tasks.
    """

    def __init__(self, workspace: Path, builtin_skills_dir: Path | None = None):
        self.workspace = workspace
        self.workspace_skills = workspace / "skills"
        self.builtin_skills = builtin_skills_dir or BUILTIN_SKILLS_DIR

    def list_skills(self, filter_unavailable: bool = True) -> list[dict[str, str]]:
        """
        List all available skills.

        Args:
            filter_unavailable: If True, filter out skills with unmet requirements.

        Returns:
            List of skill info dicts with 'name', 'path', 'source'.
        """
        skills = []

        # Workspace skills (highest priority)
        if self.workspace_skills.exists():
            for skill_dir in self.workspace_skills.iterdir():
                if skill_dir.is_dir():
                    skill_file = skill_dir / "SKILL.md"
                    if skill_file.exists():
                        skills.append(
                            {"name": skill_dir.name, "path": str(skill_file), "source": "workspace"}
                        )

        # Built-in skills
        if self.builtin_skills and self.builtin_skills.exists():
            for skill_dir in self.builtin_skills.iterdir():
                if skill_dir.is_dir():
                    skill_file = skill_dir / "SKILL.md"
                    if skill_file.exists() and not any(s["name"] == skill_dir.name for s in skills):
                        skills.append(
                            {"name": skill_dir.name, "path": str(skill_file), "source": "builtin"}
                        )

        # Filter by requirements
        if filter_unavailable:
            return [s for s in skills if self._check_requirements(self._get_skill_meta(s["name"]))]
        return skills

    def load_skill(self, name: str) -> str | None:
        """
        Load a skill by name.

        Args:
            name: Skill name (directory name).

        Returns:
            Skill content or None if not found.
        """
        # Check workspace first
        workspace_skill = self.workspace_skills / name / "SKILL.md"
        if workspace_skill.exists():
            return workspace_skill.read_text(encoding="utf-8")

        # Check built-in
        if self.builtin_skills:
            builtin_skill = self.builtin_skills / name / "SKILL.md"
            if builtin_skill.exists():
                return builtin_skill.read_text(encoding="utf-8")

        return None

    def load_skills_for_context(self, skill_names: list[str]) -> str:
        """
        Load specific skills for inclusion in agent context.

        Args:
            skill_names: List of skill names to load.

        Returns:
            Formatted skills content.
        """
        parts = []
        for name in skill_names:
            content = self.load_skill(name)
            if content:
                content = self._strip_frontmatter(content)
                parts.append(f"### Skill: {name}\n\n{content}")

        return "\n\n---\n\n".join(parts) if parts else ""

    def build_skills_summary(self) -> str:
        """
        Build a summary of all skills (name, description, path, availability).

        This is used for progressive loading - the agent can read the full
        skill content using read_file when needed.

        Returns:
            XML-formatted skills summary.
        """
        all_skills = self.list_skills(filter_unavailable=False)
        if not all_skills:
            return ""

        def escape_xml(s: str) -> str:
            return s.replace("&", "&amp;").replace("<", "&lt;").replace(">", "&gt;")

        lines = ["<skills>"]
        for s in all_skills:
            name = escape_xml(s["name"])
            path = s["path"]
            desc = escape_xml(self._get_skill_description(s["name"]))
            skill_meta = self._get_skill_meta(s["name"])
            available = self._check_requirements(skill_meta)

            lines.append(f'  <skill available="{str(available).lower()}">')
            lines.append(f"    <name>{name}</name>")
            lines.append(f"    <description>{desc}</description>")
            lines.append(f"    <location>{path}</location>")

            # Show missing requirements for unavailable skills
            if not available:
                missing = self._get_missing_requirements(skill_meta)
                if missing:
                    lines.append(f"    <requires>{escape_xml(missing)}</requires>")

            lines.append("  </skill>")
        lines.append("</skills>")

        return "\n".join(lines)

    def _get_missing_requirements(self, skill_meta: dict) -> str:
        """Get a description of missing requirements."""
        missing = []
        requires = skill_meta.get("requires", {})
        for b in requires.get("bins", []):
            if not shutil.which(b):
                missing.append(f"CLI: {b}")
        for env in requires.get("env", []):
            if not os.environ.get(env):
                missing.append(f"ENV: {env}")
        return ", ".join(missing)

    def _get_skill_description(self, name: str) -> str:
        """Get the description of a skill from its frontmatter."""
        meta = self.get_skill_metadata(name)
        if meta and meta.get("description"):
            return meta["description"]
        return name  # Fallback to skill name

    def _strip_frontmatter(self, content: str) -> str:
        """Remove YAML frontmatter from markdown content."""
        if content.startswith("---"):
            match = re.match(r"^---\n.*?\n---\n", content, re.DOTALL)
            if match:
                return content[match.end() :].strip()
        return content

    def _parse_nanobot_metadata(self, raw: str) -> dict:
        """Parse nanobot metadata JSON from frontmatter."""
        try:
            data = json.loads(raw)
            return data.get("nanobot", {}) if isinstance(data, dict) else {}
        except (json.JSONDecodeError, TypeError):
            return {}

    def _check_requirements(self, skill_meta: dict) -> bool:
        """Check if skill requirements are met (bins, env vars)."""
        requires = skill_meta.get("requires", {})
        for b in requires.get("bins", []):
            if not shutil.which(b):
                return False
        for env in requires.get("env", []):
            if not os.environ.get(env):
                return False
        return True

    def _get_skill_meta(self, name: str) -> dict:
        """Get nanobot metadata for a skill (cached in frontmatter)."""
        meta = self.get_skill_metadata(name) or {}
        return self._parse_nanobot_metadata(meta.get("metadata", ""))

    def get_always_skills(self) -> list[str]:
        """Get skills marked as always=true that meet requirements."""
        result = []
        for s in self.list_skills(filter_unavailable=True):
            meta = self.get_skill_metadata(s["name"]) or {}
            skill_meta = self._parse_nanobot_metadata(meta.get("metadata", ""))
            if skill_meta.get("always") or meta.get("always"):
                result.append(s["name"])
        return result

    def get_skill_metadata(self, name: str) -> dict | None:
        """
        Get metadata from a skill's frontmatter.

        Args:
            name: Skill name.

        Returns:
            Metadata dict or None.
        """
        content = self.load_skill(name)
        if not content:
            return None

        if content.startswith("---"):
            match = re.match(r"^---\n(.*?)\n---", content, re.DOTALL)
            if match:
                # Simple YAML parsing
                metadata = {}
                for line in match.group(1).split("\n"):
                    if ":" in line:
                        key, value = line.split(":", 1)
                        metadata[key.strip()] = value.strip().strip("\"'")
                return metadata

        return None


================================================
FILE: nanobot/nanobot/agent/subagent.py
================================================
"""Subagent manager for background task execution."""

from __future__ import annotations

import asyncio
import json
import uuid
from pathlib import Path
from typing import TYPE_CHECKING, Any

from loguru import logger

from nanobot.agent.tools.filesystem import ListDirTool, ReadFileTool, WriteFileTool
from nanobot.agent.tools.registry import ToolRegistry
from nanobot.agent.tools.shell import ExecTool
from nanobot.agent.tools.web import WebFetchTool, WebSearchTool
from nanobot.bus.events import InboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.providers.base import LLMProvider

if TYPE_CHECKING:
    from nanobot.config.schema import ExecToolConfig


class SubagentManager:
    """
    Launches and tracks subagents that work in the background.

    A subagent is a small agent loop run as an asyncio task for one specific
    task. It uses the manager's LLM provider, starts from a fresh message
    list with its own system prompt, and reports its outcome by publishing
    an inbound message on the bus.
    """

    def __init__(
        self,
        provider: LLMProvider,
        workspace: Path,
        bus: MessageBus,
        model: str | None = None,
        brave_api_key: str | None = None,
        exec_config: ExecToolConfig | None = None,
        restrict_to_workspace: bool = False,
    ):
        from nanobot.config.schema import ExecToolConfig

        self.provider = provider
        self.workspace = workspace
        self.bus = bus
        # Fall back to the provider's default model / a default exec config
        # when the caller does not supply one.
        self.model = model or provider.get_default_model()
        self.brave_api_key = brave_api_key
        self.exec_config = exec_config or ExecToolConfig()
        self.restrict_to_workspace = restrict_to_workspace
        # task id -> asyncio task, for subagents that have not finished yet
        self._running_tasks: dict[str, asyncio.Task[None]] = {}

    async def spawn(
        self,
        task: str,
        label: str | None = None,
        origin_channel: str = "cli",
        origin_chat_id: str = "direct",
    ) -> str:
        """
        Start a subagent for ``task`` without waiting for it to finish.

        Args:
            task: The task description for the subagent.
            label: Optional human-readable label; when omitted, the first
                30 characters of the task are used (with "..." if truncated).
            origin_channel: The channel to announce results to.
            origin_chat_id: The chat ID to announce results to.

        Returns:
            Status message indicating the subagent was started.
        """
        task_id = str(uuid.uuid4())[:8]

        if label:
            display_label = label
        else:
            ellipsis = "..." if len(task) > 30 else ""
            display_label = task[:30] + ellipsis

        origin = {"channel": origin_channel, "chat_id": origin_chat_id}

        # Schedule the subagent and remember it until it finishes.
        bg_task = asyncio.create_task(self._run_subagent(task_id, task, display_label, origin))
        self._running_tasks[task_id] = bg_task

        def _forget(_finished: Any) -> None:
            # Drop the bookkeeping entry once the task is done.
            self._running_tasks.pop(task_id, None)

        bg_task.add_done_callback(_forget)

        logger.info(f"Spawned subagent [{task_id}]: {display_label}")
        return f"Subagent [{display_label}] started (id: {task_id}). I'll notify you when it completes."

    def _build_tools(self) -> ToolRegistry:
        """Create the subagent's tool registry (no message tool, no spawn tool)."""
        registry = ToolRegistry()
        allowed_dir = self.workspace if self.restrict_to_workspace else None
        registry.register(ReadFileTool(allowed_dir=allowed_dir))
        registry.register(WriteFileTool(allowed_dir=allowed_dir))
        registry.register(ListDirTool(allowed_dir=allowed_dir))
        registry.register(
            ExecTool(
                working_dir=str(self.workspace),
                timeout=self.exec_config.timeout,
                restrict_to_workspace=self.restrict_to_workspace,
            )
        )
        registry.register(WebSearchTool(api_key=self.brave_api_key))
        registry.register(WebFetchTool())
        return registry

    async def _run_subagent(
        self,
        task_id: str,
        task: str,
        label: str,
        origin: dict[str, str],
    ) -> None:
        """
        Drive the subagent's chat/tool loop and announce the outcome.

        The loop asks the provider for a response, executes any requested
        tool calls and feeds their results back, and stops at the first
        response without tool calls or after 15 rounds. Any exception is
        caught and announced as a failure.
        """
        logger.info(f"Subagent [{task_id}] starting task: {label}")

        try:
            tools = self._build_tools()

            # Fresh conversation: subagent-specific system prompt plus the task.
            messages: list[dict[str, Any]] = [
                {"role": "system", "content": self._build_subagent_prompt(task)},
                {"role": "user", "content": task},
            ]

            max_iterations = 15
            final_result: str | None = None

            for _ in range(max_iterations):
                response = await self.provider.chat(
                    messages=messages,
                    tools=tools.get_definitions(),
                    model=self.model,
                )

                if not response.has_tool_calls:
                    final_result = response.content
                    break

                # Record the assistant turn, including the tool calls it requested.
                requested_calls = [
                    {
                        "id": tc.id,
                        "type": "function",
                        "function": {
                            "name": tc.name,
                            "arguments": json.dumps(tc.arguments),
                        },
                    }
                    for tc in response.tool_calls
                ]
                messages.append(
                    {
                        "role": "assistant",
                        "content": response.content or "",
                        "tool_calls": requested_calls,
                    }
                )

                # Run each tool and append its result for the next round.
                for call in response.tool_calls:
                    args_str = json.dumps(call.arguments)
                    logger.debug(
                        f"Subagent [{task_id}] executing: {call.name} with arguments: {args_str}"
                    )
                    output = await tools.execute(call.name, call.arguments)
                    messages.append(
                        {
                            "role": "tool",
                            "tool_call_id": call.id,
                            "name": call.name,
                            "content": output,
                        }
                    )

            if final_result is None:
                # Either the round limit was hit or the final response had no content.
                final_result = "Task completed but no final response was generated."

            logger.info(f"Subagent [{task_id}] completed successfully")
            await self._announce_result(task_id, label, task, final_result, origin, "ok")

        except Exception as e:
            error_msg = f"Error: {str(e)}"
            logger.error(f"Subagent [{task_id}] failed: {e}")
            await self._announce_result(task_id, label, task, error_msg, origin, "error")

    async def _announce_result(
        self,
        task_id: str,
        label: str,
        task: str,
        result: str,
        origin: dict[str, str],
        status: str,
    ) -> None:
        """
        Publish the subagent's outcome on the bus as an inbound message.

        The message is sent on the "system" channel with sender "subagent";
        the originating channel and chat id are packed into ``chat_id`` as
        ``"<channel>:<chat_id>"``.
        """
        if status == "ok":
            status_text = "completed successfully"
        else:
            status_text = "failed"

        announce_content = f"""[Subagent '{label}' {status_text}]

Task: {task}

Result:
{result}

Summarize this naturally for the user. Keep it brief (1-2 sentences). Do not mention technical details like "subagent" or task IDs."""

        destination = f"{origin['channel']}:{origin['chat_id']}"

        # Inject as system message to trigger main agent
        await self.bus.publish_inbound(
            InboundMessage(
                channel="system",
                sender_id="subagent",
                chat_id=destination,
                content=announce_content,
            )
        )
        logger.debug(f"Subagent [{task_id}] announced result to {destination}")

    def _build_subagent_prompt(self, task: str) -> str:
        """Return the system prompt for a subagent working on ``task``."""
        prompt = f"""# Subagent

You are a subagent spawned by the main agent to complete a specific task.

## Your Task
{task}

## Rules
1. Stay focused - complete only the assigned task, nothing else
2. Your final response will be reported back to the main agent
3. Do not initiate conversations or take on side tasks
4. Be concise but informative in your findings

## What You Can Do
- Read and write files in the workspace
- Execute shell commands
- Search the web and fetch web pages
- Complete the task thoroughly

## What You Cannot Do
- Send messages directly to users (no message tool available)
- Spawn other subagents
- Access the main agent's conversation history

## Workspace
Your workspace is at: {self.workspace}

When you have completed the task, provide a clear summary of your findings or actions."""
        return prompt

    def get_running_count(self) -> int:
        """Return how many subagents are still tracked as running."""
        return len(self._running_tasks)


================================================
FILE: nanobot/nanobot/agent/tools/__init__.py
================================================
"""Agent tools module."""

from nanobot.agent.tools.base import Tool
from nanobot.agent.tools.registry import ToolRegistry

# Public names of the tools package (what `from nanobot.agent.tools import *` exports).
__all__ = ["Tool", "ToolRegistry"]


================================================
FILE: nanobot/nanobot/agent/tools/base.py
================================================
"""Base class for agent tools."""

from abc import ABC, abstractmethod
from typing import Any


class Tool(ABC):
    """
    Abstract base class for agent tools.

    Tools are capabilities that the agent can use to interact with
    the environment, such as reading files, executing commands, etc.

    Subclasses provide ``name``, ``description``, ``parameters`` (a JSON
    Schema object) and an async ``execute``; this base class adds parameter
    validation and conversion to the OpenAI function schema format.
    """

    # JSON Schema type name -> Python type(s) accepted for it.
    _TYPE_MAP = {
        "string": str,
        "integer": int,
        "number": (int, float),
        "boolean": bool,
        "array": list,
        "object": dict,
    }

    @property
    @abstractmethod
    def name(self) -> str:
        """Tool name used in function calls."""
        pass

    @property
    @abstractmethod
    def description(self) -> str:
        """Description of what the tool does."""
        pass

    @property
    @abstractmethod
    def parameters(self) -> dict[str, Any]:
        """JSON Schema for tool parameters."""
        pass

    @abstractmethod
    async def execute(self, **kwargs: Any) -> str:
        """
        Execute the tool with given parameters.

        Args:
            **kwargs: Tool-specific parameters.

        Returns:
            String result of the tool execution.
        """
        pass

    def validate_params(self, params: dict[str, Any]) -> list[str]:
        """
        Validate tool parameters against the tool's JSON schema.

        Args:
            params: Parameter values keyed by name.

        Returns:
            List of human-readable error messages (empty if valid).

        Raises:
            ValueError: If the tool's schema declares a top-level type other
                than "object".
        """
        schema = self.parameters or {}
        if schema.get("type", "object") != "object":
            raise ValueError(f"Schema must be object type, got {schema.get('type')!r}")
        return self._validate(params, {**schema, "type": "object"}, "")

    def _validate(self, val: Any, schema: dict[str, Any], path: str) -> list[str]:
        """
        Recursively check ``val`` against ``schema``.

        Supports type checks plus ``enum``, ``minimum``/``maximum``,
        ``minLength``/``maxLength``, ``required``/``properties`` for objects
        and ``items`` for arrays. ``path`` is the dotted/indexed location of
        ``val`` used in error messages ("" for the root).

        A type mismatch is reported on its own and stops validation of that
        value, since the remaining checks assume the right type.
        """
        t, label = schema.get("type"), path or "parameter"
        if t in self._TYPE_MAP:
            type_ok = isinstance(val, self._TYPE_MAP[t])
            # bool is a subclass of int in Python, but JSON Schema treats
            # booleans as distinct from integer/number - reject them here.
            if type_ok and t in ("integer", "number") and isinstance(val, bool):
                type_ok = False
            if not type_ok:
                return [f"{label} should be {t}"]

        errors = []
        if "enum" in schema and val not in schema["enum"]:
            errors.append(f"{label} must be one of {schema['enum']}")
        if t in ("integer", "number"):
            if "minimum" in schema and val < schema["minimum"]:
                errors.append(f"{label} must be >= {schema['minimum']}")
            if "maximum" in schema and val > schema["maximum"]:
                errors.append(f"{label} must be <= {schema['maximum']}")
        if t == "string":
            if "minLength" in schema and len(val) < schema["minLength"]:
                errors.append(f"{label} must be at least {schema['minLength']} chars")
            if "maxLength" in schema and len(val) > schema["maxLength"]:
                errors.append(f"{label} must be at most {schema['maxLength']} chars")
        if t == "object":
            props = schema.get("properties", {})
            for k in schema.get("required", []):
                if k not in val:
                    errors.append(f"missing required {path + '.' + k if path else k}")
            # Only keys declared in "properties" are validated; extra keys
            # are accepted as-is.
            for k, v in val.items():
                if k in props:
                    errors.extend(self._validate(v, props[k], path + "." + k if path else k))
        if t == "array" and "items" in schema:
            for i, item in enumerate(val):
                errors.extend(
                    self._validate(item, schema["items"], f"{path}[{i}]" if path else f"[{i}]")
                )
        return errors

    def to_schema(self) -> dict[str, Any]:
        """Convert tool to OpenAI function schema format."""
        return {
            "type": "function",
            "function": {
                "name": self.name,
                "description": self.description,
                "parameters": self.parameters,
            },
        }


================================================
FILE: nanobot/nanobot/agent/tools/cron.py
================================================
"""Cron tool for scheduling reminders and tasks."""

from typing import Any

from nanobot.agent.tools.base import Tool
from nanobot.cron.service import CronService
from nanobot.cron.types import CronSchedule


class CronTool(Tool):
    """Agent tool for creating, listing and removing scheduled jobs.

    Jobs are stored in the injected cron service; new jobs are delivered to
    the channel/chat set through :meth:`set_context`.
    """

    def __init__(self, cron_service: CronService):
        self._cron = cron_service
        # Delivery target for new jobs; empty until set_context() is called.
        self._channel = ""
        self._chat_id = ""

    def set_context(self, channel: str, chat_id: str) -> None:
        """Remember which channel/chat newly added jobs should deliver to."""
        self._channel, self._chat_id = channel, chat_id

    @property
    def name(self) -> str:
        return "cron"

    @property
    def description(self) -> str:
        return "Schedule reminders and recurring tasks. Actions: add, list, remove."

    @property
    def parameters(self) -> dict[str, Any]:
        properties = {
            "action": {
                "type": "string",
                "enum": ["add", "list", "remove"],
                "description": "Action to perform",
            },
            "message": {"type": "string", "description": "Reminder message (for add)"},
            "every_seconds": {
                "type": "integer",
                "description": "Interval in seconds (for recurring tasks)",
            },
            "cron_expr": {
                "type": "string",
                "description": "Cron expression like '0 9 * * *' (for scheduled tasks)",
            },
            "job_id": {"type": "string", "description": "Job ID (for remove)"},
        }
        return {"type": "object", "properties": properties, "required": ["action"]}

    async def execute(
        self,
        action: str,
        message: str = "",
        every_seconds: int | None = None,
        cron_expr: str | None = None,
        job_id: str | None = None,
        **kwargs: Any,
    ) -> str:
        """Dispatch to the handler for ``action`` and return its status text.

        Unknown actions yield an "Unknown action" message rather than raising.
        """
        if action == "add":
            return self._add_job(message, every_seconds, cron_expr)
        if action == "list":
            return self._list_jobs()
        if action == "remove":
            return self._remove_job(job_id)
        return f"Unknown action: {action}"

    def _add_job(self, message: str, every_seconds: int | None, cron_expr: str | None) -> str:
        """Create a job from an interval or a cron expression.

        ``every_seconds`` wins when both are supplied. Returns an error
        string when the message, the session context or the schedule is
        missing.
        """
        if not message:
            return "Error: message is required for add"
        if not (self._channel and self._chat_id):
            return "Error: no session context (channel/chat_id)"

        # Pick the schedule kind; the interval is converted to milliseconds.
        if every_seconds:
            schedule = CronSchedule(kind="every", every_ms=every_seconds * 1000)
        elif cron_expr:
            schedule = CronSchedule(kind="cron", expr=cron_expr)
        else:
            return "Error: either every_seconds or cron_expr is required"

        # The job name is the first 30 characters of the message.
        created = self._cron.add_job(
            name=message[:30],
            schedule=schedule,
            message=message,
            deliver=True,
            channel=self._channel,
            to=self._chat_id,
        )
        return f"Created job '{created.name}' (id: {created.id})"

    def _list_jobs(self) -> str:
        """Return one bullet line per scheduled job, or a notice if none."""
        jobs = self._cron.list_jobs()
        if not jobs:
            return "No scheduled jobs."

        rows = []
        for job in jobs:
            rows.append(f"- {job.name} (id: {job.id}, {job.schedule.kind})")
        return "Scheduled jobs:\n" + "\n".join(rows)

    def _remove_job(self, job_id: str | None) -> str:
        """Remove the job with ``job_id`` and report whether it existed."""
        if not job_id:
            return "Error: job_id is required for remove"

        removed = self._cron.remove_job(job_id)
        if not removed:
            return f"Job {job_id} not found"
        return f"Removed job {job_id}"


================================================
FILE: nanobot/nanobot/agent/tools/deepcode.py
================================================
"""
DeepCode integration tools for nanobot.

These tools allow nanobot to interact with the DeepCode backend API
for paper-to-code reproduction, chat-based code generation, and task management.

Communication: HTTP requests to DeepCode's FastAPI backend.
In Docker Compose: nanobot -> http://deepcode:8000/api/v1/...
"""

import os
from typing import Any

import httpx

from nanobot.agent.tools.base import Tool


def _get_deepcode_url() -> str:
    """Return the DeepCode API base URL.

    Reads the ``DEEPCODE_API_URL`` environment variable and falls back to
    ``http://deepcode:8000`` when it is not set.
    """
    fallback_url = "http://deepcode:8000"
    return os.environ.get("DEEPCODE_API_URL", fallback_url)


class DeepCodePaper2CodeTool(Tool):
    """Tool that hands a paper (URL or file path) to DeepCode for code reproduction.

    The paper is submitted with a POST to the backend's
    ``/api/v1/workflows/paper-to-code`` endpoint; the tool returns a text
    report containing the task ID, or an error message.
    """

    def __init__(self, api_url: str | None = None):
        # An explicit URL wins; otherwise fall back to the environment/default.
        self._api_url = api_url or _get_deepcode_url()

    @property
    def name(self) -> str:
        return "deepcode_paper2code"

    @property
    def description(self) -> str:
        text = (
            "Submit a research paper to DeepCode for automatic code reproduction. "
            "Accepts a paper URL (e.g. arxiv link) or a local file path. "
            "Returns a task ID for tracking progress. "
            "The code generation process runs in the background and may take 10-60 minutes. "
            "Use deepcode_status to check progress."
        )
        return text

    @property
    def parameters(self) -> dict[str, Any]:
        properties = {
            "input_source": {
                "type": "string",
                "description": "Paper URL (e.g. https://arxiv.org/abs/...) or local file path",
            },
            "input_type": {
                "type": "string",
                "enum": ["url", "file"],
                "description": "Type of input: 'url' for web links, 'file' for local files",
            },
            "enable_indexing": {
                "type": "boolean",
                "description": "Enable code reference indexing for enhanced quality (slower but better). Default: false",
            },
        }
        return {
            "type": "object",
            "properties": properties,
            "required": ["input_source", "input_type"],
        }

    async def execute(
        self,
        input_source: str,
        input_type: str = "url",
        enable_indexing: bool = False,
        **kwargs: Any,
    ) -> str:
        """Submit the paper and return a human-readable status report.

        Args:
            input_source: Paper URL or local file path.
            input_type: "url" or "file".
            enable_indexing: Whether to request code reference indexing.
            **kwargs: Ignored.

        Returns:
            A success report including the task ID, or an error message when
            the backend is unreachable, answers with an error status, or
            anything else goes wrong. Exceptions are not propagated.
        """
        try:
            endpoint = f"{self._api_url}/api/v1/workflows/paper-to-code"
            payload = {
                "input_source": input_source,
                "input_type": input_type,
                "enable_indexing": enable_indexing,
            }
            async with httpx.AsyncClient(timeout=30.0) as client:
                response = await client.post(endpoint, json=payload)
                response.raise_for_status()
                data = response.json()

                task_id = data.get("task_id", "unknown")
                status = data.get("status", "started")
                if enable_indexing:
                    indexing = "enabled"
                else:
                    indexing = "disabled (fast mode)"

                return (
                    f"Paper-to-code task submitted successfully!\n"
                    f"Task ID: {task_id}\n"
                    f"Status: {status}\n"
                    f"Input: {input_source}\n"
                    f"Indexing: {indexing}\n\n"
                    f"The code generation is running in the background. "
                    f"Use deepcode_status with task_id='{task_id}' to check progress."
                )
        except httpx.ConnectError:
            return "Error: Cannot connect to DeepCode backend. Is the DeepCode service running?"
        except httpx.HTTPStatusError as e:
            status_code = e.response.status_code
            body = e.response.text
            return f"Error: DeepCode API returned status {status_code}: {body}"
        except Exception as e:
            return f"Error submitting paper to DeepCode: {str(e)}"


class DeepCodeChat2CodeTool(Tool):
    """Tool that forwards free-text coding requirements to the DeepCode backend."""

    def __init__(self, api_url: str | None = None):
        # An explicit URL wins; otherwise defer to the module-level helper.
        self._api_url = api_url if api_url else _get_deepcode_url()

    @property
    def name(self) -> str:
        return "deepcode_chat2code"

    @property
    def description(self) -> str:
        sentences = (
            "Submit coding requirements to DeepCode for automatic code generation.",
            "Provide a text description of what you want to build (e.g. web app, algorithm, backend service).",
            "DeepCode will generate a complete implementation.",
            "Returns a task ID for tracking progress.",
        )
        return " ".join(sentences)

    @property
    def parameters(self) -> dict[str, Any]:
        properties = {
            "requirements": {
                "type": "string",
                "description": "Detailed description of coding requirements",
            },
            "enable_indexing": {
                "type": "boolean",
                "description": "Enable code reference indexing for enhanced quality. Default: false",
            },
        }
        return {
            "type": "object",
            "properties": properties,
            "required": ["requirements"],
        }

    async def execute(
        self,
        requirements: str,
        enable_indexing: bool = False,
        **kwargs: Any,
    ) -> str:
        """
        Post the requirements to the chat-planning workflow endpoint.

        Args:
            requirements: Text forwarded as ``requirements``; only the first
                200 characters are echoed back in the summary.
            enable_indexing: Forwarded as ``enable_indexing``.
            **kwargs: Accepted for call compatibility; not used.

        Returns:
            A multi-line confirmation including the task ID on success,
            otherwise a string starting with "Error".
        """
        try:
            payload = {
                "requirements": requirements,
                "enable_indexing": enable_indexing,
            }
            async with httpx.AsyncClient(timeout=30.0) as client:
                response = await client.post(
                    f"{self._api_url}/api/v1/workflows/chat-planning",
                    json=payload,
                )
                response.raise_for_status()
                data = response.json()

            task_id = data.get("task_id", "unknown")
            status = data.get("status", "started")
            # Echo a bounded preview so long requirements do not flood the reply.
            preview = requirements[:200]
            if len(requirements) > 200:
                preview += "..."
            return (
                "Chat-to-code task submitted successfully!\n"
                f"Task ID: {task_id}\n"
                f"Status: {status}\n"
                f"Requirements: {preview}\n\n"
                "The code generation is running in the background. "
                f"Use deepcode_status with task_id='{task_id}' to check progress."
            )
        except httpx.ConnectError:
            return "Error: Cannot connect to DeepCode backend. Is the DeepCode service running?"
        except httpx.HTTPStatusError as exc:
            failed = exc.response
            return f"Error: DeepCode API returned status {failed.status_code}: {failed.text}"
        except Exception as exc:
            return f"Error submitting requirements to DeepCode: {exc!s}"


class DeepCodeStatusTool(Tool):
    """Tool that reports the status and progress of a single DeepCode task."""

    def __init__(self, api_url: str | None = None):
        # An explicit URL wins; otherwise defer to the module-level helper.
        self._api_url = api_url if api_url else _get_deepcode_url()

    @property
    def name(self) -> str:
        return "deepcode_status"

    @property
    def description(self) -> str:
        sentences = (
            "Check the status and progress of a DeepCode code generation task.",
            "Provide the task_id returned by deepcode_paper2code or deepcode_chat2code.",
            "Returns current status, progress percentage, and result when complete.",
        )
        return " ".join(sentences)

    @property
    def parameters(self) -> dict[str, Any]:
        task_id_schema = {
            "type": "string",
            "description": "The task ID to check status for",
        }
        return {
            "type": "object",
            "properties": {"task_id": task_id_schema},
            "required": ["task_id"],
        }

    async def execute(self, task_id: str, **kwargs: Any) -> str:
        """
        Fetch the status document for ``task_id`` and render it as text.

        The report always lists task ID, status and progress. Depending on
        the status it also appends the result, the error, or the details of
        a pending user interaction.

        Returns:
            The rendered report, or a string starting with "Error" when the
            request fails (a 404 yields a dedicated "not found" message).
        """
        try:
            async with httpx.AsyncClient(timeout=15.0) as client:
                response = await client.get(f"{self._api_url}/api/v1/workflows/status/{task_id}")
                response.raise_for_status()
                data = response.json()

            status = data.get("status", "unknown")
            report = [
                f"Task ID: {task_id}",
                f"Status: {status}",
                f"Progress: {data.get('progress', 0)}%",
            ]

            message = data.get("message", "")
            if message:
                report.append(f"Message: {message}")

            result = data.get("result")
            error = data.get("error")
            if status == "completed" and result:
                report.append(f"\nResult:\n{result}")
            elif status == "error" and error:
                report.append(f"\nError: {error}")
            elif status == "waiting_for_input":
                interaction = data.get("pending_interaction")
                if interaction:
                    report.extend(
                        (
                            "\nWaiting for user input:",
                            f"  Type: {interaction.get('type', 'unknown')}",
                            f"  Title: {interaction.get('title', '')}",
                            f"  Description: {interaction.get('description', '')}",
                        )
                    )

            return "\n".join(report)

        except httpx.ConnectError:
            return "Error: Cannot connect to DeepCode backend. Is the DeepCode service running?"
        except httpx.HTTPStatusError as exc:
            failed = exc.response
            if failed.status_code == 404:
                return f"Error: Task '{task_id}' not found. It may have expired."
            return f"Error: DeepCode API returned status {failed.status_code}: {failed.text}"
        except Exception as exc:
            return f"Error checking task status: {exc!s}"


class DeepCodeListTasksTool(Tool):
    """List active and recent DeepCode tasks."""

    # Bracketed label shown for each recent task; statuses not listed here
    # are rendered as "?".
    _STATUS_LABELS = {
        "completed": "done",
        "error": "error",
        "running": "running",
        "cancelled": "cancelled",
    }

    def __init__(self, api_url: str | None = None):
        self._api_url = api_url or _get_deepcode_url()

    @property
    def name(self) -> str:
        return "deepcode_list_tasks"

    @property
    def description(self) -> str:
        return (
            "List all active and recent DeepCode code generation tasks. "
            "Shows task IDs, status, progress, and results summary."
        )

    @property
    def parameters(self) -> dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "limit": {
                    "type": "integer",
                    "description": "Maximum number of recent tasks to show. Default: 10",
                    "minimum": 1,
                    "maximum": 50,
                },
            },
        }

    async def execute(self, limit: int = 10, **kwargs: Any) -> str:
        """
        Fetch the active and recent task lists and render them as text.

        Args:
            limit: Forwarded as the ``limit`` query parameter of the
                recent-tasks request.
            **kwargs: Accepted for call compatibility; not used.

        Returns:
            A listing with an "Active Tasks" and/or "Recent Tasks" section,
            "No DeepCode tasks found." when both are empty, or a string
            starting with "Error" when a request fails.
        """
        try:
            async with httpx.AsyncClient(timeout=15.0) as client:
                # Fetch active tasks
                active_resp = await client.get(f"{self._api_url}/api/v1/workflows/active")
                active_resp.raise_for_status()
                active_data = active_resp.json()

                # Fetch recent tasks
                recent_resp = await client.get(
                    f"{self._api_url}/api/v1/workflows/recent",
                    params={"limit": limit},
                )
                recent_resp.raise_for_status()
                recent_data = recent_resp.json()

            lines = []

            # Active tasks
            active_tasks = active_data.get("tasks", [])
            if active_tasks:
                lines.append(f"=== Active Tasks ({len(active_tasks)}) ===")
                for task in active_tasks:
                    lines.append(
                        f"  [{task.get('status', '?')}] {task.get('task_id', '?')} "
                        f"- {task.get('progress', 0)}% - {task.get('message', '')}"
                    )
                lines.append("")

            # Recent tasks
            recent_tasks = recent_data.get("tasks", [])
            if recent_tasks:
                lines.append(f"=== Recent Tasks ({len(recent_tasks)}) ===")
                for task in recent_tasks:
                    status_icon = self._STATUS_LABELS.get(task.get("status", ""), "?")
                    lines.append(
                        f"  [{status_icon}] {task.get('task_id', '?')} "
                        f"- {task.get('status', '?')} - {task.get('message', '')}"
                    )

            if not lines:
                return "No DeepCode tasks found."

            return "\n".join(lines)

        except httpx.ConnectError:
            return "Error: Cannot connect to DeepCode backend. Is the DeepCode service running?"
        except httpx.HTTPStatusError as e:
            # Report HTTP failures the same way the other DeepCode tools do,
            # so the caller sees the status code and response body.
            return (
                f"Error: DeepCode API returned status {e.response.status_code}: {e.response.text}"
            )
        except Exception as e:
            return f"Error listing tasks: {str(e)}"


class DeepCodeCancelTool(Tool):
    """Tool that asks the DeepCode backend to cancel a task."""

    def __init__(self, api_url: str | None = None):
        # An explicit URL wins; otherwise defer to the module-level helper.
        self._api_url = api_url if api_url else _get_deepcode_url()

    @property
    def name(self) -> str:
        return "deepcode_cancel"

    @property
    def description(self) -> str:
        return "Cancel a running DeepCode code generation task."

    @property
    def parameters(self) -> dict[str, Any]:
        task_id_schema = {
            "type": "string",
            "description": "The task ID to cancel",
        }
        return {
            "type": "object",
            "properties": {"task_id": task_id_schema},
            "required": ["task_id"],
        }

    async def execute(self, task_id: str, **kwargs: Any) -> str:
        """
        POST to the cancel endpoint for ``task_id``.

        Returns:
            A success message when the backend answers with a non-error
            status, otherwise a string starting with "Error" (a 400 is
            reported as "not found or cannot be cancelled").
        """
        cancel_url = None
        try:
            cancel_url = f"{self._api_url}/api/v1/workflows/cancel/{task_id}"
            async with httpx.AsyncClient(timeout=15.0) as client:
                response = await client.post(cancel_url)
                response.raise_for_status()
            return f"Task '{task_id}' has been cancelled successfully."
        except httpx.ConnectError:
            return "Error: Cannot connect to DeepCode backend. Is the DeepCode service running?"
        except httpx.HTTPStatusError as exc:
            failed = exc.response
            if failed.status_code == 400:
                return f"Error: Task '{task_id}' not found or cannot be cancelled."
            return f"Error: DeepCode API returned status {failed.status_code}: {failed.text}"
        except Exception as exc:
            return f"Error cancelling task: {exc!s}"


class DeepCodeRespondTool(Tool):
    """Respond to a DeepCode User-in-Loop interaction request."""

    def __init__(self, api_url: str | None = None):
        self._api_url = api_url or _get_deepcode_url()

    @property
    def name(self) -> str:
        return "deepcode_respond"

    @property
    def description(self) -> str:
        return (
            "Respond to a DeepCode User-in-Loop interaction. "
            "When a DeepCode task is waiting for user input (e.g. requirement clarification, "
            "plan review), use this tool to submit the user's response. "
            "First check deepcode_status to see the pending interaction details."
        )

    @property
    def parameters(self) -> dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "task_id": {
                    "type": "string",
                    "description": "The task ID that is waiting for input",
                },
                "action": {
                    "type": "string",
                    "enum": ["submit", "confirm", "modify", "skip", "cancel"],
                    "description": "User's action: submit answers, confirm plan, modify, skip, or cancel",
                },
                "data": {
                    "type": "object",
                    "description": "Response data (e.g. answers to questions, modification feedback)",
                },
                "skipped": {
                    "type": "boolean",
                    "description": "Whether the user chose to skip this interaction. Default: false",
                },
            },
            "required": ["task_id", "action"],
        }

    async def execute(
        self,
        task_id: str,
        action: str,
        data: dict | None = None,
        skipped: bool = False,
        **kwargs: Any,
    ) -> str:
        """
        Submit the user's response for the interaction pending on ``task_id``.

        Args:
            task_id: Task whose respond endpoint is called.
            action: Forwarded as ``action`` in the JSON body.
            data: Forwarded as ``data``; a falsy value is sent as ``{}``.
            skipped: Forwarded as ``skipped``.
            **kwargs: Accepted for call compatibility; not used.

        Returns:
            A confirmation message on success, otherwise a string starting
            with "Error". For a 400 response the backend's ``detail`` field
            is reported when the body is a JSON object.
        """
        try:
            async with httpx.AsyncClient(timeout=30.0) as client:
                response = await client.post(
                    f"{self._api_url}/api/v1/workflows/respond/{task_id}",
                    json={
                        "action": action,
                        "data": data or {},
                        "skipped": skipped,
                    },
                )
                response.raise_for_status()
                response.json()  # validate JSON response
                return (
                    f"Response submitted successfully!\n"
                    f"Task ID: {task_id}\n"
                    f"Action: {action}\n"
                    f"The workflow will now continue."
                )
        except httpx.ConnectError:
            return "Error: Cannot connect to DeepCode backend. Is the DeepCode service running?"
        except httpx.HTTPStatusError as e:
            if e.response.status_code == 400:
                # An exception raised inside this handler would NOT be caught
                # by the `except Exception` clause below, so parse the body
                # defensively: it may be non-JSON or not a JSON object.
                try:
                    body = e.response.json()
                except ValueError:
                    body = None
                if isinstance(body, dict):
                    detail = body.get("detail", "Unknown error")
                else:
                    detail = e.response.text or "Unknown error"
                return f"Error: {detail}"
            return (
                f"Error: DeepCode API returned status {e.response.status_code}: {e.response.text}"
            )
        except Exception as e:
            return f"Error responding to interaction: {str(e)}"


# ============================================================
# Helper: create all DeepCode tools at once
# ============================================================


def create_all_tools(api_url: str | None = None) -> list[Tool]:
    """
    Instantiate every DeepCode tool against a single API URL.

    When ``api_url`` is falsy the URL is obtained from ``_get_deepcode_url()``.
    The returned list keeps a fixed order: paper2code, chat2code, status,
    list-tasks, cancel, respond.

    Usage in AgentLoop._register_default_tools():
        deepcode_url = os.environ.get("DEEPCODE_API_URL")
        if deepcode_url:
            from nanobot.agent.tools.deepcode import create_all_tools
            for tool in create_all_tools(api_url=deepcode_url):
                self.tools.register(tool)
    """
    resolved_url = api_url if api_url else _get_deepcode_url()
    tool_classes = (
        DeepCodePaper2CodeTool,
        DeepCodeChat2CodeTool,
        DeepCodeStatusTool,
        DeepCodeListTasksTool,
        DeepCodeCancelTool,
        DeepCodeRespondTool,
    )
    return [tool_cls(api_url=resolved_url) for tool_cls in tool_classes]


================================================
FILE: nanobot/nanobot/agent/tools/filesystem.py
================================================
"""File system tools: read, write, edit."""

from pathlib import Path
from typing import Any

from nanobot.agent.tools.base import Tool


def _resolve_path(path: str, allowed_dir: Path | None = None) -> Path:
    """Resolve path and optionally enforce directory restriction."""
    resolved = Path(path).expanduser().resolve()
    if allowed_dir and not str(resolved).startswith(str(allowed_dir.resolve())):
        raise PermissionError(f"Path {path} is outside allowed directory {allowed_dir}")
    return resolved


class ReadFileTool(Tool):
    """Tool that returns the UTF-8 text of a file."""

    def __init__(self, allowed_dir: Path | None = None):
        # Optional directory restriction handed to _resolve_path on each call.
        self._allowed_dir = allowed_dir

    @property
    def name(self) -> str:
        return "read_file"

    @property
    def description(self) -> str:
        return "Read the contents of a file at the given path."

    @property
    def parameters(self) -> dict[str, Any]:
        path_schema = {"type": "string", "description": "The file path to read"}
        return {
            "type": "object",
            "properties": {"path": path_schema},
            "required": ["path"],
        }

    async def execute(self, path: str, **kwargs: Any) -> str:
        """
        Read ``path`` as UTF-8 text.

        Returns:
            The file contents, or a string starting with "Error" when the
            path is missing, is not a regular file, is not permitted, or
            cannot be read.
        """
        try:
            target = _resolve_path(path, self._allowed_dir)
            if not target.exists():
                return f"Error: File not found: {path}"
            if not target.is_file():
                return f"Error: Not a file: {path}"
            return target.read_text(encoding="utf-8")
        except PermissionError as exc:
            return f"Error: {exc}"
        except Exception as exc:
            return f"Error reading file: {exc!s}"


class WriteFileTool(Tool):
    """Tool to write content to a file."""

    def __init__(self, allowed_dir: Path | None = None):
        # Optional directory restriction handed to _resolve_path on each call.
        self._allowed_dir = allowed_dir

    @property
    def name(self) -> str:
        return "write_file"

    @property
    def description(self) -> str:
        return "Write content to a file at the given path. Creates parent directories if needed."

    @property
    def parameters(self) -> dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "path": {"type": "string", "description": "The file path to write to"},
                "content": {"type": "string", "description": "The content to write"},
            },
            "required": ["path", "content"],
        }

    async def execute(self, path: str, content: str, **kwargs: Any) -> str:
        """
        Write ``content`` to ``path`` as UTF-8, replacing any existing file.

        Missing parent directories are created first.

        Returns:
            A success message reporting the number of bytes on disk, or a
            string starting with "Error" when the path is not permitted or
            the write fails.
        """
        try:
            file_path = _resolve_path(path, self._allowed_dir)
            file_path.parent.mkdir(parents=True, exist_ok=True)
            file_path.write_text(content, encoding="utf-8")
            # len(content) counts characters, which differs from the byte
            # count for non-ASCII text; report the real size of the file.
            written = file_path.stat().st_size
            return f"Successfully wrote {written} bytes to {path}"
        except PermissionError as e:
            return f"Error: {e}"
        except Exception as e:
            return f"Error writing file: {str(e)}"


class EditFileTool(Tool):
    """Tool that replaces one exact, unique text fragment inside a file."""

    def __init__(self, allowed_dir: Path | None = None):
        # Optional directory restriction handed to _resolve_path on each call.
        self._allowed_dir = allowed_dir

    @property
    def name(self) -> str:
        return "edit_file"

    @property
    def description(self) -> str:
        return "Edit a file by replacing old_text with new_text. The old_text must exist exactly in the file."

    @property
    def parameters(self) -> dict[str, Any]:
        properties = {
            "path": {"type": "string", "description": "The file path to edit"},
            "old_text": {"type": "string", "description": "The exact text to find and replace"},
            "new_text": {"type": "string", "description": "The text to replace with"},
        }
        return {
            "type": "object",
            "properties": properties,
            "required": ["path", "old_text", "new_text"],
        }

    async def execute(self, path: str, old_text: str, new_text: str, **kwargs: Any) -> str:
        """
        Replace the single occurrence of ``old_text`` in ``path`` with ``new_text``.

        The file is left untouched when ``old_text`` is absent or appears
        more than once.

        Returns:
            A success message, a "Warning" string when the match is
            ambiguous, or a string starting with "Error" otherwise.
        """
        try:
            target = _resolve_path(path, self._allowed_dir)
            if not target.exists():
                return f"Error: File not found: {path}"

            original = target.read_text(encoding="utf-8")

            # One scan answers both questions: is it present, and is it unique?
            occurrences = original.count(old_text)
            if occurrences == 0:
                return "Error: old_text not found in file. Make sure it matches exactly."
            if occurrences > 1:
                return f"Warning: old_text appears {occurrences} times. Please provide more context to make it unique."

            target.write_text(original.replace(old_text, new_text, 1), encoding="utf-8")
            return f"Successfully edited {path}"
        except PermissionError as exc:
            return f"Error: {exc}"
        except Exception as exc:
            return f"Error editing file: {exc!s}"


class ListDirTool(Tool):
    """Tool that lists the entries of a directory, one per line."""

    def __init__(self, allowed_dir: Path | None = None):
        # Optional directory restriction handed to _resolve_path on each call.
        self._allowed_dir = allowed_dir

    @property
    def name(self) -> str:
        return "list_dir"

    @property
    def description(self) -> str:
        return "List the contents of a directory."

    @property
    def parameters(self) -> dict[str, Any]:
        path_schema = {"type": "string", "description": "The directory path to list"}
        return {
            "type": "object",
            "properties": {"path": path_schema},
            "required": ["path"],
        }

    async def execute(self, path: str, **kwargs: Any) -> str:
        """
        List the entries of ``path`` in sorted order.

        Each entry is prefixed with a folder or document icon depending on
        whether it is a directory.

        Returns:
            The newline-joined listing, a note that the directory is empty,
            or a string starting with "Error".
        """
        try:
            target = _resolve_path(path, self._allowed_dir)
            if not target.exists():
                return f"Error: Directory not found: {path}"
            if not target.is_dir():
                return f"Error: Not a directory: {path}"

            entries = [
                ("📁 " if child.is_dir() else "📄 ") + child.name
                for child in sorted(target.iterdir())
            ]
            if entries:
                return "\n".join(entries)
            return f"Directory {path} is empty"
        except PermissionError as exc:
            return f"Error: {exc}"
        except Exception as exc:
            return f"Error listing directory: {exc!s}"


================================================
FILE: nanobot/nanobot/agent/tools/message.py
================================================
"""Message tool for sending messages to users."""

from typing import Any, Awaitable, Callable

from nanobot.agent.tools.base import Tool
from nanobot.bus.events import OutboundMessage


class MessageTool(Tool):
    """Tool that delivers a message to a chat channel through a send callback."""

    def __init__(
        self,
        send_callback: Callable[[OutboundMessage], Awaitable[None]] | None = None,
        default_channel: str = "",
        default_chat_id: str = "",
    ):
        self._send_callback = send_callback
        self._default_channel = default_channel
        self._default_chat_id = default_chat_id

    def set_context(self, channel: str, chat_id: str) -> None:
        """Replace the default channel and chat ID used when a call omits them."""
        self._default_channel, self._default_chat_id = channel, chat_id

    def set_send_callback(self, callback: Callable[[OutboundMessage], Awaitable[None]]) -> None:
        """Install the coroutine function used to deliver outbound messages."""
        self._send_callback = callback

    @property
    def name(self) -> str:
        return "message"

    @property
    def description(self) -> str:
        return "Send a message to the user. Use this when you want to communicate something."

    @property
    def parameters(self) -> dict[str, Any]:
        properties = {
            "content": {"type": "string", "description": "The message content to send"},
            "channel": {
                "type": "string",
                "description": "Optional: target channel (telegram, discord, etc.)",
            },
            "chat_id": {"type": "string", "description": "Optional: target chat/user ID"},
        }
        return {
            "type": "object",
            "properties": properties,
            "required": ["content"],
        }

    async def execute(
        self, content: str, channel: str | None = None, chat_id: str | None = None, **kwargs: Any
    ) -> str:
        """
        Send ``content`` to the given (or default) channel and chat.

        Returns:
            A confirmation naming the target, or a string starting with
            "Error" when no target is known, no callback is configured, or
            the callback raises.
        """
        target_channel = channel or self._default_channel
        target_chat = chat_id or self._default_chat_id

        # Both halves of the address are required.
        if not (target_channel and target_chat):
            return "Error: No target channel/chat specified"

        if not self._send_callback:
            return "Error: Message sending not configured"

        outbound = OutboundMessage(channel=target_channel, chat_id=target_chat, content=content)

        try:
            await self._send_callback(outbound)
        except Exception as exc:
            return f"Error sending message: {exc!s}"
        return f"Message sent to {target_channel}:{target_chat}"


================================================
FILE: nanobot/nanobot/agent/tools/registry.py
================================================
"""Tool registry for dynamic tool management."""

from typing import Any

from nanobot.agent.tools.base import Tool


class ToolRegistry:
    """
    Name-indexed collection of agent tools.

    Tools are stored under their ``name`` and can be registered, removed,
    looked up, described, and executed at runtime.
    """

    def __init__(self):
        self._tools: dict[str, Tool] = {}

    def register(self, tool: Tool) -> None:
        """Store ``tool`` under its name, replacing any tool already there."""
        self._tools[tool.name] = tool

    def unregister(self, name: str) -> None:
        """Remove the tool called ``name``; unknown names are ignored."""
        self._tools.pop(name, None)

    def get(self, name: str) -> Tool | None:
        """Return the tool called ``name``, or None when it is not registered."""
        return self._tools.get(name)

    def has(self, name: str) -> bool:
        """Report whether a tool called ``name`` is registered."""
        return name in self._tools

    def get_definitions(self) -> list[dict[str, Any]]:
        """Return ``to_schema()`` of every registered tool, in registration order."""
        return [registered.to_schema() for registered in self._tools.values()]

    async def execute(self, name: str, params: dict[str, Any]) -> str:
        """
        Validate ``params`` and run the tool called ``name``.

        Args:
            name: Tool name.
            params: Keyword arguments passed to the tool's ``execute``.

        Returns:
            The tool's result string. An unknown tool, invalid parameters,
            or an exception raised during validation or execution is
            reported as a string starting with "Error" instead of being
            raised.
        """
        tool = self._tools.get(name)
        if not tool:
            return f"Error: Tool '{name}' not found"

        try:
            problems = tool.validate_params(params)
            if not problems:
                return await tool.execute(**params)
            return f"Error: Invalid parameters for tool '{name}': " + "; ".join(problems)
        except Exception as exc:
            return f"Error executing {name}: {exc!s}"

    @property
    def tool_names(self) -> list[str]:
        """Names of all registered tools, in registration order."""
        return list(self._tools)

    def __len__(self) -> int:
        return len(self._tools)

    def __contains__(self, name: str) -> bool:
        return name in self._tools


================================================
FILE: nanobot/nanobot/agent/tools/shell.py
================================================
"""Shell execution tool."""

import asyncio
import os
import re
from pathlib import Path
from typing import Any

from nanobot.agent.tools.base import Tool


class ExecTool(Tool):
    """
    Tool to execute shell commands.

    Each command is screened by a best-effort guard (deny/allow regexes and
    an optional working-directory restriction) and then run through the
    system shell with a timeout.
    """

    def __init__(
        self,
        timeout: int = 60,
        working_dir: str | None = None,
        deny_patterns: list[str] | None = None,
        allow_patterns: list[str] | None = None,
        restrict_to_workspace: bool = False,
    ):
        """
        Args:
            timeout: Seconds to wait for a command before killing it.
            working_dir: Default working directory; when unset, the process
                working directory is used.
            deny_patterns: Regexes that block a command when they match its
                lower-cased text. A falsy value (None or an empty list)
                selects the built-in defaults below.
            allow_patterns: When non-empty, a command must match at least
                one of these regexes to run.
            restrict_to_workspace: Also reject path traversal and absolute
                paths that resolve outside the working directory.
        """
        self.timeout = timeout
        self.working_dir = working_dir
        self.deny_patterns = deny_patterns or [
            r"\brm\s+-[rf]{1,2}\b",  # rm -r, rm -rf, rm -fr
            r"\bdel\s+/[fq]\b",  # del /f, del /q
            r"\brmdir\s+/s\b",  # rmdir /s
            r"\b(format|mkfs|diskpart)\b",  # disk operations
            r"\bdd\s+if=",  # dd
            r">\s*/dev/sd",  # write to disk
            r"\b(shutdown|reboot|poweroff)\b",  # system power
            r":\(\)\s*\{.*\};\s*:",  # fork bomb
        ]
        self.allow_patterns = allow_patterns or []
        self.restrict_to_workspace = restrict_to_workspace

    @property
    def name(self) -> str:
        return "exec"

    @property
    def description(self) -> str:
        return "Execute a shell command and return its output. Use with caution."

    @property
    def parameters(self) -> dict[str, Any]:
        return {
            "type": "object",
            "properties": {
                "command": {"type": "string", "description": "The shell command to execute"},
                "working_dir": {
                    "type": "string",
                    "description": "Optional working directory for the command",
                },
            },
            "required": ["command"],
        }

    async def execute(self, command: str, working_dir: str | None = None, **kwargs: Any) -> str:
        """
        Run ``command`` in a shell and return its combined output.

        Args:
            command: Shell command line to run.
            working_dir: Working directory for this call; falls back to the
                instance default and then to the process working directory.
            **kwargs: Accepted for call compatibility; not used.

        Returns:
            stdout, followed by a "STDERR:" section when stderr is not
            blank and an "Exit code:" line when the exit status is
            non-zero; "(no output)" when there is nothing to report. Output
            longer than 10000 characters is truncated. Guard rejections,
            timeouts and other failures are returned as strings starting
            with "Error".
        """
        cwd = working_dir or self.working_dir or os.getcwd()
        guard_error = self._guard_command(command, cwd)
        if guard_error:
            return guard_error

        try:
            process = await asyncio.create_subprocess_shell(
                command,
                stdout=asyncio.subprocess.PIPE,
                stderr=asyncio.subprocess.PIPE,
                cwd=cwd,
            )

            try:
                stdout, stderr = await asyncio.wait_for(process.communicate(), timeout=self.timeout)
            except asyncio.TimeoutError:
                process.kill()
                # Reap the killed child so it does not linger as a zombie
                # with an open transport. The wait is bounded because
                # descendants of the shell may keep the pipes open.
                try:
                    await asyncio.wait_for(process.wait(), timeout=5.0)
                except asyncio.TimeoutError:
                    pass
                return f"Error: Command timed out after {self.timeout} seconds"

            output_parts = []

            if stdout:
                output_parts.append(stdout.decode("utf-8", errors="replace"))

            if stderr:
                stderr_text = stderr.decode("utf-8", errors="replace")
                if stderr_text.strip():
                    output_parts.append(f"STDERR:\n{stderr_text}")

            if process.returncode != 0:
                output_parts.append(f"\nExit code: {process.returncode}")

            result = "\n".join(output_parts) if output_parts else "(no output)"

            # Truncate very long output
            max_len = 10000
            if len(result) > max_len:
                result = result[:max_len] + f"\n... (truncated, {len(result) - max_len} more chars)"

            return result

        except Exception as e:
            return f"Error executing command: {str(e)}"

    def _guard_command(self, command: str, cwd: str) -> str | None:
        """
        Best-effort safety guard for potentially destructive commands.

        Args:
            command: Command line about to be executed.
            cwd: Working directory the command will run in.

        Returns:
            An error string when the command is blocked, otherwise None.
        """
        cmd = command.strip()
        # Patterns are matched against the lower-cased command.
        lower = cmd.lower()

        for pattern in self.deny_patterns:
            if re.search(pattern, lower):
                return "Error: Command blocked by safety guard (dangerous pattern detected)"

        if self.allow_patterns:
            if not any(re.search(p, lower) for p in self.allow_patterns):
                return "Error: Command blocked by safety guard (not in allowlist)"

        if self.restrict_to_workspace:
            if "..\\" in cmd or "../" in cmd:
                return "Error: Command blocked by safety guard (path traversal detected)"

            cwd_path = Path(cwd).resolve()

            # NOTE(review): the POSIX pattern matches from any "/" in the
            # command, so the tail of a relative path such as "src/main.py"
            # is treated as the absolute path "/main.py" — confirm whether
            # that strictness is intended.
            win_paths = re.findall(r"[A-Za-z]:\\[^\\\"']+", cmd)
            posix_paths = re.findall(r"/[^\s\"']+", cmd)

            for raw in win_paths + posix_paths:
                try:
                    p = Path(raw).resolve()
                except Exception:
                    continue
                # Allow only the working directory itself or paths below it.
                if cwd_path not in p.parents and p != cwd_path:
                    return "Error: Command blocked by safety guard (path outside working dir)"

        return None


================================================
FILE: nanobot/nanobot/agent/tools/spawn.py
================================================
"""Spawn tool for creating background subagents."""

from typing import TYPE_CHECKING, Any

from nanobot.agent.tools.base import Tool

if TYPE_CHECKING:
    from nanobot.agent.subagent import SubagentManager


class SpawnTool(Tool):
    """
    Tool that hands a task over to a background subagent.

    Spawning is delegated to the ``SubagentManager`` supplied at construction,
    together with the channel and chat the request originated from so the
    manager knows where the result belongs.
    """

    def __init__(self, manager: "SubagentManager"):
        # Defaults describe a direct CLI session until set_context() is called.
        self._origin_channel, self._origin_chat_id = "cli", "direct"
        self._manager = manager

    def set_context(self, channel: str, chat_id: str) -> None:
        """Record which channel/chat subsequent spawns originate from."""
        self._origin_channel, self._origin_chat_id = channel, chat_id

    @property
    def name(self) -> str:
        """Identifier under which the tool is exposed."""
        return "spawn"

    @property
    def description(self) -> str:
        """Human-readable explanation of when to use the tool."""
        sentences = (
            "Spawn a subagent to handle a task in the background. ",
            "Use this for complex or time-consuming tasks that can run independently. ",
            "The subagent will complete the task and report back when done.",
        )
        return "".join(sentences)

    @property
    def parameters(self) -> dict[str, Any]:
        """JSON-schema description of the accepted arguments."""
        task_schema = {
            "type": "string",
            "description": "The task for the subagent to complete",
        }
        label_schema = {
            "type": "string",
            "description": "Optional short label for the task (for display)",
        }
        return {
            "type": "object",
            "properties": {"task": task_schema, "label": label_schema},
            "required": ["task"],
        }

    async def execute(self, task: str, label: str | None = None, **kwargs: Any) -> str:
        """Ask the manager to spawn a subagent for *task* and return its reply."""
        origin = {
            "origin_channel": self._origin_channel,
            "origin_chat_id": self._origin_chat_id,
        }
        return await self._manager.spawn(task=task, label=label, **origin)


================================================
FILE: nanobot/nanobot/agent/tools/web.py
================================================
"""Web tools: web_search and web_fetch."""

import html
import json
import os
import re
from typing import Any
from urllib.parse import urlparse

import httpx

from nanobot.agent.tools.base import Tool

# Shared constants
# User-Agent header value sent by WebFetchTool when requesting a page.
USER_AGENT = "Mozilla/5.0 (Macintosh; Intel Mac OS X 14_7_2) AppleWebKit/537.36"
# Passed to the HTTP client as max_redirects when WebFetchTool follows redirects.
MAX_REDIRECTS = 5  # Limit redirects to prevent DoS attacks


def _strip_tags(text: str) -> str:
    """Remove HTML tags and decode entities."""
    text = re.sub(r"<script[\s\S]*?</script>", "", text, flags=re.I)
    text = re.sub(r"<style[\s\S]*?</style>", "", text, flags=re.I)
    text = re.sub(r"<[^>]+>", "", text)
    return html.unescape(text).strip()


def _normalize(text: str) -> str:
    """Normalize whitespace."""
    text = re.sub(r"[ \t]+", " ", text)
    return re.sub(r"\n{3,}", "\n\n", text).strip()


def _validate_url(url: str) -> tuple[bool, str]:
    """Validate URL: must be http(s) with valid domain."""
    try:
        p = urlparse(url)
        if p.scheme not in ("http", "https"):
            return False, f"Only http/https allowed, got '{p.scheme or 'none'}'"
        if not p.netloc:
            return False, "Missing domain"
        return True, ""
    except Exception as e:
        return False, str(e)


class WebSearchTool(Tool):
    """Web search backed by the Brave Search API."""

    name = "web_search"
    description = "Search the web. Returns titles, URLs, and snippets."
    parameters = {
        "type": "object",
        "properties": {
            "query": {"type": "string", "description": "Search query"},
            "count": {
                "type": "integer",
                "description": "Results (1-10)",
                "minimum": 1,
                "maximum": 10,
            },
        },
        "required": ["query"],
    }

    def __init__(self, api_key: str | None = None, max_results: int = 5):
        """Store the API key (argument first, then ``BRAVE_API_KEY``) and default count."""
        self.max_results = max_results
        self.api_key = api_key or os.environ.get("BRAVE_API_KEY", "")

    async def execute(self, query: str, count: int | None = None, **kwargs: Any) -> str:
        """Run *query* and return a numbered plain-text list of hits.

        Any failure (HTTP error, malformed payload, ...) is returned as an
        ``"Error: ..."`` string rather than raised.
        """
        if not self.api_key:
            return "Error: BRAVE_API_KEY not configured"

        try:
            # Clamp the requested number of results into the 1..10 range.
            limit = min(max(count or self.max_results, 1), 10)
            async with httpx.AsyncClient() as client:
                response = await client.get(
                    "https://api.search.brave.com/res/v1/web/search",
                    params={"q": query, "count": limit},
                    headers={"Accept": "application/json", "X-Subscription-Token": self.api_key},
                    timeout=10.0,
                )
                response.raise_for_status()

            hits = response.json().get("web", {}).get("results", [])
            if not hits:
                return f"No results for: {query}"

            report = [f"Results for: {query}\n"]
            for rank, hit in enumerate(hits[:limit], 1):
                report.append(f"{rank}. {hit.get('title', '')}\n   {hit.get('url', '')}")
                snippet = hit.get("description")
                if snippet:
                    report.append(f"   {snippet}")
            return "\n".join(report)
        except Exception as exc:
            return f"Error: {exc}"


class WebFetchTool(Tool):
    """Fetch a URL and return its readable content as a JSON string.

    JSON responses are re-serialised with indentation, HTML is reduced to its
    main content with Readability (rendered as markdown or tag-stripped text)
    and any other content is returned verbatim.
    """

    name = "web_fetch"
    description = "Fetch URL and extract readable content (HTML → markdown/text)."
    parameters = {
        "type": "object",
        "properties": {
            "url": {"type": "string", "description": "URL to fetch"},
            "extractMode": {"type": "string", "enum": ["markdown", "text"], "default": "markdown"},
            "maxChars": {"type": "integer", "minimum": 100},
        },
        "required": ["url"],
    }

    def __init__(self, max_chars: int = 50000):
        """Remember the default cap on the number of characters returned."""
        self.max_chars = max_chars

    async def execute(
        self,
        url: str,
        extract_mode: str = "markdown",
        max_chars: int | None = None,
        **kwargs: Any,
    ) -> str:
        """Fetch *url* and return a JSON document describing the result.

        Args:
            url: http(s) URL to fetch.
            extract_mode: ``"markdown"`` converts HTML to markdown; any other
                value yields tag-stripped plain text.
            max_chars: Per-call cap on the returned text; ``self.max_chars``
                is used when omitted (or falsy).
            **kwargs: May carry the camelCase aliases ``extractMode`` and
                ``maxChars`` advertised in ``parameters``.

        Returns:
            A JSON string with ``url``, ``finalUrl``, ``status``,
            ``extractor``, ``truncated``, ``length`` and ``text`` on success,
            or with ``error`` and ``url`` on any failure.
        """
        # Backward compatibility for callers using camelCase argument names
        if "extractMode" in kwargs and extract_mode == "markdown":
            extract_mode = kwargs["extractMode"]
        if "maxChars" in kwargs and max_chars is None:
            max_chars = kwargs["maxChars"]

        max_chars = max_chars or self.max_chars

        # Validate URL before fetching
        is_valid, error_msg = _validate_url(url)
        if not is_valid:
            return json.dumps({"error": f"URL validation failed: {error_msg}", "url": url})

        try:
            async with httpx.AsyncClient(
                follow_redirects=True, max_redirects=MAX_REDIRECTS, timeout=30.0
            ) as client:
                r = await client.get(url, headers={"User-Agent": USER_AGENT})
                r.raise_for_status()

            ctype = r.headers.get("content-type", "")

            # JSON
            if "application/json" in ctype:
                text, extractor = json.dumps(r.json(), indent=2), "json"
            # HTML (by header, or sniffed from the start of the body)
            elif "text/html" in ctype or r.text[:256].lower().startswith(("<!doctype", "<html")):
                # Imported here, inside the try block, so an import failure is
                # reported as a JSON error like every other failure and JSON /
                # raw fetches do not need the package at all.
                from readability import Document

                doc = Document(r.text)
                content = (
                    self._to_markdown(doc.summary())
                    if extract_mode == "markdown"
                    else _strip_tags(doc.summary())
                )
                title = doc.title()
                text = f"# {title}\n\n{content}" if title else content
                extractor = "readability"
            else:
                text, extractor = r.text, "raw"

            truncated = len(text) > max_chars
            if truncated:
                text = text[:max_chars]

            return json.dumps(
                {
                    "url": url,
                    "finalUrl": str(r.url),
                    "status": r.status_code,
                    "extractor": extractor,
                    "truncated": truncated,
                    "length": len(text),  # length after truncation
                    "text": text,
                }
            )
        except Exception as e:
            return json.dumps({"error": str(e), "url": url})

    def _to_markdown(self, html: str) -> str:
        """Convert an HTML fragment to lightweight markdown.

        Links, headings and list items are rewritten first; block-level
        closers and ``<br>``/``<hr>`` become newlines; all remaining tags are
        then stripped and whitespace is normalised.

        Note: the ``html`` parameter shadows the module-level ``html`` import
        inside this method only.
        """
        # Convert links, headings, lists before stripping tags
        text = re.sub(
            r'<a\s+[^>]*href=["\']([^"\']+)["\'][^>]*>([\s\S]*?)</a>',
            lambda m: f"[{_strip_tags(m[2])}]({m[1]})",
            html,
            flags=re.I,
        )
        text = re.sub(
            r"<h([1-6])[^>]*>([\s\S]*?)</h\1>",
            lambda m: f'\n{"#" * int(m[1])} {_strip_tags(m[2])}\n',
            text,
            flags=re.I,
        )
        text = re.sub(
            r"<li[^>]*>([\s\S]*?)</li>", lambda m: f"\n- {_strip_tags(m[1])}", text, flags=re.I
        )
        # Closing block elements become paragraph breaks, <br>/<hr> line breaks.
        text = re.sub(r"</(p|div|section|article)>", "\n\n", text, flags=re.I)
        text = re.sub(r"<(br|hr)\s*/?>", "\n", text, flags=re.I)
        return _normalize(_strip_tags(text))


================================================
FILE: nanobot/nanobot/bus/__init__.py
================================================
"""Message bus module for decoupled channel-agent communication."""

from nanobot.bus.events import InboundMessage, OutboundMessage
from nanobot.bus.queue import MessageBus

__all__ = ["MessageBus", "InboundMessage", "OutboundMessage"]


================================================
FILE: nanobot/nanobot/bus/events.py
================================================
"""Event types for the message bus."""

from dataclasses import dataclass, field
from datetime import datetime
from typing import Any


@dataclass
class InboundMessage:
    """An incoming chat message as handed over by a channel."""

    # Required fields, in positional order.
    channel: str  # Originating platform, e.g. telegram, discord, slack, whatsapp
    sender_id: str  # Identifier of the sending user
    chat_id: str  # Identifier of the chat/channel the message was posted in
    content: str  # Text of the message

    # Optional fields; every instance gets its own freshly built default.
    timestamp: datetime = field(default_factory=datetime.now)
    media: list[str] = field(default_factory=list)  # Media URLs
    metadata: dict[str, Any] = field(default_factory=dict)  # Channel-specific data

    @property
    def session_key(self) -> str:
        """Session identifier in the form ``<channel>:<chat_id>``."""
        return "{}:{}".format(self.channel, self.chat_id)


@dataclass
class OutboundMessage:
    """Message to send to a chat channel."""

    channel: str  # Name of the destination channel
    chat_id: str  # Chat/channel identifier within that channel
    content: str  # Message text
    reply_to: str | None = None  # Optional ID of the message being replied to
    media: list[str] = field(default_factory=list)  # presumably media references, as on InboundMessage - confirm
    metadata: dict[str, Any] = field(default_factory=dict)  # presumably channel-specific data - confirm


================================================
FILE: nanobot/nanobot/bus/queue.py
================================================
"""Async message queue for decoupled channel-agent communication."""

import asyncio
from typing import Awaitable, Callable

from loguru import logger

from nanobot.bus.events import InboundMessage, OutboundMessage


class MessageBus:
    """
    Pair of async queues sitting between the chat channels and the agent core.

    Channels put what they receive on ``inbound``; the agent takes it from
    there and puts its replies on ``outbound``, from where they are either
    consumed directly or fanned out to per-channel subscribers.
    """

    def __init__(self):
        self._running = False
        # channel name -> callbacks to invoke for each outbound message
        self._outbound_subscribers: dict[
            str, list[Callable[[OutboundMessage], Awaitable[None]]]
        ] = {}
        self.inbound: asyncio.Queue[InboundMessage] = asyncio.Queue()
        self.outbound: asyncio.Queue[OutboundMessage] = asyncio.Queue()

    async def publish_inbound(self, msg: InboundMessage) -> None:
        """Enqueue a message coming from a channel for the agent."""
        await self.inbound.put(msg)

    async def consume_inbound(self) -> InboundMessage:
        """Wait for and return the next inbound message."""
        return await self.inbound.get()

    async def publish_outbound(self, msg: OutboundMessage) -> None:
        """Enqueue an agent response for delivery to a channel."""
        await self.outbound.put(msg)

    async def consume_outbound(self) -> OutboundMessage:
        """Wait for and return the next outbound message."""
        return await self.outbound.get()

    def subscribe_outbound(
        self, channel: str, callback: Callable[[OutboundMessage], Awaitable[None]]
    ) -> None:
        """Register *callback* for outbound messages addressed to *channel*."""
        self._outbound_subscribers.setdefault(channel, []).append(callback)

    async def dispatch_outbound(self) -> None:
        """
        Deliver outbound messages to the callbacks subscribed to their channel.

        Intended to run as a background task; it loops until ``stop()`` is
        called, re-checking the flag at least once per second.
        """
        self._running = True
        while self._running:
            try:
                message = await asyncio.wait_for(self.outbound.get(), timeout=1.0)
            except asyncio.TimeoutError:
                # Nothing queued within the poll interval; re-check the flag.
                continue

            for deliver in self._outbound_subscribers.get(message.channel, []):
                try:
                    await deliver(message)
                except Exception as exc:
                    # One failing subscriber must not block the others.
                    logger.error(f"Error dispatching to {message.channel}: {exc}")

    def stop(self) -> None:
        """Ask the dispatcher loop to exit after its current iteration."""
        self._running = False

    @property
    def inbound_size(self) -> int:
        """How many inbound messages are waiting to be consumed."""
        return self.inbound.qsize()

    @property
    def outbound_size(self) -> int:
        """How many outbound messages are waiting to be consumed."""
        return self.outbound.qsize()


================================================
FILE: nanobot/nanobot/channels/__init__.py
================================================
"""Chat channels module with plugin architecture."""

from nanobot.channels.base import BaseChannel
from nanobot.channels.manager import ChannelManager

__all__ = ["BaseChannel", "ChannelManager"]


================================================
FILE: nanobot/nanobot/channels/base.py
================================================
"""Base channel interface for chat platforms."""

from abc import ABC, abstractmethod
from typing import Any

from loguru import logger

from nanobot.bus.events import InboundMessage, OutboundMessage
from nanobot.bus.queue import MessageBus


class BaseChannel(ABC):
    """
    Common interface every chat channel implementation must provide.

    A concrete channel (Telegram, Discord, etc.) implements ``start``,
    ``stop`` and ``send`` and pushes what it receives onto the message bus
    through ``_handle_message``.
    """

    name: str = "base"

    def __init__(self, config: Any, bus: MessageBus):
        """
        Store the collaborators shared by all channels.

        Args:
            config: Channel-specific configuration.
            bus: The message bus for communication.
        """
        self._running = False
        self.bus = bus
        self.config = config

    @abstractmethod
    async def start(self) -> None:
        """
        Connect to the chat platform and listen for messages.

        Implementations are expected to be long-running and to forward each
        incoming message to the bus via ``_handle_message()``.
        """

    @abstractmethod
    async def stop(self) -> None:
        """Shut the channel down and release its resources."""

    @abstractmethod
    async def send(self, msg: OutboundMessage) -> None:
        """
        Deliver *msg* through this channel.

        Args:
            msg: The message to send.
        """

    def is_allowed(self, sender_id: str) -> bool:
        """
        Decide whether *sender_id* may talk to the bot.

        An empty or missing ``allow_from`` list on the config admits everyone.
        Otherwise the id must be listed either as a whole or as one of its
        ``|``-separated parts.

        Args:
            sender_id: The sender's identifier.

        Returns:
            True if allowed, False otherwise.
        """
        permitted = getattr(self.config, "allow_from", [])
        if not permitted:
            return True

        candidate = str(sender_id)
        if candidate in permitted:
            return True

        # Composite ids: any non-empty segment on the list is sufficient.
        return "|" in candidate and any(
            segment and segment in permitted for segment in candidate.split("|")
        )

    async def _handle_message(
        self,
        sender_id: str,
        chat_id: str,
        content: str,
        media: list[str] | None = None,
        metadata: dict[str, Any] | None = None,
    ) -> None:
        """
        Publish an incoming platform message on the bus if the sender is allowed.

        Messages from senders rejected by ``is_allowed`` are logged and dropped.

        Args:
            sender_id: The sender's identifier.
            chat_id: The chat/channel identifier.
            content: Message text content.
            media: Optional list of media URLs.
            metadata: Optional channel-specific metadata.
        """
        if self.is_allowed(sender_id):
            inbound = InboundMessage(
                channel=self.name,
                sender_id=str(sender_id),
                chat_id=str(chat_id),
                content=content,
                media=media or [],
                metadata=metadata or {},
            )
            await self.bus.publish_inbound(inbound)
            return

        logger.warning(
            f"Access denied for sender {sender_id} on channel {self.name}. "
            f"Add them to allowFrom list in config to grant access."
        )

    @property
    def is_running(self) -> bool:
        """Whether the channel currently considers itself running."""
        return self._running


================================================
FILE: nanobot/nanobot/channels/dingtalk.py
================================================
"""DingTalk/DingDing channel implementation using Stream Mode."""

import asyncio
import json
import time
from typing import Any

import httpx
from loguru import logger

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import DingTalkConfig

try:
    from dingtalk_stream import (
        AckMessage,
        CallbackHandler,
        CallbackMessage,
        Credential,
        DingTalkStreamClient,
    )
    from dingtalk_stream.chatbot import ChatbotMessage

    DINGTALK_AVAILABLE = True
except ImportError:
    DINGTALK_AVAILABLE = False
    # Fallback so class definitions don't crash at module level
    CallbackHandler = object  # type: ignore[assignment,misc]
    CallbackMessage = None  # type: ignore[assignment,misc]
    AckMessage = None  # type: ignore[assignment,misc]
    ChatbotMessage = None  # type: ignore[assignment,misc]


class NanobotDingTalkHandler(CallbackHandler):
    """
    Callback handler registered with the DingTalk Stream SDK.

    Extracts the text and sender of each incoming message and passes them on
    to the owning ``DingTalkChannel``.
    """

    def __init__(self, channel: "DingTalkChannel"):
        super().__init__()
        self.channel = channel

    async def process(self, message: CallbackMessage):
        """Handle one stream message and acknowledge it.

        Always returns an ``AckMessage.STATUS_OK`` acknowledgement, even when
        processing fails, so the server does not retry the message.
        """
        try:
            # Let the SDK parse the payload first.
            parsed = ChatbotMessage.from_dict(message.data)

            # Prefer the SDK's text object; fall back to the raw dict if it is empty.
            text = parsed.text.content.strip() if parsed.text else ""
            if not text:
                text = message.data.get("text", {}).get("content", "").strip()

            if not text:
                logger.warning(
                    f"Received empty or unsupported message type: {parsed.message_type}"
                )
                return AckMessage.STATUS_OK, "OK"

            who = parsed.sender_staff_id or parsed.sender_id
            nick = parsed.sender_nick or "Unknown"

            logger.info(f"Received DingTalk message from {nick} ({who}): {text}")

            # Hand over to the channel without blocking the acknowledgement.
            # The task is kept in a set so it is not garbage collected while
            # running and removes itself from the set once finished.
            job = asyncio.create_task(self.channel._on_message(text, who, nick))
            pending = self.channel._background_tasks
            pending.add(job)
            job.add_done_callback(pending.discard)

            return AckMessage.STATUS_OK, "OK"

        except Exception as exc:
            logger.error(f"Error processing DingTalk message: {exc}")
            # Return OK to avoid retry loop from DingTalk server
            return AckMessage.STATUS_OK, "Error"


class DingTalkChannel(BaseChannel):
    """
    DingTalk integration built on the SDK's Stream Mode.

    Incoming events are received through the `dingtalk-stream` client, while
    outgoing messages are posted directly to the DingTalk HTTP API.

    Note: replies are always sent to the sender as a private (1:1) message,
    so group messages are received but answered privately.
    """

    name = "dingtalk"

    def __init__(self, config: DingTalkConfig, bus: MessageBus):
        super().__init__(config, bus)
        self.config: DingTalkConfig = config

        # Stream client and shared HTTP client; both are created in start().
        self._client: Any = None
        self._http: httpx.AsyncClient | None = None

        # Cached access token for the send API and the time until which it is reused.
        self._access_token: str | None = None
        self._token_expiry: float = 0

        # Strong references so fire-and-forget tasks are not garbage collected.
        self._background_tasks: set[asyncio.Task] = set()

    async def start(self) -> None:
        """Create the stream client, register the handler and run until it ends."""
        try:
            if not DINGTALK_AVAILABLE:
                logger.error("DingTalk Stream SDK not installed. Run: pip install dingtalk-stream")
                return

            if not (self.config.client_id and self.config.client_secret):
                logger.error("DingTalk client_id and client_secret not configured")
                return

            self._running = True
            self._http = httpx.AsyncClient()

            logger.info(
                f"Initializing DingTalk Stream Client with Client ID: {self.config.client_id}..."
            )
            stream_client = DingTalkStreamClient(
                Credential(self.config.client_id, self.config.client_secret)
            )
            self._client = stream_client

            # Route chatbot messages to our handler.
            stream_client.register_callback_handler(
                ChatbotMessage.TOPIC, NanobotDingTalkHandler(self)
            )

            logger.info("DingTalk bot started with Stream Mode")

            # client.start() is an async infinite loop handling the websocket connection
            await stream_client.start()

        except Exception as exc:
            logger.exception(f"Failed to start DingTalk channel: {exc}")

    async def stop(self) -> None:
        """Mark the channel stopped, close the HTTP client and cancel pending tasks."""
        self._running = False

        if self._http:
            await self._http.aclose()
            self._http = None

        for pending in self._background_tasks:
            pending.cancel()
        self._background_tasks.clear()

    async def _get_access_token(self) -> str | None:
        """Return a cached access token, fetching a new one when it has expired.

        Returns ``None`` when the HTTP client is missing or the request fails.
        """
        if self._access_token and time.time() < self._token_expiry:
            return self._access_token

        if not self._http:
            logger.warning("DingTalk HTTP client not initialized, cannot refresh token")
            return None

        credentials = {
            "appKey": self.config.client_id,
            "appSecret": self.config.client_secret,
        }

        try:
            resp = await self._http.post(
                "https://api.dingtalk.com/v1.0/oauth2/accessToken", json=credentials
            )
            resp.raise_for_status()
            body = resp.json()
            self._access_token = body.get("accessToken")
            # Stop using the token 60s before its reported lifetime ends.
            lifetime = int(body.get("expireIn", 7200))
            self._token_expiry = time.time() + lifetime - 60
            return self._access_token
        except Exception as exc:
            logger.error(f"Failed to get DingTalk access token: {exc}")
            return None

    async def send(self, msg: OutboundMessage) -> None:
        """Post *msg* to its recipient as a private markdown message."""
        token = await self._get_access_token()
        if not token:
            return

        # oToMessages/batchSend: sends to individual users (private chat)
        # https://open.dingtalk.com/document/orgapp/robot-batch-send-messages
        endpoint = "https://api.dingtalk.com/v1.0/robot/oToMessages/batchSend"

        markdown_body = json.dumps(
            {
                "text": msg.content,
                "title": "Nanobot Reply",
            }
        )
        request_body = {
            "robotCode": self.config.client_id,
            "userIds": [msg.chat_id],  # chat_id is the user's staffId
            "msgKey": "sampleMarkdown",
            "msgParam": markdown_body,
        }
        auth_headers = {"x-acs-dingtalk-access-token": token}

        if not self._http:
            logger.warning("DingTalk HTTP client not initialized, cannot send")
            return

        try:
            resp = await self._http.post(endpoint, json=request_body, headers=auth_headers)
            if resp.status_code == 200:
                logger.debug(f"DingTalk message sent to {msg.chat_id}")
            else:
                logger.error(f"DingTalk send failed: {resp.text}")
        except Exception as exc:
            logger.error(f"Error sending DingTalk message: {exc}")

    async def _on_message(self, content: str, sender_id: str, sender_name: str) -> None:
        """Forward a message received by NanobotDingTalkHandler to the bus.

        Goes through BaseChannel._handle_message(), so the allow_from check is
        applied before anything is published.
        """
        try:
            logger.info(f"DingTalk inbound: {content} from {sender_name}")
            extra = {
                "sender_name": sender_name,
                "platform": "dingtalk",
            }
            await self._handle_message(
                sender_id=sender_id,
                chat_id=sender_id,  # For private chat, chat_id == sender_id
                content=str(content),
                metadata=extra,
            )
        except Exception as exc:
            logger.error(f"Error publishing DingTalk message: {exc}")


================================================
FILE: nanobot/nanobot/channels/discord.py
================================================
"""Discord channel implementation using Discord Gateway websocket."""

import asyncio
import json
from pathlib import Path
from typing import Any

import httpx
import websockets
from loguru import logger

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import DiscordConfig

DISCORD_API_BASE = "https://discord.com/api/v10"
MAX_ATTACHMENT_BYTES = 20 * 1024 * 1024  # 20MB


class DiscordChannel(BaseChannel):
    """Discord channel using Gateway websocket."""

    name = "discord"

    def __init__(self, config: DiscordConfig, bus: MessageBus):
        super().__init__(config, bus)
        self.config: DiscordConfig = config
        self._ws: websockets.WebSocketClientProtocol | None = None
        self._seq: int | None = None
        self._heartbeat_task: asyncio.Task | None = None
        self._typing_tasks: dict[str, asyncio.Task] = {}
        self._http: httpx.AsyncClient | None = None

    async def start(self) -> None:
        """Start the Discord gateway connection."""
        if not self.config.token:
            logger.error("Discord bot token not configured")
            return

        self._running = True
        self._http = httpx.AsyncClient(timeout=30.0)

        while self._running:
            try:
                logger.info("Connecting to Discord gateway...")
                async with websockets.connect(self.config.gateway_url) as ws:
                    self._ws = ws
                    await self._gateway_loop()
            except asyncio.CancelledError:
                break
            except Exception as e:
                logger.warning(f"Discord gateway error: {e}")
                if self._running:
                    logger.info("Reconnecting to Discord gateway in 5 seconds...")
                    await asyncio.sleep(5)

    async def stop(self) -> None:
        """Stop the Discord channel."""
        self._running = False
        if self._heartbeat_task:
            self._heartbeat_task.cancel()
            self._heartbeat_task = None
        for task in self._typing_tasks.values():
            task.cancel()
        self._typing_tasks.clear()
        if self._ws:
            await self._ws.close()
            self._ws = None
        if self._http:
            await self._http.aclose()
            self._http = None

    async def send(self, msg: OutboundMessage) -> None:
        """Send a message through Discord REST API."""
        if not self._http:
            logger.warning("Discord HTTP client not initialized")
            return

        url = f"{DISCORD_API_BASE}/channels/{msg.chat_id}/messages"
        payload: dict[str, Any] = {"content": msg.content}

        if msg.reply_to:
            payload["message_reference"] = {"message_id": msg.reply_to}
            payload["allowed_mentions"] = {"replied_user": False}

        headers = {"Authorization": f"Bot {self.config.token}"}

        try:
            for attempt in range(3):
                try:
                    response = await self._http.post(url, headers=headers, json=payload)
                    if response.status_code == 429:
                        data = response.json()
                        retry_after = float(data.get("retry_after", 1.0))
                        logger.warning(f"Discord rate limited, retrying in {retry_after}s")
                        await asyncio.sleep(retry_after)
                        continue
                    response.raise_for_status()
                    return
                except Exception as e:
                    if attempt == 2:
                        logger.error(f"Error sending Discord message: {e}")
                    else:
                        await asyncio.sleep(1)
        finally:
            await self._stop_typing(msg.chat_id)

    async def _gateway_loop(self) -> None:
        """Main gateway loop: identify, heartbeat, dispatch events."""
        if not self._ws:
            return

        async for raw in self._ws:
            try:
                data = json.loads(raw)
            except json.JSONDecodeError:
                logger.warning(f"Invalid JSON from Discord gateway: {raw[:100]}")
                continue

            op = data.get("op")
            event_type = data.get("t")
            seq = data.get("s")
            payload = data.get("d")

            if seq is not None:
                self._seq = seq

            if op == 10:
                # HELLO: start heartbeat and identify
                interval_ms = payload.get("heartbeat_interval", 45000)
                await self._start_heartbeat(interval_ms / 1000)
                await self._identify()
            elif op == 0 and event_type == "READY":
                logger.info("Discord gateway READY")
            elif op == 0 and event_type == "MESSAGE_CREATE":
                await self._handle_message_create(payload)
            elif op == 7:
                # RECONNECT: exit loop to reconnect
                logger.info("Discord gateway requested reconnect")
                break
            elif op == 9:
                # INVALID_SESSION: reconnect
                logger.warning("Discord gateway invalid session")
                break

    async def _identify(self) -> None:
        """Send IDENTIFY payload."""
        if not self._ws:
            return

        identify = {
            "op": 2,
            "d": {
                "token": self.config.token,
                "intents": self.config.intents,
                "properties": {
                    "os": "nanobot",
                    "browser": "nanobot",
                    "device": "nanobot",
                },
            },
        }
        await self._ws.send(json.dumps(identify))

    async def _start_heartbeat(self, interval_s: float) -> None:
        """Start or restart the heartbeat loop."""
        if self._heartbeat_task:
            self._heartbeat_task.cancel()

        async def heartbeat_loop() -> None:
            while self._running and self._ws:
                payload = {"op": 1, "d": self._seq}
                try:
                    await self._ws.send(json.dumps(payload))
                except Exception as e:
                    logger.warning(f"Discord heartbeat failed: {e}")
                    break
                await asyncio.sleep(interval_s)

        self._heartbeat_task = asyncio.create_task(heartbeat_loop())

    async def _handle_message_create(self, payload: dict[str, Any]) -> None:
        """Handle incoming Discord messages."""
        author = payload.get("author") or {}
        if author.get("bot"):
            return

        sender_id = str(author.get("id", ""))
        channel_id = str(payload.get("channel_id", ""))
        content = payload.get("content") or ""

        if not sender_id or not channel_id:
            return

        if not self.is_allowed(sender_id):
            return

        content_parts = [content] if content else []
        media_paths: list[str] = []
        media_dir = Path.home() / ".nanobot" / "media"

        for attachment in payload.get("attachments") or []:
            url = attachment.get("url")
            filename = attachment.get("filename") or "attachment"
            size = attachment.get("size") or 0
            if not url or not self._http:
                continue
            if size and size > MAX_ATTACHMENT_BYTES:
                content_parts.append(f"[attachment: {filename} - too large]")
                continue
            try:
                media_dir.mkdir(parents=True, exist_ok=True)
                file_path = (
                    media_dir / f"{attachment.get('id', 'file')}_{filename.replace('/', '_')}"
                )
                resp = await self._http.get(url)
                resp.raise_for_status()
                file_path.write_bytes(resp.content)
                media_paths.append(str(file_path))
                content_parts.append(f"[attachment: {file_path}]")
            except Exception as e:
                logger.warning(f"Failed to download Discord attachment: {e}")
                content_parts.append(f"[attachment: {filename} - download failed]")

        reply_to = (payload.get("referenced_message") or {}).get("id")

        await self._start_typing(channel_id)

        await self._handle_message(
            sender_id=sender_id,
            chat_id=channel_id,
            content="\n".join(p for p in content_parts if p) or "[empty message]",
            media=media_paths,
            metadata={
                "message_id": str(payload.get("id", "")),
                "guild_id": payload.get("guild_id"),
                "reply_to": reply_to,
            },
        )

    async def _start_typing(self, channel_id: str) -> None:
        """Start periodic typing indicator for a channel."""
        await self._stop_typing(channel_id)

        async def typing_loop() -> None:
            url = f"{DISCORD_API_BASE}/channels/{channel_id}/typing"
            headers = {"Authorization": f"Bot {self.config.token}"}
            while self._running:
                try:
                    await self._http.post(url, headers=headers)
                except Exception:
                    pass
                await asyncio.sleep(8)

        self._typing_tasks[channel_id] = asyncio.create_task(typing_loop())

    async def _stop_typing(self, channel_id: str) -> None:
        """Stop typing indicator for a channel."""
        task = self._typing_tasks.pop(channel_id, None)
        if task:
            task.cancel()


================================================
FILE: nanobot/nanobot/channels/email.py
================================================
"""Email channel implementation using IMAP polling + SMTP replies."""

import asyncio
import html
import imaplib
import re
import smtplib
import ssl
from datetime import date
from email import policy
from email.header import decode_header, make_header
from email.message import EmailMessage
from email.parser import BytesParser
from email.utils import parseaddr
from typing import Any

from loguru import logger

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import EmailConfig


class EmailChannel(BaseChannel):
    """
    Email channel.

    Inbound:
    - Poll IMAP mailbox for unread messages.
    - Convert each message into an inbound event.

    Outbound:
    - Send responses via SMTP back to the sender address.
    """

    name = "email"
    _IMAP_MONTHS = (
        "Jan",
        "Feb",
        "Mar",
        "Apr",
        "May",
        "Jun",
        "Jul",
        "Aug",
        "Sep",
        "Oct",
        "Nov",
        "Dec",
    )

    def __init__(self, config: EmailConfig, bus: MessageBus):
        """Set up per-sender reply state and the UID dedupe cache.

        Args:
            config: Email channel settings.
            bus: Message bus passed through to the base channel.
        """
        super().__init__(config, bus)
        self.config: EmailConfig = config

        # UIDs already turned into inbound messages; the set is emptied once
        # it grows past _MAX_PROCESSED_UIDS so it cannot grow without bound.
        self._MAX_PROCESSED_UIDS = 100000
        self._processed_uids: set[str] = set()

        # Latest Message-ID and subject seen per sender, used to thread replies.
        self._last_message_id_by_chat: dict[str, str] = {}
        self._last_subject_by_chat: dict[str, str] = {}

    async def start(self) -> None:
        """Poll IMAP for unread mail and forward each message to the bus.

        Returns without polling when consent has not been granted or the
        configuration is incomplete. Otherwise loops until ``stop`` clears
        ``_running``, sleeping at least 5 seconds between polls.

        Failures are isolated per step: a failed fetch skips that poll, and a
        failure while handling one message is logged without dropping the
        rest of the batch. The fetch may already have marked the whole batch
        as seen, so abandoning the remaining messages would lose them.
        """
        if not self.config.consent_granted:
            logger.warning(
                "Email channel disabled: consent_granted is false. "
                "Set channels.email.consentGranted=true after explicit user permission."
            )
            return

        if not self._validate_config():
            return

        self._running = True
        logger.info("Starting Email channel (IMAP polling mode)...")

        poll_seconds = max(5, int(self.config.poll_interval_seconds))
        while self._running:
            try:
                # imaplib is blocking, so the fetch runs in a worker thread.
                inbound_items = await asyncio.to_thread(self._fetch_new_messages)
            except Exception as e:
                logger.error(f"Email polling error: {e}")
                inbound_items = []

            for item in inbound_items:
                try:
                    sender = item["sender"]
                    subject = item.get("subject", "")
                    message_id = item.get("message_id", "")

                    # Remember threading info so a later reply can reference it.
                    if subject:
                        self._last_subject_by_chat[sender] = subject
                    if message_id:
                        self._last_message_id_by_chat[sender] = message_id

                    await self._handle_message(
                        sender_id=sender,
                        chat_id=sender,
                        content=item["content"],
                        metadata=item.get("metadata", {}),
                    )
                except Exception as e:
                    logger.error(f"Email polling error: {e}")

            await asyncio.sleep(poll_seconds)

    async def stop(self) -> None:
        """Stop polling loop."""
        self._running = False

    async def send(self, msg: OutboundMessage) -> None:
        """Send email via SMTP."""
        if not self.config.consent_granted:
            logger.warning("Skip email send: consent_granted is false")
            return

        force_send = bool((msg.metadata or {}).get("force_send"))
        if not self.config.auto_reply_enabled and not force_send:
            logger.info("Skip automatic email reply: auto_reply_enabled is false")
            return

        if not self.config.smtp_host:
            logger.warning("Email channel SMTP host not configured")
            return

        to_addr = msg.chat_id.strip()
        if not to_addr:
            logger.warning("Email channel missing recipient address")
            return

        base_subject = self._last_subject_by_chat.get(to_addr, "nanobot reply")
        subject = self._reply_subject(base_subject)
        if msg.metadata and isinstance(msg.metadata.get("subject"), str):
            override = msg.metadata["subject"].strip()
            if override:
                subject = override

        email_msg = EmailMessage()
        email_msg["From"] = (
            self.config.from_address or self.config.smtp_username or self.config.imap_username
        )
        email_msg["To"] = to_addr
        email_msg["Subject"] = subject
        email_msg.set_content(msg.content or "")

        in_reply_to = self._last_message_id_by_chat.get(to_addr)
        if in_reply_to:
            email_msg["In-Reply-To"] = in_reply_to
            email_msg["References"] = in_reply_to

        try:
            await asyncio.to_thread(self._smtp_send, email_msg)
        except Exception as e:
            logger.error(f"Error sending email to {to_addr}: {e}")
            raise

    def _validate_config(self) -> bool:
        missing = []
        if not self.config.imap_host:
            missing.append("imap_host")
        if not self.config.imap_username:
            missing.append("imap_username")
        if not self.config.imap_password:
            missing.append("imap_password")
        if not self.config.smtp_host:
            missing.append("smtp_host")
        if not self.config.smtp_username:
            missing.append("smtp_username")
        if not self.config.smtp_password:
            missing.append("smtp_password")

        if missing:
            logger.error(f"Email channel not configured, missing: {', '.join(missing)}")
            return False
        return True

    def _smtp_send(self, msg: EmailMessage) -> None:
        """Deliver ``msg`` through the configured SMTP server (blocking).

        Uses implicit TLS when ``smtp_use_ssl`` is set; otherwise connects in
        plain text and upgrades with STARTTLS when ``smtp_use_tls`` is set.
        Both TLS paths use ``ssl.create_default_context()`` so the server
        certificate and hostname are verified. ``SMTP_SSL`` does not verify
        them unless a context is passed explicitly.

        Args:
            msg: Fully built message to send.
        """
        timeout = 30
        if self.config.smtp_use_ssl:
            with smtplib.SMTP_SSL(
                self.config.smtp_host,
                self.config.smtp_port,
                timeout=timeout,
                context=ssl.create_default_context(),
            ) as smtp:
                smtp.login(self.config.smtp_username, self.config.smtp_password)
                smtp.send_message(msg)
            return

        with smtplib.SMTP(self.config.smtp_host, self.config.smtp_port, timeout=timeout) as smtp:
            if self.config.smtp_use_tls:
                smtp.starttls(context=ssl.create_default_context())
            smtp.login(self.config.smtp_username, self.config.smtp_password)
            smtp.send_message(msg)

    def _fetch_new_messages(self) -> list[dict[str, Any]]:
        """Poll IMAP and return parsed unread messages."""
        return self._fetch_messages(
            search_criteria=("UNSEEN",),
            mark_seen=self.config.mark_seen,
            dedupe=True,
            limit=0,
        )

    def fetch_messages_between_dates(
        self,
        start_date: date,
        end_date: date,
        limit: int = 20,
    ) -> list[dict[str, Any]]:
        """
        Fetch messages in [start_date, end_date) by IMAP date search.

        This is used for historical summarization tasks (e.g. "yesterday").
        """
        if end_date <= start_date:
            return []

        return self._fetch_messages(
            search_criteria=(
                "SINCE",
                self._format_imap_date(start_date),
                "BEFORE",
                self._format_imap_date(end_date),
            ),
            mark_seen=False,
            dedupe=False,
            limit=max(1, int(limit)),
        )

    def _fetch_messages(
        self,
        search_criteria: tuple[str, ...],
        mark_seen: bool,
        dedupe: bool,
        limit: int,
    ) -> list[dict[str, Any]]:
        """Fetch and parse messages matching ``search_criteria`` (blocking).

        Opens a new IMAP connection, selects the configured mailbox
        (``INBOX`` by default), searches, and fetches each hit with
        ``BODY.PEEK[]`` so fetching alone does not flag it as seen. The
        connection is always logged out afterwards.

        Args:
            search_criteria: IMAP SEARCH tokens, e.g. ``("UNSEEN",)``.
            mark_seen: Add the ``\\Seen`` flag to every returned message.
            dedupe: Skip UIDs already in ``_processed_uids`` and record new ones.
            limit: Keep only the last ``limit`` search hits; ``0`` means all.

        Returns:
            One dict per message with ``sender``, ``subject``, ``message_id``,
            ``content`` and ``metadata``. Empty when select or search fails.
        """
        messages: list[dict[str, Any]] = []
        mailbox = self.config.imap_mailbox or "INBOX"
        # Without a timeout a stalled server would block the polling thread forever.
        timeout = 30

        if self.config.imap_use_ssl:
            # IMAP4_SSL does not verify the server certificate unless a
            # context is passed, so pass the verifying default context.
            client = imaplib.IMAP4_SSL(
                self.config.imap_host,
                self.config.imap_port,
                ssl_context=ssl.create_default_context(),
                timeout=timeout,
            )
        else:
            client = imaplib.IMAP4(self.config.imap_host, self.config.imap_port, timeout=timeout)

        try:
            client.login(self.config.imap_username, self.config.imap_password)
            status, _ = client.select(mailbox)
            if status != "OK":
                return messages

            status, data = client.search(None, *search_criteria)
            if status != "OK" or not data or not data[0]:
                return messages

            ids = data[0].split()
            if limit > 0 and len(ids) > limit:
                ids = ids[-limit:]
            for imap_id in ids:
                status, fetched = client.fetch(imap_id, "(BODY.PEEK[] UID)")
                if status != "OK" or not fetched:
                    continue

                raw_bytes = self._extract_message_bytes(fetched)
                if raw_bytes is None:
                    continue

                uid = self._extract_uid(fetched)
                if dedupe and uid and uid in self._processed_uids:
                    continue

                try:
                    item = self._parse_message(raw_bytes, uid)
                except Exception as e:
                    # One malformed message must not discard the messages
                    # already collected, nor block the ones after it.
                    logger.warning(f"Skipping unparseable email (uid={uid or 'unknown'}): {e}")
                    continue
                if item is None:
                    continue
                messages.append(item)

                if dedupe and uid:
                    self._processed_uids.add(uid)
                    # mark_seen is the primary dedup; this set is a safety net
                    if len(self._processed_uids) > self._MAX_PROCESSED_UIDS:
                        self._processed_uids.clear()

                if mark_seen:
                    client.store(imap_id, "+FLAGS", "\\Seen")
        finally:
            try:
                client.logout()
            except Exception:
                # Best effort: the connection may already be gone.
                pass

        return messages

    def _parse_message(self, raw_bytes: bytes, uid: str) -> dict[str, Any] | None:
        """Parse one raw RFC 822 message into an inbound item.

        Returns None when the message has no usable ``From`` address.
        """
        parsed = BytesParser(policy=policy.default).parsebytes(raw_bytes)
        sender = parseaddr(parsed.get("From", ""))[1].strip().lower()
        if not sender:
            return None

        subject = self._decode_header_value(parsed.get("Subject", ""))
        date_value = parsed.get("Date", "")
        message_id = parsed.get("Message-ID", "").strip()
        body = self._extract_text_body(parsed)

        if not body:
            body = "(empty email body)"

        body = body[: self.config.max_body_chars]
        content = (
            f"Email received.\n"
            f"From: {sender}\n"
            f"Subject: {subject}\n"
            f"Date: {date_value}\n\n"
            f"{body}"
        )

        metadata = {
            "message_id": message_id,
            "subject": subject,
            "date": date_value,
            "sender_email": sender,
            "uid": uid,
        }
        return {
            "sender": sender,
            "subject": subject,
            "message_id": message_id,
            "content": content,
            "metadata": metadata,
        }

    @classmethod
    def _format_imap_date(cls, value: date) -> str:
        """Format date for IMAP search (always English month abbreviations)."""
        month = cls._IMAP_MONTHS[value.month - 1]
        return f"{value.day:02d}-{month}-{value.year}"

    @staticmethod
    def _extract_message_bytes(fetched: list[Any]) -> bytes | None:
        for item in fetched:
            if (
                isinstance(item, tuple)
                and len(item) >= 2
                and isinstance(item[1], (bytes, bytearray))
            ):
                return bytes(item[1])
        return None

    @staticmethod
    def _extract_uid(fetched: list[Any]) -> str:
        for item in fetched:
            if isinstance(item, tuple) and item and isinstance(item[0], (bytes, bytearray)):
                head = bytes(item[0]).decode("utf-8", errors="ignore")
                m = re.search(r"UID\s+(\d+)", head)
                if m:
                    return m.group(1)
        return ""

    @staticmethod
    def _decode_header_value(value: str) -> str:
        if not value:
            return ""
        try:
            return str(make_header(decode_header(value)))
        except Exception:
            return value

    @classmethod
    def _extract_text_body(cls, msg: Any) -> str:
        """Best-effort extraction of readable body text."""
        if msg.is_multipart():
            plain_parts: list[str] = []
            html_parts: list[str] = []
            for part in msg.walk():
                if part.get_content_disposition() == "attachment":
                    continue
                content_type = part.get_content_type()
                try:
                    payload = part.get_content()
                except Exception:
                    payload_bytes = part.get_payload(decode=True) or b""
                    charset = part.get_content_charset() or "utf-8"
                    payload = payload_bytes.decode(charset, errors="replace")
                if not isinstance(payload, str):
                    continue
                if content_type == "text/plain":
                    plain_parts.append(payload)
                elif content_type == "text/html":
                    html_parts.append(payload)
            if plain_parts:
                return "\n\n".join(plain_parts).strip()
            if html_parts:
                return cls._html_to_text("\n\n".join(html_parts)).strip()
            return ""

        try:
            payload = msg.get_content()
        except Exception:
            payload_bytes = msg.get_payload(decode=True) or b""
            charset = msg.get_content_charset() or "utf-8"
            payload = payload_bytes.decode(charset, errors="replace")
        if not isinstance(payload, str):
            return ""
        if msg.get_content_type() == "text/html":
            return cls._html_to_text(payload).strip()
        return payload.strip()

    @staticmethod
    def _html_to_text(raw_html: str) -> str:
        text = re.sub(r"<\s*br\s*/?>", "\n", raw_html, flags=re.IGNORECASE)
        text = re.sub(r"<\s*/\s*p\s*>", "\n", text, flags=re.IGNORECASE)
        text = re.sub(r"<[^>]+>", "", text)
        return html.unescape(text)

    def _reply_subject(self, base_subject: str) -> str:
        subject = (base_subject or "").strip() or "nanobot reply"
        prefix = self.config.subject_prefix or "Re: "
        if subject.lower().startswith("re:"):
            return subject
        return f"{prefix}{subject}"


================================================
FILE: nanobot/nanobot/channels/feishu.py
================================================
"""Feishu/Lark channel implementation using lark-oapi SDK with WebSocket long connection."""

import asyncio
import json
import re
import threading
from collections import OrderedDict
from typing import Any

from loguru import logger

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import FeishuConfig

# Optional dependency: the Feishu SDK (lark-oapi) may not be installed.
# FEISHU_AVAILABLE records whether the import succeeded so the channel can
# refuse to start instead of failing at import time.
try:
    import lark_oapi as lark
    from lark_oapi.api.im.v1 import (
        CreateMessageReactionRequest,
        CreateMessageReactionRequestBody,
        CreateMessageRequest,
        CreateMessageRequestBody,
        Emoji,
        P2ImMessageReceiveV1,
    )

    FEISHU_AVAILABLE = True
except ImportError:
    # Only `lark` and `Emoji` get placeholders here; the other SDK names stay
    # undefined when the import fails.
    FEISHU_AVAILABLE = False
    lark = None
    Emoji = None

# Message type display mapping: placeholder text forwarded in place of the
# content for these non-text message types.
MSG_TYPE_MAP = {
    "image": "[image]",
    "audio": "[audio]",
    "file": "[file]",
    "sticker": "[sticker]",
}


class FeishuChannel(BaseChannel):
    """
    Feishu/Lark channel using WebSocket long connection.

    Uses WebSocket to receive events - no public IP or webhook required.

    Requires:
    - App ID and App Secret from Feishu Open Platform
    - Bot capability enabled
    - Event subscription enabled (im.message.receive_v1)
    """

    name = "feishu"

    def __init__(self, config: FeishuConfig, bus: MessageBus):
        """Initialise the channel; SDK clients are created later in ``start``.

        Args:
            config: Feishu channel settings.
            bus: Message bus passed through to the base channel.
        """
        super().__init__(config, bus)
        self.config: FeishuConfig = config

        # Event loop captured in start(); the websocket thread schedules
        # message handling on it.
        self._loop: asyncio.AbstractEventLoop | None = None
        # Insertion-ordered cache of handled message ids, oldest first.
        self._processed_message_ids: OrderedDict[str, None] = OrderedDict()

        # Filled in by start().
        self._ws_thread: threading.Thread | None = None
        self._ws_client: Any = None
        self._client: Any = None

    async def start(self) -> None:
        """Connect to Feishu over a websocket and block until stopped.

        Returns early, with an error log, when the SDK is not installed or
        the app credentials are missing. Otherwise this builds the API client
        used for sending, registers the message-receive handler, starts the
        SDK websocket client in a daemon thread, and then idles until
        ``stop`` clears ``_running``.
        """
        if not FEISHU_AVAILABLE:
            logger.error("Feishu SDK not installed. Run: pip install lark-oapi")
            return

        if not (self.config.app_id and self.config.app_secret):
            logger.error("Feishu app_id and app_secret not configured")
            return

        self._running = True
        # Remembered so the websocket thread can schedule coroutines on it.
        self._loop = asyncio.get_running_loop()

        # API client used for outgoing messages and reactions.
        client_builder = lark.Client.builder()
        client_builder = client_builder.app_id(self.config.app_id)
        client_builder = client_builder.app_secret(self.config.app_secret)
        client_builder = client_builder.log_level(lark.LogLevel.INFO)
        self._client = client_builder.build()

        # Dispatcher with a single registration: incoming messages.
        dispatcher_builder = lark.EventDispatcherHandler.builder(
            self.config.encrypt_key or "",
            self.config.verification_token or "",
        )
        dispatcher_builder = dispatcher_builder.register_p2_im_message_receive_v1(
            self._on_message_sync
        )
        event_handler = dispatcher_builder.build()

        # Long-connection client that delivers events to the dispatcher.
        self._ws_client = lark.ws.Client(
            self.config.app_id,
            self.config.app_secret,
            event_handler=event_handler,
            log_level=lark.LogLevel.INFO,
        )

        def run_ws():
            # Runs in the daemon thread started below.
            try:
                self._ws_client.start()
            except Exception as e:
                logger.error(f"Feishu WebSocket error: {e}")

        ws_thread = threading.Thread(target=run_ws, daemon=True)
        self._ws_thread = ws_thread
        ws_thread.start()

        logger.info("Feishu bot started with WebSocket long connection")
        logger.info("No public IP required - using WebSocket to receive events")

        # Park this coroutine until stop() is called.
        while self._running:
            await asyncio.sleep(1)

    async def stop(self) -> None:
        """Clear the running flag and try to stop the websocket client.

        An error raised while stopping the client is logged as a warning and
        not propagated.
        """
        self._running = False

        ws_client = self._ws_client
        if ws_client:
            try:
                ws_client.stop()
            except Exception as e:
                logger.warning(f"Error stopping WebSocket client: {e}")

        logger.info("Feishu bot stopped")

    def _add_reaction_sync(self, message_id: str, emoji_type: str) -> None:
        """Add an emoji reaction to a message with a blocking SDK call.

        Meant to be run off the event loop. Both an unsuccessful response and
        a raised exception are logged as warnings; nothing is raised.
        """
        try:
            emoji = Emoji.builder().emoji_type(emoji_type).build()
            body = CreateMessageReactionRequestBody.builder().reaction_type(emoji).build()
            request = (
                CreateMessageReactionRequest.builder()
                .message_id(message_id)
                .request_body(body)
                .build()
            )

            response = self._client.im.v1.message_reaction.create(request)

            if response.success():
                logger.debug(f"Added {emoji_type} reaction to message {message_id}")
            else:
                logger.warning(f"Failed to add reaction: code={response.code}, msg={response.msg}")
        except Exception as e:
            logger.warning(f"Error adding reaction: {e}")

    async def _add_reaction(self, message_id: str, emoji_type: str = "THUMBSUP") -> None:
        """
        Add a reaction emoji to a message (non-blocking).

        Common emoji types: THUMBSUP, OK, EYES, DONE, OnIt, HEART
        """
        if not self._client or not Emoji:
            return

        loop = asyncio.get_running_loop()
        await loop.run_in_executor(None, self._add_reaction_sync, message_id, emoji_type)

    # Regex to match markdown tables (header + separator + data rows)
    # Group 1 captures the whole table. In order, the three parts match:
    #   1. a header line of the form `| ... |`
    #   2. a separator line made only of `-`, `:`, `|` and whitespace
    #   3. one or more data lines of the form `| ... |`; the last may lack
    #      a trailing newline
    # MULTILINE makes `^` anchor at the start of every line.
    _TABLE_RE = re.compile(
        r"((?:^[ \t]*\|.+\|[ \t]*\n)(?:^[ \t]*\|[-:\s|]+\|[ \t]*\n)(?:^[ \t]*\|.+\|[ \t]*\n?)+)",
        re.MULTILINE,
    )

    @staticmethod
    def _split_row(row: str) -> list[str]:
        """Split a markdown table row into cells."""
        return [c.strip() for c in row.strip("|").split("|")]

    @staticmethod
    def _parse_md_table(table_text: str) -> dict | None:
        """Parse a markdown table into a Feishu table element."""
        lines = [line.strip() for line in table_text.strip().split("\n") if line.strip()]
        if len(lines) < 3:
            return None
        headers = FeishuChannel._split_row(lines[0])
        rows = [FeishuChannel._split_row(line) for line in lines[2:]]
        columns = [
            {"tag": "column", "name": f"c{i}", "display_name": h, "width": "auto"}
            for i, h in enumerate(headers)
        ]
        return {
            "tag": "table",
            "page_size": len(rows) + 1,
            "columns": columns,
            "rows": [
                {f"c{i}": r[i] if i < len(r) else "" for i in range(len(headers))} for r in rows
            ],
        }

    def _build_card_elements(self, content: str) -> list[dict]:
        """Split content into markdown + table elements for Feishu card."""
        elements, last_end = [], 0
        for m in self._TABLE_RE.finditer(content):
            before = content[last_end : m.start()].strip()
            if before:
                elements.append({"tag": "markdown", "content": before})
            elements.append(
                self._parse_md_table(m.group(1)) or {"tag": "markdown", "content": m.group(1)}
            )
            last_end = m.end()
        remaining = content[last_end:].strip()
        if remaining:
            elements.append({"tag": "markdown", "content": remaining})
        return elements or [{"tag": "markdown", "content": content}]

    async def send(self, msg: OutboundMessage) -> None:
        """Send ``msg`` to Feishu as an interactive card.

        The content is split into markdown and table elements and wrapped in
        a wide-screen card. The receiver id type is ``chat_id`` when
        ``msg.chat_id`` starts with ``oc_`` and ``open_id`` otherwise.

        The SDK's create call is synchronous, so it runs in the default
        executor, in the same way ``_add_reaction`` does, to keep the event
        loop free during the HTTP round trip. Failures are logged and not
        raised. Does nothing, apart from a warning, when the API client has
        not been created.
        """
        if not self._client:
            logger.warning("Feishu client not initialized")
            return

        try:
            # Determine receive_id_type based on chat_id format
            # open_id starts with "ou_", chat_id starts with "oc_"
            if msg.chat_id.startswith("oc_"):
                receive_id_type = "chat_id"
            else:
                receive_id_type = "open_id"

            # Build card with markdown + table support
            elements = self._build_card_elements(msg.content)
            card = {
                "config": {"wide_screen_mode": True},
                "elements": elements,
            }
            content = json.dumps(card, ensure_ascii=False)

            request = (
                CreateMessageRequest.builder()
                .receive_id_type(receive_id_type)
                .request_body(
                    CreateMessageRequestBody.builder()
                    .receive_id(msg.chat_id)
                    .msg_type("interactive")
                    .content(content)
                    .build()
                )
                .build()
            )

            # Blocking network call: hand it to a worker thread.
            loop = asyncio.get_running_loop()
            response = await loop.run_in_executor(
                None, self._client.im.v1.message.create, request
            )

            if not response.success():
                logger.error(
                    f"Failed to send Feishu message: code={response.code}, "
                    f"msg={response.msg}, log_id={response.get_log_id()}"
                )
            else:
                logger.debug(f"Feishu message sent to {msg.chat_id}")

        except Exception as e:
            logger.error(f"Error sending Feishu message: {e}")

    def _on_message_sync(self, data: "P2ImMessageReceiveV1") -> None:
        """
        Sync handler for incoming messages (called from WebSocket thread).
        Schedules async handling in the main event loop.
        """
        if self._loop and self._loop.is_running():
            asyncio.run_coroutine_threadsafe(self._on_message(data), self._loop)

    async def _on_message(self, data: "P2ImMessageReceiveV1") -> None:
        """Handle incoming message from Feishu."""
        try:
            event = data.event
            message = event.message
            sender = event.sender

            # Deduplication check
            message_id = message.message_id
            if message_id in self._processed_message_ids:
                return
            self._processed_message_ids[message_id] = None

            # Trim cache: keep most recent 500 when exceeds 1000
            while len(self._processed_message_ids) > 1000:
                self._processed_message_ids.popitem(last=False)

            # Skip bot messages
            sender_type = sender.sender_type
            if sender_type == "bot":
                return

            sender_id = sender.sender_id.open_id if sender.sender_id else "unknown"
            chat_id = message.chat_id
            chat_type = message.chat_type  # "p2p" or "group"
            msg_type = message.message_type

            # Add reaction to indicate "seen"
            await self._add_reaction(message_id, "THUMBSUP")

            # Parse message content
            if msg_type == "text":
                try:
                    content = json.loads(message.content).get("text", "")
                except json.JSONDecodeError:
                    content = message.content or ""
            else:
                content = MSG_TYPE_MAP.get(msg_type, f"[{msg_type}]")

            if not content:
                return

            # Forward to message bus
            reply_to = chat_id if chat_type == "group" else sender_id
            await self._handle_message(
                sender_id=sender_id,
                chat_id=reply_to,
                content=content,
                metadata={
                    "message_id": message_id,
                    "chat_type": chat_type,
                    "msg_type": msg_type,
                },
            )

        except Exception as e:
            logger.error(f"Error processing Feishu message: {e}")


================================================
FILE: nanobot/nanobot/channels/manager.py
================================================
"""Channel manager for coordinating chat channels."""

from __future__ import annotations

import asyncio
from typing import TYPE_CHECKING, Any

from loguru import logger

from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import Config

if TYPE_CHECKING:
    from nanobot.session.manager import SessionManager


class ChannelManager:
    """
    Coordinates the chat channels that are switched on in the configuration.

    Duties:
    - Build a channel object for each enabled integration (Telegram, WhatsApp, ...)
    - Bring channels up and take them down together
    - Deliver outbound bus messages to the channel they are addressed to
    """

    def __init__(
        self, config: Config, bus: MessageBus, session_manager: "SessionManager | None" = None
    ):
        self.config = config
        self.bus = bus
        self.session_manager = session_manager
        # Channel name -> channel object; populated by _init_channels().
        self.channels: dict[str, BaseChannel] = {}
        # Task running _dispatch_outbound(); created in start_all().
        self._dispatch_task: asyncio.Task | None = None

        self._init_channels()

    def _init_channels(self) -> None:
        """Create a channel object for every integration enabled in the config."""
        settings = self.config.channels

        if settings.telegram.enabled:
            self._try_enable("telegram", "Telegram", self._build_telegram)
        if settings.whatsapp.enabled:
            self._try_enable("whatsapp", "WhatsApp", self._build_whatsapp)
        if settings.discord.enabled:
            self._try_enable("discord", "Discord", self._build_discord)
        if settings.feishu.enabled:
            self._try_enable("feishu", "Feishu", self._build_feishu)
        if settings.dingtalk.enabled:
            self._try_enable("dingtalk", "DingTalk", self._build_dingtalk)
        if settings.email.enabled:
            self._try_enable("email", "Email", self._build_email)
        if settings.slack.enabled:
            self._try_enable("slack", "Slack", self._build_slack)
        if settings.qq.enabled:
            self._try_enable("qq", "QQ", self._build_qq)

    def _try_enable(self, key: str, label: str, build) -> None:
        """Call *build* and register its result under *key*; an ImportError only warns."""
        try:
            self.channels[key] = build()
            logger.info(f"{label} channel enabled")
        except ImportError as exc:
            logger.warning(f"{label} channel not available: {exc}")

    # The builders below import their channel module lazily, so a missing
    # optional dependency surfaces as ImportError inside _try_enable().

    def _build_telegram(self) -> BaseChannel:
        """Import and construct the Telegram channel."""
        from nanobot.channels.telegram import TelegramChannel

        return TelegramChannel(
            self.config.channels.telegram,
            self.bus,
            groq_api_key=self.config.providers.groq.api_key,
            session_manager=self.session_manager,
        )

    def _build_whatsapp(self) -> BaseChannel:
        """Import and construct the WhatsApp channel."""
        from nanobot.channels.whatsapp import WhatsAppChannel

        return WhatsAppChannel(self.config.channels.whatsapp, self.bus)

    def _build_discord(self) -> BaseChannel:
        """Import and construct the Discord channel."""
        from nanobot.channels.discord import DiscordChannel

        return DiscordChannel(self.config.channels.discord, self.bus)

    def _build_feishu(self) -> BaseChannel:
        """Import and construct the Feishu channel."""
        from nanobot.channels.feishu import FeishuChannel

        return FeishuChannel(self.config.channels.feishu, self.bus)

    def _build_dingtalk(self) -> BaseChannel:
        """Import and construct the DingTalk channel."""
        from nanobot.channels.dingtalk import DingTalkChannel

        return DingTalkChannel(self.config.channels.dingtalk, self.bus)

    def _build_email(self) -> BaseChannel:
        """Import and construct the Email channel."""
        from nanobot.channels.email import EmailChannel

        return EmailChannel(self.config.channels.email, self.bus)

    def _build_slack(self) -> BaseChannel:
        """Import and construct the Slack channel."""
        from nanobot.channels.slack import SlackChannel

        return SlackChannel(self.config.channels.slack, self.bus)

    def _build_qq(self) -> BaseChannel:
        """Import and construct the QQ channel."""
        from nanobot.channels.qq import QQChannel

        return QQChannel(
            self.config.channels.qq,
            self.bus,
        )

    async def _start_channel(self, name: str, channel: BaseChannel) -> None:
        """Run ``channel.start()``, logging (not raising) whatever it throws."""
        try:
            await channel.start()
        except Exception as exc:
            logger.error(f"Failed to start channel {name}: {exc}")

    async def start_all(self) -> None:
        """Launch the outbound dispatcher and every registered channel."""
        if not self.channels:
            logger.warning("No channels enabled")
            return

        # The dispatcher goes first so it is already scheduled when channels start.
        self._dispatch_task = asyncio.create_task(self._dispatch_outbound())

        # One task per channel.
        startups = []
        for channel_name, channel_obj in self.channels.items():
            logger.info(f"Starting {channel_name} channel...")
            startups.append(asyncio.create_task(self._start_channel(channel_name, channel_obj)))

        # Returns only once every channel's start task has finished.
        await asyncio.gather(*startups, return_exceptions=True)

    async def stop_all(self) -> None:
        """Cancel the dispatcher and ask every channel to stop."""
        logger.info("Stopping all channels...")

        # Dispatcher first: cancel it and wait for the cancellation to land.
        dispatcher = self._dispatch_task
        if dispatcher:
            dispatcher.cancel()
            try:
                await dispatcher
            except asyncio.CancelledError:
                pass

        # Then the channels, one by one; a failure in one does not skip the rest.
        for channel_name, channel_obj in self.channels.items():
            try:
                await channel_obj.stop()
                logger.info(f"Stopped {channel_name} channel")
            except Exception as exc:
                logger.error(f"Error stopping {channel_name}: {exc}")

    async def _dispatch_outbound(self) -> None:
        """Pull outbound messages off the bus and hand each to its channel."""
        logger.info("Outbound dispatcher started")

        while True:
            try:
                msg = await asyncio.wait_for(self.bus.consume_outbound(), timeout=1.0)

                target = self.channels.get(msg.channel)
                if not target:
                    logger.warning(f"Unknown channel: {msg.channel}")
                    continue

                try:
                    await target.send(msg)
                except Exception as exc:
                    logger.error(f"Error sending to {msg.channel}: {exc}")

            except asyncio.TimeoutError:
                # Nothing arrived within the poll window; go around again.
                continue
            except asyncio.CancelledError:
                break

    def get_channel(self, name: str) -> BaseChannel | None:
        """Return the registered channel called *name*, or ``None``."""
        return self.channels.get(name)

    def get_status(self) -> dict[str, Any]:
        """Report, per registered channel, that it is enabled and whether it is running."""
        report: dict[str, Any] = {}
        for channel_name, channel_obj in self.channels.items():
            report[channel_name] = {"enabled": True, "running": channel_obj.is_running}
        return report

    @property
    def enabled_channels(self) -> list[str]:
        """Names of all registered channels."""
        return list(self.channels)


================================================
FILE: nanobot/nanobot/channels/qq.py
================================================
"""QQ channel implementation using botpy SDK."""

import asyncio
from collections import deque
from typing import TYPE_CHECKING

from loguru import logger

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import QQConfig

try:
    import botpy
    from botpy.message import C2CMessage

    QQ_AVAILABLE = True
except ImportError:
    QQ_AVAILABLE = False
    botpy = None
    C2CMessage = None

if TYPE_CHECKING:
    from botpy.message import C2CMessage


def _make_bot_class(channel: "QQChannel") -> "type[botpy.Client]":
    """Return a ``botpy.Client`` subclass whose message events feed *channel*."""
    # Built once here and shared by every instance of the returned class.
    c2c_intents = botpy.Intents(c2c_message=True)

    class _Bot(botpy.Client):
        def __init__(self):
            super().__init__(intents=c2c_intents)

        async def on_ready(self):
            logger.info(f"QQ bot ready: {self.robot.name}")

        # Both message events are relayed to the same channel handler.
        async def on_c2c_message_create(self, message: "C2CMessage"):
            await channel._on_message(message)

        async def on_direct_message_create(self, message):
            await channel._on_message(message)

    return _Bot


class QQChannel(BaseChannel):
    """QQ chat channel backed by a botpy client that runs in a background task."""

    name = "qq"

    def __init__(self, config: QQConfig, bus: MessageBus):
        super().__init__(config, bus)
        self.config: QQConfig = config
        self._client: "botpy.Client | None" = None
        # Most recent message IDs, used to drop duplicate deliveries.
        self._processed_ids: deque = deque(maxlen=1000)
        self._bot_task: asyncio.Task | None = None

    async def start(self) -> None:
        """Create the botpy client and launch it in a background task."""
        if not QQ_AVAILABLE:
            logger.error("QQ SDK not installed. Run: pip install qq-botpy")
            return

        if not (self.config.app_id and self.config.secret):
            logger.error("QQ app_id and secret not configured")
            return

        self._running = True
        self._client = _make_bot_class(self)()

        # The connection runs in its own task, so this method returns right away.
        self._bot_task = asyncio.create_task(self._run_bot())
        logger.info("QQ bot started (C2C private message)")

    async def _run_bot(self) -> None:
        """Drive the client connection; on failure log it and mark the channel stopped."""
        try:
            await self._client.start(appid=self.config.app_id, secret=self.config.secret)
        except Exception as exc:
            logger.error(f"QQ auth failed, check AppID/Secret at q.qq.com: {exc}")
            self._running = False

    async def stop(self) -> None:
        """Cancel the background bot task and wait for it to finish."""
        self._running = False
        task = self._bot_task
        if task:
            task.cancel()
            try:
                await task
            except asyncio.CancelledError:
                pass
        logger.info("QQ bot stopped")

    async def send(self, msg: OutboundMessage) -> None:
        """Post ``msg.content`` to the user identified by ``msg.chat_id``."""
        client = self._client
        if not client:
            logger.warning("QQ client not initialized")
            return
        try:
            await client.api.post_c2c_message(
                openid=msg.chat_id,
                msg_type=0,
                content=msg.content,
            )
        except Exception as exc:
            logger.error(f"Error sending QQ message: {exc}")

    async def _on_message(self, data: "C2CMessage") -> None:
        """Forward one incoming QQ message to the bus, skipping duplicates and blanks."""
        try:
            message_id = data.id

            # Drop anything already seen.
            if message_id in self._processed_ids:
                return
            self._processed_ids.append(message_id)

            author = data.author
            raw_id = getattr(author, "id", None) or getattr(author, "user_openid", "unknown")
            user_id = str(raw_id)

            content = (data.content or "").strip()
            if not content:
                return

            # The sender's ID doubles as the chat ID for the reply.
            await self._handle_message(
                sender_id=user_id,
                chat_id=user_id,
                content=content,
                metadata={"message_id": message_id},
            )
        except Exception as exc:
            logger.error(f"Error handling QQ message: {exc}")


================================================
FILE: nanobot/nanobot/channels/slack.py
================================================
"""Slack channel implementation using Socket Mode."""

import asyncio
import re

from loguru import logger
from slack_sdk.socket_mode.request import SocketModeRequest
from slack_sdk.socket_mode.response import SocketModeResponse
from slack_sdk.socket_mode.websockets import SocketModeClient
from slack_sdk.web.async_client import AsyncWebClient

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import SlackConfig


class SlackChannel(BaseChannel):
    """Slack chat channel that receives events over Socket Mode."""

    name = "slack"

    def __init__(self, config: SlackConfig, bus: MessageBus):
        super().__init__(config, bus)
        self.config: SlackConfig = config
        self._web_client: AsyncWebClient | None = None
        self._socket_client: SocketModeClient | None = None
        # Filled in by start() from auth_test(); stays None if that call fails.
        self._bot_user_id: str | None = None

    async def start(self) -> None:
        """Connect the Socket Mode client and idle until the channel is stopped."""
        if not (self.config.bot_token and self.config.app_token):
            logger.error("Slack bot/app token not configured")
            return
        if self.config.mode != "socket":
            logger.error(f"Unsupported Slack mode: {self.config.mode}")
            return

        self._running = True

        web = AsyncWebClient(token=self.config.bot_token)
        self._web_client = web
        self._socket_client = SocketModeClient(
            app_token=self.config.app_token,
            web_client=web,
        )
        self._socket_client.socket_mode_request_listeners.append(self._on_socket_request)

        # The bot's own user ID is needed to recognise and strip mentions.
        try:
            auth = await self._web_client.auth_test()
            self._bot_user_id = auth.get("user_id")
            logger.info(f"Slack bot connected as {self._bot_user_id}")
        except Exception as exc:
            logger.warning(f"Slack auth_test failed: {exc}")

        logger.info("Starting Slack Socket Mode client...")
        await self._socket_client.connect()

        # Keep this coroutine alive until stop() clears the running flag.
        while self._running:
            await asyncio.sleep(1)

    async def stop(self) -> None:
        """Clear the running flag and close the socket client, if there is one."""
        self._running = False
        if not self._socket_client:
            return
        try:
            await self._socket_client.close()
        except Exception as exc:
            logger.warning(f"Slack socket close failed: {exc}")
        self._socket_client = None

    async def send(self, msg: OutboundMessage) -> None:
        """Post ``msg.content`` to ``msg.chat_id``, threading the reply outside DMs."""
        if not self._web_client:
            logger.warning("Slack client not running")
            return
        try:
            slack_meta = (msg.metadata or {}).get("slack", {})
            thread_ts = slack_meta.get("thread_ts")
            in_dm = slack_meta.get("channel_type") == "im"
            # Threads are used only for channel/group messages, never for DMs.
            reply_thread = thread_ts if (thread_ts and not in_dm) else None
            await self._web_client.chat_postMessage(
                channel=msg.chat_id,
                text=msg.content or "",
                thread_ts=reply_thread,
            )
        except Exception as exc:
            logger.error(f"Error sending Slack message: {exc}")

    async def _on_socket_request(
        self,
        client: SocketModeClient,
        req: SocketModeRequest,
    ) -> None:
        """Acknowledge an Events API request and forward qualifying messages to the bus."""
        if req.type != "events_api":
            return

        # Ack before doing any work.
        await client.send_socket_mode_response(SocketModeResponse(envelope_id=req.envelope_id))

        event = (req.payload or {}).get("event") or {}
        event_type = event.get("type")

        # Only plain messages and app mentions are of interest.
        if event_type not in ("message", "app_mention"):
            return

        sender_id = event.get("user")
        chat_id = event.get("channel")
        bot_id = self._bot_user_id

        # Any subtype means this is not an ordinary user message.
        if event.get("subtype"):
            return
        # Never react to the bot's own messages.
        if bot_id and sender_id == bot_id:
            return

        # A channel mention arrives as both `message` and `app_mention`;
        # drop the `message` copy so it is handled once.
        text = event.get("text") or ""
        if event_type == "message" and bot_id and f"<@{bot_id}>" in text:
            return

        logger.debug(
            "Slack event: type={} subtype={} user={} channel={} channel_type={} text={}",
            event_type,
            event.get("subtype"),
            sender_id,
            chat_id,
            event.get("channel_type"),
            text[:80],
        )
        if not (sender_id and chat_id):
            return

        channel_type = event.get("channel_type") or ""

        if not self._is_allowed(sender_id, chat_id, channel_type):
            return

        outside_dm = channel_type != "im"
        if outside_dm and not self._should_respond_in_channel(event_type, text, chat_id):
            return

        text = self._strip_bot_mention(text)

        event_ts = event.get("ts")
        thread_ts = event.get("thread_ts") or event_ts

        # Best-effort :eyes: reaction on the triggering message.
        try:
            if self._web_client and event_ts:
                await self._web_client.reactions_add(
                    channel=chat_id,
                    name="eyes",
                    timestamp=event_ts,
                )
        except Exception as exc:
            logger.debug(f"Slack reactions_add failed: {exc}")

        slack_meta = {
            "event": event,
            "thread_ts": thread_ts,
            "channel_type": channel_type,
        }
        await self._handle_message(
            sender_id=sender_id,
            chat_id=chat_id,
            content=text,
            metadata={"slack": slack_meta},
        )

    def _is_allowed(self, sender_id: str, chat_id: str, channel_type: str) -> bool:
        """Apply the DM policy (for ``im``) or the group allowlist (otherwise)."""
        if channel_type == "im":
            dm = self.config.dm
            if not dm.enabled:
                return False
            return dm.policy != "allowlist" or sender_id in dm.allow_from

        # Group / channel traffic
        return (
            self.config.group_policy != "allowlist"
            or chat_id in self.config.group_allow_from
        )

    def _should_respond_in_channel(self, event_type: str, text: str, chat_id: str) -> bool:
        """Decide, from ``group_policy``, whether a non-DM message deserves a reply."""
        policy = self.config.group_policy
        if policy == "open":
            return True
        if policy == "mention":
            return event_type == "app_mention" or (
                self._bot_user_id is not None and f"<@{self._bot_user_id}>" in text
            )
        if policy == "allowlist":
            return chat_id in self.config.group_allow_from
        return False

    def _strip_bot_mention(self, text: str) -> str:
        """Remove ``<@bot-id>`` tokens (and trailing whitespace) from *text*."""
        if not text or not self._bot_user_id:
            return text
        mention = rf"<@{re.escape(self._bot_user_id)}>\s*"
        return re.sub(mention, "", text).strip()


================================================
FILE: nanobot/nanobot/channels/telegram.py
================================================
"""Telegram channel implementation using python-telegram-bot."""

from __future__ import annotations

import asyncio
import re
from typing import TYPE_CHECKING

from loguru import logger
from telegram import BotCommand, Update
from telegram.ext import Application, CommandHandler, ContextTypes, MessageHandler, filters

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import TelegramConfig

if TYPE_CHECKING:
    from nanobot.session.manager import SessionManager


def _markdown_to_telegram_html(text: str) -> str:
    """
    Convert markdown to Telegram-safe HTML.
    """
    if not text:
        return ""

    # 1. Extract and protect code blocks (preserve content from other processing)
    code_blocks: list[str] = []

    def save_code_block(m: re.Match) -> str:
        code_blocks.append(m.group(1))
        return f"\x00CB{len(code_blocks) - 1}\x00"

    text = re.sub(r"```[\w]*\n?([\s\S]*?)```", save_code_block, text)

    # 2. Extract and protect inline code
    inline_codes: list[str] = []

    def save_inline_code(m: re.Match) -> str:
        inline_codes.append(m.group(1))
        return f"\x00IC{len(inline_codes) - 1}\x00"

    text = re.sub(r"`([^`]+)`", save_inline_code, text)

    # 3. Headers # Title -> just the title text
    text = re.sub(r"^#{1,6}\s+(.+)$", r"\1", text, flags=re.MULTILINE)

    # 4. Blockquotes > text -> just the text (before HTML escaping)
    text = re.sub(r"^>\s*(.*)$", r"\1", text, flags=re.MULTILINE)

    # 5. Escape HTML special characters
    text = text.replace("&", "&amp;").replace("<", "&lt;").replace(">", "&gt;")

    # 6. Links [text](url) - must be before bold/italic to handle nested cases
    text = re.sub(r"\[([^\]]+)\]\(([^)]+)\)", r'<a href="\2">\1</a>', text)

    # 7. Bold **text** or __text__
    text = re.sub(r"\*\*(.+?)\*\*", r"<b>\1</b>", text)
    text = re.sub(r"__(.+?)__", r"<b>\1</b>", text)

    # 8. Italic _text_ (avoid matching inside words like some_var_name)
    text = re.sub(r"(?<![a-zA-Z0-9])_([^_]+)_(?![a-zA-Z0-9])", r"<i>\1</i>", text)

    # 9. Strikethrough ~~text~~
    text = re.sub(r"~~(.+?)~~", r"<s>\1</s>", text)

    # 10. Bullet lists - item -> • item
    text = re.sub(r"^[-*]\s+", "• ", text, flags=re.MULTILINE)

    # 11. Restore inline code with HTML tags
    for i, code in enumerate(inline_codes):
        # Escape HTML in code content
        escaped = code.replace("&", "&amp;").replace("<", "&lt;").replace(">", "&gt;")
        text = text.replace(f"\x00IC{i}\x00", f"<code>{escaped}</code>")

    # 12. Restore code blocks with HTML tags
    for i, code in enumerate(code_blocks):
        # Escape HTML in code content
        escaped = code.replace("&", "&amp;").replace("<", "&lt;").replace(">", "&gt;")
        text = text.replace(f"\x00CB{i}\x00", f"<pre><code>{escaped}</code></pre>")

    return text


class TelegramChannel(BaseChannel):
    """
    Telegram integration driven by long polling.

    Polling keeps the setup simple: no webhook or public IP is needed.
    """

    name = "telegram"

    # Entries published to Telegram's command menu
    BOT_COMMANDS = [
        BotCommand("start", "Start the bot"),
        BotCommand("reset", "Reset conversation history"),
        BotCommand("help", "Show available commands"),
    ]

    def __init__(
        self,
        config: TelegramConfig,
        bus: MessageBus,
        groq_api_key: str = "",
        session_manager: SessionManager | None = None,
    ):
        super().__init__(config, bus)
        self.config: TelegramConfig = config
        self.groq_api_key = groq_api_key
        self.session_manager = session_manager
        self._app: Application | None = None
        # sender_id -> chat_id of that sender's latest message
        self._chat_ids: dict[str, int] = {}
        # chat_id -> task that keeps the "typing" indicator alive
        self._typing_tasks: dict[str, asyncio.Task] = {}

    async def start(self) -> None:
        """Build the bot application, begin polling and idle until stopped."""
        token = self.config.token
        if not token:
            logger.error("Telegram bot token not configured")
            return

        self._running = True

        # Assemble the application, routing through the proxy when one is set.
        builder = Application.builder().token(token)
        proxy = self.config.proxy
        if proxy:
            builder = builder.proxy(proxy).get_updates_proxy(proxy)
        app = builder.build()
        self._app = app

        # Slash commands
        for command, callback in (
            ("start", self._on_start),
            ("reset", self._on_reset),
            ("help", self._on_help),
        ):
            app.add_handler(CommandHandler(command, callback))

        # Everything else that is text or media, but not a command
        accepted = (
            filters.TEXT
            | filters.PHOTO
            | filters.VOICE
            | filters.AUDIO
            | filters.Document.ALL
        )
        app.add_handler(MessageHandler(accepted & ~filters.COMMAND, self._on_message))

        logger.info("Starting Telegram bot (polling mode)...")

        await self._app.initialize()
        await self._app.start()

        # Identify the bot, then publish its command menu (best-effort).
        bot_info = await self._app.bot.get_me()
        logger.info(f"Telegram bot @{bot_info.username} connected")

        try:
            await self._app.bot.set_my_commands(self.BOT_COMMANDS)
            logger.debug("Telegram bot commands registered")
        except Exception as exc:
            logger.warning(f"Failed to register bot commands: {exc}")

        # drop_pending_updates discards whatever queued up while the bot was offline.
        await self._app.updater.start_polling(
            allowed_updates=["message"],
            drop_pending_updates=True,
        )

        # Stay alive until stop() clears the running flag.
        while self._running:
            await asyncio.sleep(1)

    async def stop(self) -> None:
        """Cancel typing indicators and shut the bot application down."""
        self._running = False

        # Iterate over a snapshot because _stop_typing mutates the dict.
        for chat_id in list(self._typing_tasks):
            self._stop_typing(chat_id)

        if not self._app:
            return

        logger.info("Stopping Telegram bot...")
        await self._app.updater.stop()
        await self._app.stop()
        await self._app.shutdown()
        self._app = None

    async def send(self, msg: OutboundMessage) -> None:
        """Deliver *msg* as HTML, retrying once as plain text if that fails."""
        if not self._app:
            logger.warning("Telegram bot not running")
            return

        # The reply is about to go out, so the typing indicator can stop.
        self._stop_typing(msg.chat_id)

        try:
            # Telegram chat IDs are integers
            target_chat = int(msg.chat_id)
            rendered = _markdown_to_telegram_html(msg.content)
            await self._app.bot.send_message(
                chat_id=target_chat, text=rendered, parse_mode="HTML"
            )
        except ValueError:
            logger.error(f"Invalid chat_id: {msg.chat_id}")
        except Exception as exc:
            # Second attempt: same text, no parse mode.
            logger.warning(f"HTML parse failed, falling back to plain text: {exc}")
            try:
                await self._app.bot.send_message(chat_id=int(msg.chat_id), text=msg.content)
            except Exception as retry_exc:
                logger.error(f"Error sending Telegram message: {retry_exc}")

    async def _on_start(self, update: Update, context: ContextTypes.DEFAULT_TYPE) -> None:
        """Reply to /start with a greeting."""
        if not update.message or not update.effective_user:
            return

        first_name = update.effective_user.first_name
        greeting = (
            f"👋 Hi {first_name}! I'm nanobot.\n\n"
            "Send me a message and I'll respond!\n"
            "Type /help to see available commands."
        )
        await update.message.reply_text(greeting)

    async def _on_reset(self, update: Update, context: ContextTypes.DEFAULT_TYPE) -> None:
        """Reply to /reset by wiping the chat's stored conversation."""
        if not update.message or not update.effective_user:
            return

        if self.session_manager is None:
            logger.warning("/reset called but session_manager is not available")
            await update.message.reply_text("⚠️ Session management is not available.")
            return

        session_key = f"{self.name}:{str(update.message.chat_id)}"

        session = self.session_manager.get_or_create(session_key)
        cleared = len(session.messages)
        session.clear()
        self.session_manager.save(session)

        logger.info(f"Session reset for {session_key} (cleared {cleared} messages)")
        await update.message.reply_text("🔄 Conversation history cleared. Let's start fresh!")

    async def _on_help(self, update: Update, context: ContextTypes.DEFAULT_TYPE) -> None:
        """Reply to /help with the command list."""
        if not update.message:
            return

        await update.message.reply_text(
            "🐈 <b>nanobot commands</b>\n\n"
            "/start — Start the bot\n"
            "/reset — Reset conversation history\n"
            "/help — Show this help message\n\n"
            "Just send me a text message to chat!",
            parse_mode="HTML",
        )

    async def _on_message(self, update: Update, context: ContextTypes.DEFAULT_TYPE) -> None:
        """Turn an incoming text/photo/voice/audio/document update into a bus message."""
        if not update.message or not update.effective_user:
            return

        message = update.message
        user = update.effective_user
        chat_id = message.chat_id

        # Numeric ID is the stable part; the username is appended so
        # username-based allowlists keep working.
        sender_id = f"{user.id}|{user.username}" if user.username else str(user.id)

        # Remember which chat this sender last wrote from.
        self._chat_ids[sender_id] = chat_id

        content_parts = []
        media_paths = []

        # Text and caption, whichever are present
        for piece in (message.text, message.caption):
            if piece:
                content_parts.append(piece)

        # First attachment kind present wins, checked in this order.
        media_file = None
        media_type = None
        for kind, attachment in (
            ("image", message.photo),
            ("voice", message.voice),
            ("audio", message.audio),
            ("file", message.document),
        ):
            if attachment:
                # Photos come as a list of sizes; take the last (largest) one.
                media_file = attachment[-1] if kind == "image" else attachment
                media_type = kind
                break

        if media_file and self._app:
            try:
                remote = await self._app.bot.get_file(media_file.file_id)
                ext = self._get_extension(media_type, getattr(media_file, "mime_type", None))

                # Downloads are stored under ~/.nanobot/media
                from pathlib import Path

                media_dir = Path.home() / ".nanobot" / "media"
                media_dir.mkdir(parents=True, exist_ok=True)

                file_path = media_dir / f"{media_file.file_id[:16]}{ext}"
                await remote.download_to_drive(str(file_path))

                media_paths.append(str(file_path))

                # Voice and audio are transcribed; everything else is referenced by path.
                transcription = None
                if media_type in ("voice", "audio"):
                    from nanobot.providers.transcription import GroqTranscriptionProvider

                    transcriber = GroqTranscriptionProvider(api_key=self.groq_api_key)
                    transcription = await transcriber.transcribe(file_path)

                if transcription:
                    logger.info(f"Transcribed {media_type}: {transcription[:50]}...")
                    content_parts.append(f"[transcription: {transcription}]")
                else:
                    content_parts.append(f"[{media_type}: {file_path}]")

                logger.debug(f"Downloaded {media_type} to {file_path}")
            except Exception as exc:
                logger.error(f"Failed to download media: {exc}")
                content_parts.append(f"[{media_type}: download failed]")

        if content_parts:
            content = "\n".join(content_parts)
        else:
            content = "[empty message]"

        logger.debug(f"Telegram message from {sender_id}: {content[:50]}...")

        str_chat_id = str(chat_id)

        # Show "typing..." while the message is being handled.
        self._start_typing(str_chat_id)

        details = {
            "message_id": message.message_id,
            "user_id": user.id,
            "username": user.username,
            "first_name": user.first_name,
            "is_group": message.chat.type != "private",
        }
        await self._handle_message(
            sender_id=sender_id,
            chat_id=str_chat_id,
            content=content,
            media=media_paths,
            metadata=details,
        )

    def _start_typing(self, chat_id: str) -> None:
        """Begin (or restart) the typing-indicator task for *chat_id*."""
        # Replace whatever task was already running for this chat.
        self._stop_typing(chat_id)
        self._typing_tasks[chat_id] = asyncio.create_task(self._typing_loop(chat_id))

    def _stop_typing(self, chat_id: str) -> None:
        """Forget the typing task for *chat_id* and cancel it if still running."""
        pending = self._typing_tasks.pop(chat_id, None)
        if pending and not pending.done():
            pending.cancel()

    async def _typing_loop(self, chat_id: str) -> None:
        """Send the 'typing' chat action every 4 seconds until cancelled."""
        try:
            while self._app:
                await self._app.bot.send_chat_action(chat_id=int(chat_id), action="typing")
                await asyncio.sleep(4)
        except asyncio.CancelledError:
            pass
        except Exception as exc:
            logger.debug(f"Typing indicator stopped for {chat_id}: {exc}")

    def _get_extension(self, media_type: str, mime_type: str | None) -> str:
        """Pick a file extension from the MIME type, else from the media type."""
        by_mime = {
            "image/jpeg": ".jpg",
            "image/png": ".png",
            "image/gif": ".gif",
            "audio/ogg": ".ogg",
            "audio/mpeg": ".mp3",
            "audio/mp4": ".m4a",
        }
        if mime_type and mime_type in by_mime:
            return by_mime[mime_type]

        by_kind = {"image": ".jpg", "voice": ".ogg", "audio": ".mp3", "file": ""}
        return by_kind.get(media_type, "")


================================================
FILE: nanobot/nanobot/channels/whatsapp.py
================================================
"""WhatsApp channel implementation using Node.js bridge."""

import asyncio
import json

from loguru import logger

from nanobot.bus.events import OutboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.channels.base import BaseChannel
from nanobot.config.schema import WhatsAppConfig


class WhatsAppChannel(BaseChannel):
    """
    WhatsApp channel that connects to a Node.js bridge.

    The bridge uses @whiskeysockets/baileys to handle the WhatsApp Web protocol.
    Communication between Python and Node.js is via WebSocket.
    """

    name = "whatsapp"

    def __init__(self, config: WhatsAppConfig, bus: MessageBus):
        super().__init__(config, bus)
        self.config: WhatsAppConfig = config
        self._ws = None  # active bridge WebSocket, or None while disconnected
        self._connected = False

    async def start(self) -> None:
        """Connect to the bridge and process its messages until stopped.

        Runs a reconnect loop for as long as ``self._running`` is true. Each
        time a connection ends, whether through an error or an orderly close,
        the connection state is reset and the loop waits 5 seconds before
        reconnecting. Task cancellation ends the loop.
        """
        import websockets

        bridge_url = self.config.bridge_url

        logger.info(f"Connecting to WhatsApp bridge at {bridge_url}...")

        self._running = True

        while self._running:
            try:
                async with websockets.connect(bridge_url) as ws:
                    self._ws = ws
                    self._connected = True
                    logger.info("Connected to WhatsApp bridge")

                    # Listen for messages; a failure in one message must not
                    # tear down the connection.
                    async for message in ws:
                        try:
                            await self._handle_bridge_message(message)
                        except Exception as e:
                            logger.error(f"Error handling bridge message: {e}")

                # Reaching this point means iteration ended without raising,
                # i.e. the connection was closed in an orderly way.
                if self._running:
                    logger.warning("WhatsApp bridge closed the connection")

            except asyncio.CancelledError:
                break
            except Exception as e:
                logger.warning(f"WhatsApp bridge connection error: {e}")
            finally:
                # Always drop the stale socket so send() does not try to use a
                # closed connection, regardless of how the connection ended.
                self._connected = False
                self._ws = None

            # Back off after every disconnect (clean or not) to avoid a tight
            # reconnect loop when the bridge keeps closing the connection.
            if self._running:
                logger.info("Reconnecting in 5 seconds...")
                await asyncio.sleep(5)

    async def stop(self) -> None:
        """Stop the WhatsApp channel and close the bridge connection if open."""
        self._running = False
        self._connected = False

        if self._ws:
            await self._ws.close()
            self._ws = None

    async def send(self, msg: OutboundMessage) -> None:
        """Send a text message through the bridge.

        The message is dropped with a warning when the bridge is not
        connected. Send failures are logged, not raised.
        """
        if not self._ws or not self._connected:
            logger.warning("WhatsApp bridge not connected")
            return

        try:
            payload = {"type": "send", "to": msg.chat_id, "text": msg.content}
            await self._ws.send(json.dumps(payload))
        except Exception as e:
            logger.error(f"Error sending WhatsApp message: {e}")

    async def _handle_bridge_message(self, raw: str) -> None:
        """Decode one JSON frame from the bridge and act on its ``type``.

        Handles ``message`` (forwarded to ``_handle_message``), ``status``
        (updates the connected flag), ``qr`` and ``error`` (logged only).
        Frames that are not valid JSON are logged and ignored.
        """
        try:
            data = json.loads(raw)
        except json.JSONDecodeError:
            logger.warning(f"Invalid JSON from bridge: {raw[:100]}")
            return

        msg_type = data.get("type")

        if msg_type == "message":
            # Incoming message from WhatsApp
            # Deprecated by WhatsApp: old phone-number style, typically <phone>@s.whatsapp.net
            pn = data.get("pn", "")
            # New LID style identifier
            sender = data.get("sender", "")
            content = data.get("content", "")

            # Extract just the phone number or LID (the part before "@") as sender_id
            user_id = pn if pn else sender
            sender_id = user_id.split("@")[0] if "@" in user_id else user_id
            logger.info(f"Sender {sender}")

            # Voice messages arrive as a placeholder; replace it with an explanatory note
            if content == "[Voice Message]":
                logger.info(
                    f"Voice message received from {sender_id}, but direct download from bridge is not yet supported."
                )
                content = "[Voice Message: Transcription not available for WhatsApp yet]"

            await self._handle_message(
                sender_id=sender_id,
                chat_id=sender,  # Use full LID for replies
                content=content,
                metadata={
                    "message_id": data.get("id"),
                    "timestamp": data.get("timestamp"),
                    "is_group": data.get("isGroup", False),
                },
            )

        elif msg_type == "status":
            # Connection status update
            status = data.get("status")
            logger.info(f"WhatsApp status: {status}")

            if status == "connected":
                self._connected = True
            elif status == "disconnected":
                self._connected = False

        elif msg_type == "qr":
            # QR code for authentication
            logger.info("Scan QR code in the bridge terminal to connect WhatsApp")

        elif msg_type == "error":
            logger.error(f"WhatsApp bridge error: {data.get('error')}")


================================================
FILE: nanobot/nanobot/cli/__init__.py
================================================
"""CLI module for nanobot."""


================================================
FILE: nanobot/nanobot/cli/commands.py
================================================
"""CLI commands for nanobot."""

import asyncio
import atexit
import os
import select
import signal
import sys
from pathlib import Path

import typer
from rich.console import Console
from rich.markdown import Markdown
from rich.panel import Panel
from rich.table import Table
from rich.text import Text

from nanobot import __logo__, __version__

# Root Typer application; sub-command groups are attached to it further down.
app = typer.Typer(
    name="nanobot",
    help=f"{__logo__} nanobot - Personal AI Assistant",
    no_args_is_help=True,
)

# Shared rich console used for all CLI output in this module.
console = Console()
# Inputs (compared case-insensitively) that end the interactive chat.
EXIT_COMMANDS = {"exit", "quit", "/exit", "/quit", ":q"}

# ---------------------------------------------------------------------------
# Lightweight CLI input: readline for arrow keys / history, termios for flush
# ---------------------------------------------------------------------------

# The imported readline module once line editing is enabled, else None.
_READLINE = None
# Location of the persistent CLI history file, set by _enable_line_editing().
_HISTORY_FILE: Path | None = None
# Guards against registering the atexit history hook more than once.
_HISTORY_HOOK_REGISTERED = False
# True when the readline module is backed by libedit rather than GNU readline.
_USING_LIBEDIT = False
_SAVED_TERM_ATTRS = None  # original termios settings, restored on exit


def _flush_pending_tty_input() -> None:
    """Drop unread keypresses typed while the model was generating output."""
    try:
        fd = sys.stdin.fileno()
        if not os.isatty(fd):
            return
    except Exception:
        return

    try:
        import termios

        termios.tcflush(fd, termios.TCIFLUSH)
        return
    except Exception:
        pass

    try:
        while True:
            ready, _, _ = select.select([fd], [], [], 0)
            if not ready:
                break
            if not os.read(fd, 4096):
                break
    except Exception:
        return


def _save_history() -> None:
    """Persist readline history to the history file, ignoring any failure.

    A no-op when line editing was never enabled or no history file is set.
    """
    if _READLINE is not None and _HISTORY_FILE is not None:
        try:
            _READLINE.write_history_file(str(_HISTORY_FILE))
        except Exception:
            pass


def _restore_terminal() -> None:
    """Put the terminal back into the state captured before readline ran.

    A no-op when no attributes were saved; errors while restoring are ignored.
    """
    if _SAVED_TERM_ATTRS is not None:
        try:
            import termios

            termios.tcsetattr(sys.stdin.fileno(), termios.TCSADRAIN, _SAVED_TERM_ATTRS)
        except Exception:
            pass


def _enable_line_editing() -> None:
    """Turn on readline-based editing, arrow keys, and persistent history.

    Records the current terminal attributes, makes sure the history directory
    exists, configures readline (when importable), loads existing history, and
    registers ``_save_history`` to run at interpreter exit exactly once.
    """
    global _READLINE, _HISTORY_FILE, _HISTORY_HOOK_REGISTERED, _USING_LIBEDIT, _SAVED_TERM_ATTRS

    # Capture terminal settings first, before readline can modify them.
    try:
        import termios

        _SAVED_TERM_ATTRS = termios.tcgetattr(sys.stdin.fileno())
    except Exception:
        pass

    history_path = Path.home().joinpath(".nanobot", "history", "cli_history")
    history_path.parent.mkdir(parents=True, exist_ok=True)
    _HISTORY_FILE = history_path

    try:
        import readline as rl
    except ImportError:
        # No readline on this platform: plain input() will be used.
        return

    _READLINE = rl
    _USING_LIBEDIT = "libedit" in (rl.__doc__ or "").lower()

    # libedit and GNU readline use different syntax for the tab binding.
    tab_binding = "bind ^I rl_complete" if _USING_LIBEDIT else "tab: complete"
    try:
        rl.parse_and_bind(tab_binding)
        rl.parse_and_bind("set editing-mode emacs")
    except Exception:
        pass

    try:
        rl.read_history_file(str(history_path))
    except Exception:
        pass

    if _HISTORY_HOOK_REGISTERED:
        return
    atexit.register(_save_history)
    _HISTORY_HOOK_REGISTERED = True


def _prompt_text() -> str:
    """Return the input prompt, coloured when readline is active."""
    if _READLINE is None:
        prompt = "You: "
    elif _USING_LIBEDIT:
        # libedit on macOS does not honor GNU readline non-printing markers.
        prompt = "\033[1;34mYou:\033[0m "
    else:
        # \001 / \002 wrap the escape sequences as non-printing for GNU readline.
        prompt = "\001\033[1;34m\002You:\001\033[0m\002 "
    return prompt


def _print_agent_response(response: str, render_markdown: bool) -> None:
    """Print the assistant's reply inside a titled panel, padded by blank lines.

    Args:
        response: Reply text; a falsy value is rendered as an empty string.
        render_markdown: Render the text as Markdown when true, else as plain text.
    """
    text = response or ""
    if render_markdown:
        renderable = Markdown(text)
    else:
        renderable = Text(text)

    console.print()
    panel = Panel(
        renderable,
        title=f"{__logo__} nanobot",
        title_align="left",
        border_style="cyan",
        padding=(0, 1),
    )
    console.print(panel)
    console.print()


def _is_exit_command(command: str) -> bool:
    """Tell whether ``command`` (case-insensitively) is one of the exit commands."""
    normalized = command.lower()
    return normalized in EXIT_COMMANDS


async def _read_interactive_input_async() -> str:
    """Prompt for one line of input without blocking the event loop.

    ``input()`` runs in a worker thread. End-of-input (EOF) is reported to the
    caller as ``KeyboardInterrupt``.
    """
    prompt = _prompt_text()
    try:
        line = await asyncio.to_thread(input, prompt)
    except EOFError as exc:
        raise KeyboardInterrupt from exc
    return line


def version_callback(value: bool):
    """Print the version banner and exit when the version flag is set."""
    if not value:
        return
    console.print(f"{__logo__} nanobot v{__version__}")
    raise typer.Exit()


@app.callback()
def main(
    version: bool = typer.Option(
        None,
        "--version",
        "-v",
        callback=version_callback,
        is_eager=True,
    ),
):
    """nanobot - Personal AI Assistant."""
    # Nothing to do here: --version is handled entirely by version_callback.


# ============================================================================
# Onboard / Setup
# ============================================================================


@app.command()
def onboard():
    """Initialize nanobot configuration and workspace."""
    from nanobot.config.loader import get_config_path, save_config
    from nanobot.config.schema import Config
    from nanobot.utils.helpers import get_workspace_path

    config_path = get_config_path()

    # An existing config is only replaced after explicit confirmation.
    if config_path.exists():
        console.print(f"[yellow]Config already exists at {config_path}[/yellow]")
        overwrite = typer.confirm("Overwrite?")
        if not overwrite:
            raise typer.Exit()

    # Write a default configuration.
    save_config(Config())
    console.print(f"[green]✓[/green] Created config at {config_path}")

    # Resolve the workspace and seed it with the bootstrap files.
    workspace = get_workspace_path()
    console.print(f"[green]✓[/green] Created workspace at {workspace}")
    _create_workspace_templates(workspace)

    closing_lines = (
        f"\n{__logo__} nanobot is ready!",
        "\nNext steps:",
        "  1. Add your API key to [cyan]~/.nanobot/config.json[/cyan]",
        "     Get one at: https://openrouter.ai/keys",
        '  2. Chat: [cyan]nanobot agent -m "Hello!"[/cyan]',
        "\n[dim]Want Telegram/WhatsApp? See: https://github.com/HKUDS/nanobot#-chat-apps[/dim]",
    )
    for line in closing_lines:
        console.print(line)

def _create_workspace_templates(workspace: Path):
    """Create default workspace template files."""
    templates = {
        "AGENTS.md": """# Agent Instructions

You are a helpful AI assistant. Be concise, accurate, and friendly.

## Guidelines

- Always explain what you're doing before taking actions
- Ask for clarification when the request is ambiguous
- Use tools to help accomplish tasks
- Remember important information in your memory files
""",
        "SOUL.md": """# Soul

I am nanobot, a lightweight AI assistant.

## Personality

- Helpful and friendly
- Concise and to the point
- Curious and eager to learn

## Values

- Accuracy over speed
- User privacy and safety
- Transparency in actions
""",
        "USER.md": """# User

Information about the user goes here.

## Preferences

- Communication style: (casual/formal)
- Timezone: (your timezone)
- Language: (your preferred language)
""",
    }

    for filename, content in templates.items():
        file_path = workspace / filename
        if not file_path.exists():
            file_path.write_text(content)
            console.print(f"  [dim]Created {filename}[/dim]")

    # Create memory directory and MEMORY.md
    memory_dir = workspace / "memory"
    memory_dir.mkdir(exist_ok=True)
    memory_file = memory_dir / "MEMORY.md"
    if not memory_file.exists():
        memory_file.write_text("""# Long-term Memory

This file stores important information that should persist across sessions.

## User Information

(Important facts about the user)

## Preferences

(User preferences learned over time)

## Important Notes

(Things to remember)
""")
        console.print("  [dim]Created memory/MEMORY.md[/dim]")


def _make_provider(config):
    """Build a ``LiteLLMProvider`` from the loaded configuration.

    Exits the CLI with status 1 when no API key is configured, unless the
    default model name starts with ``bedrock/``.
    """
    from nanobot.providers.litellm_provider import LiteLLMProvider

    provider_cfg = config.get_provider()
    model = config.agents.defaults.model

    has_key = bool(provider_cfg and provider_cfg.api_key)
    if not has_key and not model.startswith("bedrock/"):
        console.print("[red]Error: No API key configured.[/red]")
        console.print("Set one in ~/.nanobot/config.json under providers section")
        raise typer.Exit(1)

    # A missing provider section is tolerated here (only reachable for bedrock models).
    return LiteLLMProvider(
        api_key=provider_cfg.api_key if provider_cfg else None,
        api_base=config.get_api_base(),
        default_model=model,
        extra_headers=provider_cfg.extra_headers if provider_cfg else None,
        provider_name=config.get_provider_name(),
    )


# ============================================================================
# Gateway / Server
# ============================================================================


@app.command()
def gateway(
    port: int = typer.Option(18790, "--port", "-p", help="Gateway port"),
    verbose: bool = typer.Option(False, "--verbose", "-v", help="Verbose output"),
):
    """Start the nanobot gateway."""
    # Wires together the message bus, agent loop, cron service, heartbeat
    # service and channel manager, then runs them until interrupted.
    # NOTE(review): within this function `port` is only echoed in the startup
    # banner; nothing here binds to it.
    from nanobot.agent.loop import AgentLoop
    from nanobot.bus.queue import MessageBus
    from nanobot.channels.manager import ChannelManager
    from nanobot.config.loader import get_data_dir, load_config
    from nanobot.cron.service import CronService
    from nanobot.cron.types import CronJob
    from nanobot.heartbeat.service import HeartbeatService
    from nanobot.session.manager import SessionManager

    if verbose:
        import logging

        logging.basicConfig(level=logging.DEBUG)

    console.print(f"{__logo__} Starting nanobot gateway on port {port}...")

    config = load_config()
    bus = MessageBus()
    provider = _make_provider(config)
    session_manager = SessionManager(config.workspace_path)

    # Create cron service first (callback set after agent creation)
    cron_store_path = get_data_dir() / "cron" / "jobs.json"
    cron = CronService(cron_store_path)

    # Create agent with cron service
    agent = AgentLoop(
        bus=bus,
        provider=provider,
        workspace=config.workspace_path,
        model=config.agents.defaults.model,
        max_iterations=config.agents.defaults.max_tool_iterations,
        brave_api_key=config.tools.web.search.api_key or None,
        exec_config=config.tools.exec,
        cron_service=cron,
        restrict_to_workspace=config.tools.restrict_to_workspace,
        session_manager=session_manager,
    )

    # Set cron callback (needs agent)
    async def on_cron_job(job: CronJob) -> str | None:
        """Execute a cron job through the agent."""
        response = await agent.process_direct(
            job.payload.message,
            session_key=f"cron:{job.id}",
            channel=job.payload.channel or "cli",
            chat_id=job.payload.to or "direct",
        )
        # Only forward the reply when delivery was requested and a recipient is set.
        if job.payload.deliver and job.payload.to:
            from nanobot.bus.events import OutboundMessage

            await bus.publish_outbound(
                OutboundMessage(
                    channel=job.payload.channel or "cli",
                    chat_id=job.payload.to,
                    content=response or "",
                )
            )
        return response

    cron.on_job = on_cron_job

    # Create heartbeat service
    async def on_heartbeat(prompt: str) -> str:
        """Execute heartbeat through the agent."""
        return await agent.process_direct(prompt, session_key="heartbeat")

    heartbeat = HeartbeatService(
        workspace=config.workspace_path,
        on_heartbeat=on_heartbeat,
        interval_s=30 * 60,  # 30 minutes
        enabled=True,
    )

    # Create channel manager
    channels = ChannelManager(config, bus, session_manager=session_manager)

    if channels.enabled_channels:
        console.print(f"[green]✓[/green] Channels enabled: {', '.join(channels.enabled_channels)}")
    else:
        console.print("[yellow]Warning: No channels enabled[/yellow]")

    cron_status = cron.status()
    if cron_status["jobs"] > 0:
        console.print(f"[green]✓[/green] Cron: {cron_status['jobs']} scheduled jobs")

    console.print("[green]✓[/green] Heartbeat: every 30m")

    async def run():
        try:
            await cron.start()
            await heartbeat.start()
            await asyncio.gather(
                agent.run(),
                channels.start_all(),
            )
        except (KeyboardInterrupt, asyncio.CancelledError):
            # asyncio.run() on Python 3.11+ turns Ctrl+C into a cancellation of
            # this task, so CancelledError must be handled as well or the
            # shutdown sequence below would never execute.
            console.print("\nShutting down...")
            heartbeat.stop()
            cron.stop()
            agent.stop()
            await channels.stop_all()

    asyncio.run(run())


# ============================================================================
# Agent Commands
# ============================================================================


@app.command()
def agent(
    message: str = typer.Option(None, "--message", "-m", help="Message to send to the agent"),
    session_id: str = typer.Option("cli:default", "--session", "-s", help="Session ID"),
    markdown: bool = typer.Option(
        True, "--markdown/--no-markdown", help="Render assistant output as Markdown"
    ),
    logs: bool = typer.Option(
        False, "--logs/--no-logs", help="Show nanobot runtime logs during chat"
    ),
):
    """Interact with the agent directly."""
    # With --message a single reply is printed; otherwise an interactive
    # chat loop runs until an exit command, Ctrl+C, or end of input.
    from loguru import logger

    from nanobot.agent.loop import AgentLoop
    from nanobot.bus.queue import MessageBus
    from nanobot.config.loader import load_config

    config = load_config()

    bus = MessageBus()
    provider = _make_provider(config)

    toggle_logging = logger.enable if logs else logger.disable
    toggle_logging("nanobot")

    agent_loop = AgentLoop(
        bus=bus,
        provider=provider,
        workspace=config.workspace_path,
        brave_api_key=config.tools.web.search.api_key or None,
        exec_config=config.tools.exec,
        restrict_to_workspace=config.tools.restrict_to_workspace,
    )

    def _thinking_ctx():
        # Spinner only when logs are hidden; with logs on, use a no-op context.
        if not logs:
            return console.status("[dim]nanobot is thinking...[/dim]", spinner="dots")
        from contextlib import nullcontext

        return nullcontext()

    if message:
        # Single message mode
        async def run_once():
            with _thinking_ctx():
                response = await agent_loop.process_direct(message, session_id)
            _print_agent_response(response, render_markdown=markdown)

        asyncio.run(run_once())
        return

    # Interactive mode
    _enable_line_editing()
    console.print(
        f"{__logo__} Interactive mode (type [bold]exit[/bold] or [bold]Ctrl+C[/bold] to quit)\n"
    )

    def _say_goodbye():
        # Shared farewell: persist history, fix the terminal, print the message.
        _save_history()
        _restore_terminal()
        console.print("\nGoodbye!")

    # input() runs in a worker thread that can't be cancelled.
    # Without this handler, asyncio.run() would hang waiting for it.
    def _exit_on_sigint(signum, frame):
        _say_goodbye()
        os._exit(0)

    signal.signal(signal.SIGINT, _exit_on_sigint)

    async def run_interactive():
        while True:
            try:
                _flush_pending_tty_input()
                user_input = await _read_interactive_input_async()
                command = user_input.strip()
                if not command:
                    continue

                if _is_exit_command(command):
                    _say_goodbye()
                    break

                with _thinking_ctx():
                    response = await agent_loop.process_direct(user_input, session_id)
                _print_agent_response(response, render_markdown=markdown)
            except (KeyboardInterrupt, EOFError):
                _say_goodbye()
                break

    asyncio.run(run_interactive())


# ============================================================================
# Channel Commands
# ============================================================================


# Sub-application holding the `nanobot channels ...` commands.
channels_app = typer.Typer(help="Manage channels")
app.add_typer(channels_app, name="channels")


@channels_app.command("status")
def channels_status():
    """Show channel status."""
    # Prints one table row per channel: name, enabled mark, configuration summary.
    from nanobot.config.loader import load_config

    config = load_config()

    table = Table(title="Channel Status")
    for header, color in (("Channel", "cyan"), ("Enabled", "green"), ("Configuration", "yellow")):
        table.add_column(header, style=color)

    def _mark(enabled) -> str:
        return "✓" if enabled else "✗"

    not_configured = "[dim]not configured[/dim]"

    wa = config.channels.whatsapp
    dc = config.channels.discord
    tg = config.channels.telegram
    slack = config.channels.slack

    # Only the first 10 characters of the Telegram token are displayed.
    tg_config = f"token: {tg.token[:10]}..." if tg.token else not_configured
    # Slack counts as configured only when both tokens are present.
    slack_config = "socket" if slack.app_token and slack.bot_token else not_configured

    rows = (
        ("WhatsApp", wa.enabled, wa.bridge_url),
        ("Discord", dc.enabled, dc.gateway_url),
        ("Telegram", tg.enabled, tg_config),
        ("Slack", slack.enabled, slack_config),
    )
    for label, enabled, detail in rows:
        table.add_row(label, _mark(enabled), detail)

    console.print(table)


def _get_bridge_dir() -> Path:
    """Get the bridge directory, setting it up if needed."""
    import shutil
    import subprocess

    # User's bridge location
    user_bridge = Path.home() / ".nanobot" / "bridge"

    # Check if already built
    if (user_bridge / "dist" / "index.js").exists():
        return user_bridge

    # Check for npm
    if not shutil.which("npm"):
        console.print("[red]npm not found. Please install Node.js >= 18.[/red]")
        raise typer.Exit(1)

    # Find source bridge: first check package data, then source dir
    pkg_bridge = Path(__file__).parent.parent / "bridge"  # nanobot/bridge (installed)
    src_bridge = Path(__file__).parent.parent.parent / "bridge"  # repo root/bridge (dev)

    source = None
    if (pkg_bridge / "package.json").exists():
        source = pkg_bridge
    elif (src_bridge / "package.json").exists():
        source = src_bridge

    if not source:
        console.print("[red]Bridge source not found.[/red]")
        console.print("Try reinstalling: pip install --force-reinstall nanobot")
        raise typer.Exit(1)

    console.print(f"{__logo__} Setting up bridge...")

    # Copy to user directory
    user_bridge.parent.mkdir(parents=True, exist_ok=True)
    if user_bridge.exists():
        shutil.rmtree(user_bridge)
    shutil.copytree(source, user_bridge, ignore=shutil.ignore_patterns("node_modules", "dist"))

    # Install and build
    try:
        console.print("  Installing dependencies...")
        subprocess.run(["npm", "install"], cwd=user_bridge, check=True, capture_output=True)

        console.print("  Building...")
        subprocess.run(["npm", "run", "build"], cwd=user_bridge, check=True, capture_output=True)

        console.print("[green]✓[/green] Bridge ready\n")
    except subprocess.CalledProcessError as e:
        console.print(f"[red]Build failed: {e}[/red]")
        if e.stderr:
            console.print(f"[dim]{e.stderr.decode()[:500]}[/dim]")
        raise typer.Exit(1)

    return user_bridge


@channels_app.command("login")
def channels_login():
    """Link device via QR code."""
    # Ensures the bridge is built, then runs `npm start` in its directory in
    # the foreground so the QR code is shown in this terminal.
    import shutil
    import subprocess

    bridge_dir = _get_bridge_dir()

    console.print(f"{__logo__} Starting bridge...")
    console.print("Scan the QR code to connect.\n")

    # Prefer the resolved executable path (on Windows npm is `npm.cmd`, which
    # the bare name does not launch); fall back to "npm" so a missing install
    # still reaches the FileNotFoundError handler below.
    npm = shutil.which("npm") or "npm"

    try:
        subprocess.run([npm, "start"], cwd=bridge_dir, check=True)
    except subprocess.CalledProcessError as e:
        console.print(f"[red]Bridge failed: {e}[/red]")
    except FileNotFoundError:
        console.print("[red]npm not found. Please install Node.js.[/red]")

# ============================================================================
# Cron Commands
# ============================================================================

# Sub-application holding the `nanobot cron ...` commands.
cron_app = typer.Typer(help="Manage scheduled tasks")
app.add_typer(cron_app, name="cron")


@cron_app.command("list")
def cron_list(
    all: bool = typer.Option(False, "--all", "-a", help="Include disabled jobs"),
):
    """List scheduled jobs."""
    # Renders the jobs from the cron store as a table.
    import time

    from nanobot.config.loader import get_data_dir
    from nanobot.cron.service import CronService

    service = CronService(get_data_dir() / "cron" / "jobs.json")
    jobs = service.list_jobs(include_disabled=all)

    if not jobs:
        console.print("No scheduled jobs.")
        return

    def _describe_schedule(schedule) -> str:
        # Interval in whole seconds, the raw cron expression, or "one-time".
        if schedule.kind == "every":
            return f"every {(schedule.every_ms or 0) // 1000}s"
        if schedule.kind == "cron":
            return schedule.expr or ""
        return "one-time"

    def _format_next_run(next_run_at_ms) -> str:
        # Stored in milliseconds; shown in local time, blank when unset.
        if not next_run_at_ms:
            return ""
        return time.strftime("%Y-%m-%d %H:%M", time.localtime(next_run_at_ms / 1000))

    table = Table(title="Scheduled Jobs")
    table.add_column("ID", style="cyan")
    for header in ("Name", "Schedule", "Status", "Next Run"):
        table.add_column(header)

    for job in jobs:
        sched = _describe_schedule(job.schedule)
        next_run = _format_next_run(job.state.next_run_at_ms)
        status = "[green]enabled[/green]" if job.enabled else "[dim]disabled[/dim]"
        table.add_row(job.id, job.name, sched, status, next_run)

    console.print(table)


@cron_app.command("add")
def cron_add(
    name: str = typer.Option(..., "--name", "-n", help="Job name"),
    message: str = typer.Option(..., "--message", "-m", help="Message for agent"),
    every: int = typer.Option(None, "--every", "-e", help="Run every N seconds"),
    cron_expr: str = typer.Option(None, "--cron", "-c", help="Cron expression (e.g. '0 9 * * *')"),
    at: str = typer.Option(None, "--at", help="Run once at time (ISO format)"),
    deliver: bool = typer.Option(False, "--deliver", "-d", help="Deliver response to channel"),
    to: str = typer.Option(None, "--to", help="Recipient for delivery"),
    channel: str = typer.Option(
        None, "--channel", help="Channel for delivery (e.g. 'telegram', 'whatsapp')"
    ),
):
    """Add a scheduled job."""
    # Exactly one schedule source is used, checked in this order:
    # --every, then --cron, then --at. Invalid input exits with code 1.
    from nanobot.config.loader import get_data_dir
    from nanobot.cron.service import CronService
    from nanobot.cron.types import CronSchedule

    # A negative interval would otherwise be stored as a negative every_ms.
    if every is not None and every < 0:
        console.print("[red]Error: --every must be a positive number of seconds[/red]")
        raise typer.Exit(1)

    # Determine schedule type
    if every:
        schedule = CronSchedule(kind="every", every_ms=every * 1000)
    elif cron_expr:
        schedule = CronSchedule(kind="cron", expr=cron_expr)
    elif at:
        import datetime

        # Report a malformed timestamp as a CLI error instead of a traceback.
        try:
            dt = datetime.datetime.fromisoformat(at)
        except ValueError:
            console.print(
                "[red]Error: --at must be an ISO format time, e.g. 2025-01-31T09:00:00[/red]"
            )
            raise typer.Exit(1) from None
        schedule = CronSchedule(kind="at", at_ms=int(dt.timestamp() * 1000))
    else:
        console.print("[red]Error: Must specify --every, --cron, or --at[/red]")
        raise typer.Exit(1)

    store_path = get_data_dir() / "cron" / "jobs.json"
    service = CronService(store_path)

    job = service.add_job(
        name=name,
        schedule=schedule,
        message=message,
        deliver=deliver,
        to=to,
        channel=channel,
    )

    console.print(f"[green]✓[/green] Added job '{job.name}' ({job.id})")


@cron_app.command("remove")
def cron_remove(
    job_id: str = typer.Argument(..., help="Job ID to remove"),
):
    """Remove a scheduled job."""
    from nanobot.config.loader import get_data_dir
    from nanobot.cron.service import CronService

    service = CronService(get_data_dir() / "cron" / "jobs.json")

    # remove_job's result is used as a found/removed flag.
    removed = service.remove_job(job_id)
    if not removed:
        console.print(f"[red]Job {job_id} not found[/red]")
        return
    console.print(f"[green]✓[/green] Removed job {job_id}")


@cron_app.command("enable")
def cron_enable(
    job_id: str = typer.Argument(..., help="Job ID"),
    disable: bool = typer.Option(False, "--disable", help="Disable instead of enable"),
):
    """Enable or disable a job."""
    from nanobot.config.loader import get_data_dir
    from nanobot.cron.service import CronService

    service = CronService(get_data_dir() / "cron" / "jobs.json")

    # A falsy result is reported as "job not found".
    job = service.enable_job(job_id, enabled=not disable)
    if not job:
        console.print(f"[red]Job {job_id} not found[/red]")
        return

    if disable:
        status = "disabled"
    else:
        status = "enabled"
    console.print(f"[green]✓[/green] Job '{job.name}' {status}")


@cron_app.command("run")
def cron_run(
    job_id: str = typer.Argument(..., help="Job ID to run"),
    force: bool = typer.Option(False, "--force", "-f", help="Run even if disabled"),
):
    """Manually run a job."""
    from nanobot.config.loader import get_data_dir
    from nanobot.cron.service import CronService

    service = CronService(get_data_dir() / "cron" / "jobs.json")

    async def _execute():
        return await service.run_job(job_id, force=force)

    # A truthy result from run_job is treated as success.
    succeeded = asyncio.run(_execute())
    if not succeeded:
        console.print(f"[red]Failed to run job {job_id}[/red]")
        return
    console.print("[green]✓[/green] Job executed")


# ============================================================================
# Status Commands
# ============================================================================


@app.command()
def status():
    """Show nanobot status."""
    # Reports config/workspace presence and, when a config file exists, the
    # model plus the state of each provider in the registry.
    from nanobot.config.loader import get_config_path, load_config

    ok_mark = "[green]✓[/green]"
    missing_mark = "[red]✗[/red]"
    not_set = "[dim]not set[/dim]"

    config_path = get_config_path()
    config = load_config()
    workspace = config.workspace_path

    console.print(f"{__logo__} nanobot Status\n")
    console.print(f"Config: {config_path} {ok_mark if config_path.exists() else missing_mark}")
    console.print(f"Workspace: {workspace} {ok_mark if workspace.exists() else missing_mark}")

    if not config_path.exists():
        return

    from nanobot.providers.registry import PROVIDERS

    console.print(f"Model: {config.agents.defaults.model}")

    # Check API keys from registry
    for spec in PROVIDERS:
        provider_cfg = getattr(config.providers, spec.name, None)
        if provider_cfg is None:
            continue

        if not spec.is_local:
            summary = ok_mark if bool(provider_cfg.api_key) else not_set
        elif provider_cfg.api_base:
            # Local deployments show api_base instead of api_key
            summary = f"[green]✓ {provider_cfg.api_base}[/green]"
        else:
            summary = not_set
        console.print(f"{spec.label}: {summary}")


# Run the Typer application when this module is executed as a script.
if __name__ == "__main__":
    app()


================================================
FILE: nanobot/nanobot/config/__init__.py
================================================
"""Configuration module for nanobot."""

from nanobot.config.loader import get_config_path, load_config
from nanobot.config.schema import Config

# Names re-exported as the public interface of the config package.
__all__ = ["Config", "load_config", "get_config_path"]


================================================
FILE: nanobot/nanobot/config/loader.py
================================================
"""Configuration loading utilities."""

import json
from pathlib import Path
from typing import Any

from nanobot.config.schema import Config


def get_config_path() -> Path:
    """Return the default config file location: ``~/.nanobot/config.json``."""
    return Path.home().joinpath(".nanobot", "config.json")


def get_data_dir() -> Path:
    """Return the nanobot data directory as reported by ``get_data_path``."""
    # Imported lazily, exactly as before, so importing this module does not
    # pull in the helpers module.
    from nanobot.utils.helpers import get_data_path

    data_dir = get_data_path()
    return data_dir


def load_config(config_path: Path | None = None) -> Config:
    """
    Load configuration from file or create default.

    The file is parsed as UTF-8 JSON, passed through ``_migrate_config``,
    has its camelCase keys converted to snake_case, and is then validated
    into a ``Config``. If the file exists but cannot be decoded, parsed or
    validated, a warning is printed and the default configuration is
    returned instead.

    Args:
        config_path: Optional path to config file. Uses default if not provided.

    Returns:
        Loaded configuration object, or ``Config()`` when the file is
        missing or invalid.
    """
    path = config_path or get_config_path()

    if path.exists():
        try:
            # JSON text is UTF-8; do not depend on the platform's locale
            # encoding (which is not UTF-8 on many Windows setups).
            with open(path, encoding="utf-8") as f:
                data = json.load(f)
            # The migration step expects a JSON object; report anything else
            # through the normal "invalid config" path instead of crashing
            # with an AttributeError.
            if not isinstance(data, dict):
                raise ValueError(
                    f"top-level JSON value must be an object, got {type(data).__name__}"
                )
            data = _migrate_config(data)
            return Config.model_validate(convert_keys(data))
        except (json.JSONDecodeError, ValueError) as e:
            # JSONDecodeError, UnicodeDecodeError and pydantic's
            # ValidationError are all ValueError subclasses.
            print(f"Warning: Failed to load config from {path}: {e}")
            print("Using default configuration.")

    return Config()


def save_config(config: Config, config_path: Path | None = None) -> None:
    """
    Write a configuration object to disk as indented JSON.

    The parent directory is created when missing, and keys are written in
    camelCase.

    Args:
        config: Configuration to save.
        config_path: Optional path to save to. Uses default if not provided.
    """
    target = config_path if config_path else get_config_path()
    target.parent.mkdir(parents=True, exist_ok=True)

    # Dump the model, then rename snake_case keys to camelCase for the file.
    payload = convert_to_camel(config.model_dump())

    with open(target, "w") as handle:
        json.dump(payload, handle, indent=2)


def _migrate_config(data: dict) -> dict:
    """Migrate old config formats to current.

    Currently handles one move: ``tools.exec.restrictToWorkspace`` becomes
    ``tools.restrictToWorkspace`` unless the new key is already present.
    The dict is modified in place and also returned.

    Sections that are missing or are not JSON objects (for example
    ``"tools": null``) are left untouched so that schema validation, not
    this helper, reports the malformed value.
    """
    tools = data.get("tools")
    if not isinstance(tools, dict):
        return data

    exec_cfg = tools.get("exec")
    if not isinstance(exec_cfg, dict):
        return data

    # Move tools.exec.restrictToWorkspace → tools.restrictToWorkspace
    if "restrictToWorkspace" in exec_cfg and "restrictToWorkspace" not in tools:
        tools["restrictToWorkspace"] = exec_cfg.pop("restrictToWorkspace")
    return data


def convert_keys(data: Any) -> Any:
    """Recursively rename camelCase dict keys to snake_case for Pydantic.

    Lists are walked element by element; any other value is returned
    unchanged. Every dict key at every depth is converted, including the
    keys of free-form mappings.
    """
    if isinstance(data, list):
        return [convert_keys(element) for element in data]
    if not isinstance(data, dict):
        return data

    renamed = {}
    for key, value in data.items():
        new_key = camel_to_snake(key)
        renamed[new_key] = convert_keys(value)
    return renamed


def convert_to_camel(data: Any) -> Any:
    """Recursively rename snake_case dict keys to camelCase.

    Lists are walked element by element; any other value is returned
    unchanged.
    """
    if isinstance(data, list):
        return [convert_to_camel(element) for element in data]
    if not isinstance(data, dict):
        return data

    renamed = {}
    for key, value in data.items():
        new_key = snake_to_camel(key)
        renamed[new_key] = convert_to_camel(value)
    return renamed


def camel_to_snake(name: str) -> str:
    """Convert camelCase to snake_case.

    Every uppercase character except one in first position is replaced by
    an underscore followed by its lowercase form, so consecutive capitals
    are split individually (``"APIKey"`` becomes ``"a_p_i_key"``).
    """
    pieces = [
        f"_{char.lower()}" if index and char.isupper() else char.lower()
        for index, char in enumerate(name)
    ]
    return "".join(pieces)


def snake_to_camel(name: str) -> str:
    """Convert snake_case to camelCase.

    The text before the first underscore is kept as is; each later segment
    is title-cased and appended.
    """
    head, *tail = name.split("_")
    return head + "".join(map(str.title, tail))


================================================
FILE: nanobot/nanobot/config/schema.py
================================================
"""Configuration schema using Pydantic."""

from pathlib import Path

from pydantic import BaseModel, Field
from pydantic_settings import BaseSettings


class WhatsAppConfig(BaseModel):
    """WhatsApp channel configuration.

    Disabled by default. ``bridge_url`` is a WebSocket URL (presumably the
    companion bridge process; confirm against the channel implementation).
    """

    enabled: bool = False
    bridge_url: str = "ws://localhost:3001"  # WebSocket endpoint to connect to
    allow_from: list[str] = Field(default_factory=list)  # Allowed phone numbers


class TelegramConfig(BaseModel):
    """Telegram channel configuration.

    Disabled by default; ``token`` defaults to an empty string and
    ``proxy`` to ``None``.
    """

    enabled: bool = False
    token: str = ""  # Bot token from @BotFather
    allow_from: list[str] = Field(default_factory=list)  # Allowed user IDs or usernames
    # Optional outbound proxy; None means no proxy is configured here.
    proxy: str | None = (
        None  # HTTP/SOCKS5 proxy URL, e.g. "http://127.0.0.1:7890" or "socks5://127.0.0.1:1080"
    )


class FeishuConfig(BaseModel):
    """Feishu/Lark channel configuration using WebSocket long connection.

    Disabled by default; all credential fields default to empty strings.
    """

    enabled: bool = False
    app_id: str = ""  # App ID from Feishu Open Platform
    app_secret: str = ""  # App Secret from Feishu Open Platform
    encrypt_key: str = ""  # Encrypt Key for event subscription (optional)
    verification_token: str = ""  # Verification Token for event subscription (optional)
    allow_from: list[str] = Field(default_factory=list)  # Allowed user open_ids


class DingTalkConfig(BaseModel):
    """DingTalk channel configuration using Stream mode.

    Disabled by default; credentials default to empty strings.
    """

    enabled: bool = False
    client_id: str = ""  # AppKey
    client_secret: str = ""  # AppSecret
    allow_from: list[str] = Field(default_factory=list)  # Allowed staff_ids


class DiscordConfig(BaseModel):
    """Discord channel configuration.

    Disabled by default. ``intents`` is the gateway intents bitmask; the
    default 37377 is 1 + 512 + 4096 + 32768.
    """

    enabled: bool = False
    token: str = ""  # Bot token from Discord Developer Portal
    allow_from: list[str] = Field(default_factory=list)  # Allowed user IDs
    gateway_url: str = "wss://gateway.discord.gg/?v=10&encoding=json"
    # Bit flags: GUILDS (1<<0), GUILD_MESSAGES (1<<9), DIRECT_MESSAGES (1<<12),
    # MESSAGE_CONTENT (1<<15).
    intents: int = 37377  # GUILDS + GUILD_MESSAGES + DIRECT_MESSAGES + MESSAGE_CONTENT


class EmailConfig(BaseModel):
    """Email channel configuration (IMAP inbound + SMTP outbound).

    Disabled by default, with a separate ``consent_granted`` flag next to
    ``enabled``. Hosts, usernames and passwords default to empty strings.
    """

    enabled: bool = False
    consent_granted: bool = False  # Explicit owner permission to access mailbox data

    # IMAP (receive)
    imap_host: str = ""
    imap_port: int = 993  # Conventional IMAP-over-SSL port
    imap_username: str = ""
    imap_password: str = ""
    imap_mailbox: str = "INBOX"
    imap_use_ssl: bool = True

    # SMTP (send)
    smtp_host: str = ""
    smtp_port: int = 587  # Conventional mail submission port
    smtp_username: str = ""
    smtp_password: str = ""
    smtp_use_tls: bool = True
    smtp_use_ssl: bool = False
    from_address: str = ""

    # Behavior
    auto_reply_enabled: bool = (
        True  # If false, inbound email is read but no automatic reply is sent
    )
    poll_interval_seconds: int = 30  # Seconds between mailbox polls, per the field name
    mark_seen: bool = True
    max_body_chars: int = 12000
    subject_prefix: str = "Re: "
    allow_from: list[str] = Field(default_factory=list)  # Allowed sender email addresses


class SlackDMConfig(BaseModel):
    """Slack DM policy configuration.

    Unlike the channel-level configs, ``enabled`` defaults to ``True``
    here. ``policy`` is a free-form string; the expected values are listed
    in the field comment but are not validated by this model.
    """

    enabled: bool = True
    policy: str = "open"  # "open" or "allowlist"
    allow_from: list[str] = Field(default_factory=list)  # Allowed Slack user IDs


class SlackConfig(BaseModel):
    """Slack channel configuration.

    Disabled by default. ``mode`` and ``group_policy`` are plain strings;
    the values named in the field comments are not enforced by this model.
    Direct-message behaviour is nested under ``dm``.
    """

    enabled: bool = False
    mode: str = "socket"  # "socket" supported
    webhook_path: str = "/slack/events"
    bot_token: str = ""  # xoxb-...
    app_token: str = ""  # xapp-...
    user_token_read_only: bool = True
    group_policy: str = "open"  # "open", "mention", "allowlist"
    group_allow_from: list[str] = Field(default_factory=list)  # Allowed channel IDs if allowlist
    dm: SlackDMConfig = Field(default_factory=SlackDMConfig)  # DM-specific policy


class QQConfig(BaseModel):
    """QQ channel configuration using botpy SDK.

    Disabled by default; credentials default to empty strings.
    """

    enabled: bool = False
    app_id: str = ""  # Bot ID (AppID) from q.qq.com
    secret: str = ""  # Bot secret (AppSecret) from q.qq.com
    allow_from: list[str] = Field(
        default_factory=list
    )  # Allowed user openids (empty = public access)


class ChannelsConfig(BaseModel):
    """Configuration for chat channels.

    One nested section per supported channel; each section is created with
    its own defaults when absent from the input.
    """

    whatsapp: WhatsAppConfig = Field(default_factory=WhatsAppConfig)
    telegram: TelegramConfig = Field(default_factory=TelegramConfig)
    discord: DiscordConfig = Field(default_factory=DiscordConfig)
    feishu: FeishuConfig = Field(default_factory=FeishuConfig)
    dingtalk: DingTalkConfig = Field(default_factory=DingTalkConfig)
    email: EmailConfig = Field(default_factory=EmailConfig)
    slack: SlackConfig = Field(default_factory=SlackConfig)
    qq: QQConfig = Field(default_factory=QQConfig)


class AgentDefaults(BaseModel):
    """Default agent configuration.

    ``workspace`` may start with ``~``; ``Config.workspace_path`` expands
    it. ``model`` is also the fallback model used when provider matching
    is asked about no specific model.
    """

    workspace: str = "~/.nanobot/workspace"
    model: str = "anthropic/claude-opus-4-5"
    max_tokens: int = 8192
    temperature: float = 0.7
    max_tool_iterations: int = 20


class AgentsConfig(BaseModel):
    """Agent configuration.

    Currently holds only the ``defaults`` section.
    """

    defaults: AgentDefaults = Field(default_factory=AgentDefaults)


class ProviderConfig(BaseModel):
    """LLM provider configuration.

    An empty ``api_key`` is treated as "not configured" by the provider
    matching in ``Config``.
    """

    api_key: str = ""
    api_base: str | None = None  # Optional base URL override
    extra_headers: dict[str, str] | None = None  # Custom headers (e.g. APP-Code for AiHubMix)


class ProvidersConfig(BaseModel):
    """Configuration for LLM providers.

    Attribute names are looked up dynamically by registry spec name
    (``getattr(config.providers, spec.name, None)``), so each name here
    must match the corresponding registry entry to be found.
    """

    anthropic: ProviderConfig = Field(default_factory=ProviderConfig)
    openai: ProviderConfig = Field(default_factory=ProviderConfig)
    openrouter: ProviderConfig = Field(default_factory=ProviderConfig)
    deepseek: ProviderConfig = Field(default_factory=ProviderConfig)
    groq: ProviderConfig = Field(default_factory=ProviderConfig)
    zhipu: ProviderConfig = Field(default_factory=ProviderConfig)
    dashscope: ProviderConfig = Field(default_factory=ProviderConfig)  # Alibaba Cloud Tongyi Qianwen (Qwen)
    vllm: ProviderConfig = Field(default_factory=ProviderConfig)
    gemini: ProviderConfig = Field(default_factory=ProviderConfig)
    moonshot: ProviderConfig = Field(default_factory=ProviderConfig)
    aihubmix: ProviderConfig = Field(default_factory=ProviderConfig)  # AiHubMix API gateway


class GatewayConfig(BaseModel):
    """Gateway/server configuration."""

    # NOTE(review): if this is used as a bind address, "0.0.0.0" listens on
    # every IPv4 interface, not just loopback. Confirm that is intended.
    host: str = "0.0.0.0"
    port: int = 18790


class WebSearchConfig(BaseModel):
    """Web search tool configuration.

    ``api_key`` defaults to an empty string.
    """

    api_key: str = ""  # Brave Search API key
    max_results: int = 5  # Default cap on results, per the field name


class WebToolsConfig(BaseModel):
    """Web tools configuration.

    Currently holds only the ``search`` section.
    """

    search: WebSearchConfig = Field(default_factory=WebSearchConfig)


class ExecToolConfig(BaseModel):
    """Shell exec tool configuration."""

    timeout: int = 60  # presumably seconds (TODO confirm against the exec tool)


class ToolsConfig(BaseModel):
    """Tools configuration.

    ``restrict_to_workspace`` lives at this level; the config loader
    migrates the older ``tools.exec.restrictToWorkspace`` location here.
    """

    web: WebToolsConfig = Field(default_factory=WebToolsConfig)
    exec: ExecToolConfig = Field(default_factory=ExecToolConfig)
    restrict_to_workspace: bool = False  # If true, restrict all tool access to workspace directory


class Config(BaseSettings):
    """Root configuration for nanobot.

    Aggregates the agent, channel, provider, gateway and tool sections and
    provides helpers that resolve which provider entry serves a model.

    As a ``BaseSettings`` model, values can also come from environment
    variables prefixed with ``NANOBOT_``, using ``__`` between nesting
    levels (for example ``NANOBOT_GATEWAY__PORT``).
    """

    # Settings options are declared through ``model_config``; the inner
    # ``class Config`` form is deprecated in pydantic v2, which this module
    # already targets. A plain dict is accepted here.
    model_config = {"env_prefix": "NANOBOT_", "env_nested_delimiter": "__"}

    agents: AgentsConfig = Field(default_factory=AgentsConfig)
    channels: ChannelsConfig = Field(default_factory=ChannelsConfig)
    providers: ProvidersConfig = Field(default_factory=ProvidersConfig)
    gateway: GatewayConfig = Field(default_factory=GatewayConfig)
    tools: ToolsConfig = Field(default_factory=ToolsConfig)

    @property
    def workspace_path(self) -> Path:
        """Get expanded workspace path (``~`` resolved to the home directory)."""
        return Path(self.agents.defaults.workspace).expanduser()

    def _match_provider(
        self, model: str | None = None
    ) -> tuple["ProviderConfig | None", str | None]:
        """Match provider config and its registry name.

        Args:
            model: Model identifier; the configured default model is used
                when omitted or empty.

        Returns:
            ``(config, spec_name)`` for the first registry entry that has
            an API key and whose keywords occur in the lowercased model
            name. Failing that, the first registry entry with an API key.
            ``(None, None)`` when no provider has a key.
        """
        # Imported lazily, as in the original code, instead of at module
        # import time.
        from nanobot.providers.registry import PROVIDERS

        model_lower = (model or self.agents.defaults.model).lower()

        # Match by keyword (order follows PROVIDERS registry)
        for spec in PROVIDERS:
            p = getattr(self.providers, spec.name, None)
            if p and any(kw in model_lower for kw in spec.keywords) and p.api_key:
                return p, spec.name

        # Fallback: first provider with a key, in registry order (the
        # registry is expected to list gateways first).
        for spec in PROVIDERS:
            p = getattr(self.providers, spec.name, None)
            if p and p.api_key:
                return p, spec.name
        return None, None

    def get_provider(self, model: str | None = None) -> ProviderConfig | None:
        """Get matched provider config (api_key, api_base, extra_headers). Falls back to first available."""
        p, _ = self._match_provider(model)
        return p

    def get_provider_name(self, model: str | None = None) -> str | None:
        """Get the registry name of the matched provider (e.g. "deepseek", "openrouter")."""
        _, name = self._match_provider(model)
        return name

    def get_api_key(self, model: str | None = None) -> str | None:
        """Get API key for the given model. Falls back to first available key."""
        p = self.get_provider(model)
        return p.api_key if p else None

    def get_api_base(self, model: str | None = None) -> str | None:
        """Get API base URL for the given model. Applies default URLs for known gateways.

        Returns the matched provider's explicit ``api_base`` when set;
        otherwise the registry default for gateway providers; otherwise
        ``None``.
        """
        from nanobot.providers.registry import find_by_name

        p, name = self._match_provider(model)
        if p and p.api_base:
            return p.api_base
        # Only gateways get a default api_base here. Standard providers
        # (like Moonshot) set their base URL via env vars in _setup_env
        # to avoid polluting the global litellm.api_base.
        if name:
            spec = find_by_name(name)
            if spec and spec.is_gateway and spec.default_api_base:
                return spec.default_api_base
        return None


================================================
FILE: nanobot/nanobot/cron/__init__.py
================================================
"""Cron service for scheduled agent tasks."""

from nanobot.cron.service import CronService
from nanobot.cron.types import CronJob, CronSchedule

# Names re-exported as the public interface of the cron package.
__all__ = ["CronService", "CronJob", "CronSchedule"]


================================================
FILE: nanobot/nanobot/cron/service.py
================================================
"""Cron service for scheduling agent tasks."""

import asyncio
import json
import time
import uuid
from pathlib import Path
from typing import Any, Callable, Coroutine

from loguru import logger

from nanobot.cron.types import CronJob, CronJobState, CronPayload, CronSchedule, CronStore


def _now_ms() -> int:
    """Return the current wall-clock time as whole milliseconds since the epoch."""
    seconds = time.time()
    return int(seconds * 1000)


def _compute_next_run(schedule: CronSchedule, now_ms: int) -> int | None:
    """Compute next run time in ms.

    Args:
        schedule: The schedule to evaluate.
        now_ms: Reference time in epoch milliseconds. All three schedule
            kinds are evaluated relative to this value.

    Returns:
        Epoch milliseconds of the next run, or ``None`` when there is
        none: an "at" time that is unset or not in the future, a
        non-positive "every" interval, a missing or invalid cron
        expression, or an unknown kind.
    """
    if schedule.kind == "at":
        return schedule.at_ms if schedule.at_ms and schedule.at_ms > now_ms else None

    if schedule.kind == "every":
        if not schedule.every_ms or schedule.every_ms <= 0:
            return None
        # Next interval from now
        return now_ms + schedule.every_ms

    if schedule.kind == "cron" and schedule.expr:
        try:
            from croniter import croniter

            # Use the caller's reference time rather than a fresh clock
            # read, so the result is consistent with the other kinds.
            base_s = now_ms / 1000

            if schedule.tz:
                # Evaluate the expression in the requested timezone.
                from datetime import datetime
                from zoneinfo import ZoneInfo

                base_dt = datetime.fromtimestamp(base_s, tz=ZoneInfo(schedule.tz))
                next_dt = croniter(schedule.expr, base_dt).get_next(datetime)
                return int(next_dt.timestamp() * 1000)

            # No timezone configured: keep the historical behaviour of
            # handing croniter a plain epoch timestamp.
            return int(croniter(schedule.expr, base_s).get_next() * 1000)
        except Exception as e:
            # Still best-effort (the job simply gets no next run), but no
            # longer silent: a bad expression or timezone is reported.
            logger.warning(
                f"Cron: cannot compute next run for expr {schedule.expr!r} "
                f"(tz={schedule.tz!r}): {e}"
            )
            return None

    return None


class CronService:
    """Service for managing and executing scheduled jobs.

    Jobs live in an in-memory ``CronStore`` that is lazily loaded from, and
    written back to, the JSON file at ``store_path``. While the service is
    running, a single asyncio task sleeps until the earliest
    ``next_run_at_ms`` and then executes every due job through ``on_job``.

    The public methods may be called while a job is executing, including
    from inside the ``on_job`` callback itself. In that case the timer is
    left alone and re-armed once the current tick finishes.
    """

    def __init__(
        self,
        store_path: Path,
        on_job: Callable[[CronJob], Coroutine[Any, Any, str | None]] | None = None,
    ):
        """Create the service.

        Args:
            store_path: JSON file used to persist jobs.
            on_job: Async callback invoked with each job that runs.
        """
        self.store_path = store_path
        self.on_job = on_job  # Callback to execute job, returns response text
        self._store: CronStore | None = None
        self._timer_task: asyncio.Task | None = None
        self._running = False
        # True while _on_timer is executing due jobs. _arm_timer is a no-op
        # during that window so that a job which adds/removes/enables jobs
        # cannot cancel (or immediately re-fire) the tick it is running in.
        self._in_tick = False

    def _load_store(self) -> CronStore:
        """Load jobs from disk (once) and return the in-memory store.

        A missing file yields an empty store. A file that cannot be read or
        parsed is logged and also yields an empty store.
        """
        if self._store is not None:
            return self._store

        if self.store_path.exists():
            try:
                # The store is JSON; read it as UTF-8 regardless of locale.
                data = json.loads(self.store_path.read_text(encoding="utf-8"))
                jobs = []
                for j in data.get("jobs", []):
                    jobs.append(
                        CronJob(
                            id=j["id"],
                            name=j["name"],
                            enabled=j.get("enabled", True),
                            schedule=CronSchedule(
                                kind=j["schedule"]["kind"],
                                at_ms=j["schedule"].get("atMs"),
                                every_ms=j["schedule"].get("everyMs"),
                                expr=j["schedule"].get("expr"),
                                tz=j["schedule"].get("tz"),
                            ),
                            payload=CronPayload(
                                kind=j["payload"].get("kind", "agent_turn"),
                                message=j["payload"].get("message", ""),
                                deliver=j["payload"].get("deliver", False),
                                channel=j["payload"].get("channel"),
                                to=j["payload"].get("to"),
                            ),
                            state=CronJobState(
                                next_run_at_ms=j.get("state", {}).get("nextRunAtMs"),
                                last_run_at_ms=j.get("state", {}).get("lastRunAtMs"),
                                last_status=j.get("state", {}).get("lastStatus"),
                                last_error=j.get("state", {}).get("lastError"),
                            ),
                            created_at_ms=j.get("createdAtMs", 0),
                            updated_at_ms=j.get("updatedAtMs", 0),
                            delete_after_run=j.get("deleteAfterRun", False),
                        )
                    )
                self._store = CronStore(jobs=jobs)
            except Exception as e:
                logger.warning(f"Failed to load cron store: {e}")
                self._store = CronStore()
        else:
            self._store = CronStore()

        return self._store

    def _save_store(self) -> None:
        """Save jobs to disk as indented JSON with camelCase keys.

        Does nothing if the store has not been loaded yet.
        """
        if self._store is None:
            return

        self.store_path.parent.mkdir(parents=True, exist_ok=True)

        data = {
            "version": self._store.version,
            "jobs": [
                {
                    "id": j.id,
                    "name": j.name,
                    "enabled": j.enabled,
                    "schedule": {
                        "kind": j.schedule.kind,
                        "atMs": j.schedule.at_ms,
                        "everyMs": j.schedule.every_ms,
                        "expr": j.schedule.expr,
                        "tz": j.schedule.tz,
                    },
                    "payload": {
                        "kind": j.payload.kind,
                        "message": j.payload.message,
                        "deliver": j.payload.deliver,
                        "channel": j.payload.channel,
                        "to": j.payload.to,
                    },
                    "state": {
                        "nextRunAtMs": j.state.next_run_at_ms,
                        "lastRunAtMs": j.state.last_run_at_ms,
                        "lastStatus": j.state.last_status,
                        "lastError": j.state.last_error,
                    },
                    "createdAtMs": j.created_at_ms,
                    "updatedAtMs": j.updated_at_ms,
                    "deleteAfterRun": j.delete_after_run,
                }
                for j in self._store.jobs
            ],
        }

        self.store_path.write_text(json.dumps(data, indent=2), encoding="utf-8")

    async def start(self) -> None:
        """Start the cron service.

        Loads the store, recomputes next-run times, persists them and arms
        the timer.
        """
        self._running = True
        self._load_store()
        self._recompute_next_runs()
        self._save_store()
        self._arm_timer()
        logger.info(
            f"Cron service started with {len(self._store.jobs if self._store else [])} jobs"
        )

    def stop(self) -> None:
        """Stop the cron service and cancel the pending timer, if any."""
        self._running = False
        if self._timer_task:
            self._timer_task.cancel()
            self._timer_task = None

    def _recompute_next_runs(self) -> None:
        """Recompute next run times for all enabled jobs, relative to now."""
        if not self._store:
            return
        now = _now_ms()
        for job in self._store.jobs:
            if job.enabled:
                job.state.next_run_at_ms = _compute_next_run(job.schedule, now)

    def _get_next_wake_ms(self) -> int | None:
        """Get the earliest next run time across all enabled jobs, or None."""
        if not self._store:
            return None
        times = [
            j.state.next_run_at_ms for j in self._store.jobs if j.enabled and j.state.next_run_at_ms
        ]
        return min(times) if times else None

    def _arm_timer(self) -> None:
        """Schedule the next timer tick.

        Cancels any pending timer and, if the service is running and a job
        has a next-run time, creates a task that sleeps until then.

        While a tick is executing jobs this is a no-op, because
        ``_on_timer`` re-arms the timer when it finishes. Without that
        guard, a job whose callback ends up calling ``add_job`` /
        ``remove_job`` / ``enable_job`` would cancel the very task it is
        running in and schedule an immediate re-run of itself.
        """
        if self._in_tick:
            return

        pending = self._timer_task
        if pending is not None:
            try:
                current = asyncio.current_task()
            except RuntimeError:
                # No running event loop (plain synchronous caller).
                current = None
            # Never cancel the task we are currently executing in: it is
            # about to finish on its own.
            if pending is not current:
                pending.cancel()
            self._timer_task = None

        next_wake = self._get_next_wake_ms()
        if not next_wake or not self._running:
            return

        delay_ms = max(0, next_wake - _now_ms())
        delay_s = delay_ms / 1000

        async def tick():
            await asyncio.sleep(delay_s)
            if self._running:
                await self._on_timer()

        self._timer_task = asyncio.create_task(tick())

    async def _on_timer(self) -> None:
        """Handle timer tick - run due jobs, persist state, re-arm."""
        if not self._store:
            return

        now = _now_ms()
        due_jobs = [
            j
            for j in self._store.jobs
            if j.enabled and j.state.next_run_at_ms and now >= j.state.next_run_at_ms
        ]

        # Suppress timer re-arming for the duration of the tick; see
        # _arm_timer. The flag is reset even if a job is cancelled.
        self._in_tick = True
        try:
            for job in due_jobs:
                await self._execute_job(job)
        finally:
            self._in_tick = False

        self._save_store()
        self._arm_timer()

    async def _execute_job(self, job: CronJob) -> None:
        """Execute a single job and update its state.

        Exceptions raised by ``on_job`` are recorded on the job
        (``last_status="error"``) rather than propagated. One-shot ("at")
        jobs are afterwards deleted or disabled; other kinds get a new
        next-run time.
        """
        start_ms = _now_ms()
        logger.info(f"Cron: executing job '{job.name}' ({job.id})")

        try:
            if self.on_job:
                await self.on_job(job)

            job.state.last_status = "ok"
            job.state.last_error = None
            logger.info(f"Cron: job '{job.name}' completed")

        except Exception as e:
            job.state.last_status = "error"
            job.state.last_error = str(e)
            logger.error(f"Cron: job '{job.name}' failed: {e}")

        job.state.last_run_at_ms = start_ms
        job.updated_at_ms = _now_ms()

        # Handle one-shot jobs
        if job.schedule.kind == "at":
            if job.delete_after_run:
                self._store.jobs = [j for j in self._store.jobs if j.id != job.id]
            else:
                job.enabled = False
                job.state.next_run_at_ms = None
        else:
            # Compute next run
            job.state.next_run_at_ms = _compute_next_run(job.schedule, _now_ms())

    # ========== Public API ==========

    def list_jobs(self, include_disabled: bool = False) -> list[CronJob]:
        """List jobs sorted by next run time (jobs without one come last).

        Args:
            include_disabled: Also return disabled jobs.
        """
        store = self._load_store()
        jobs = store.jobs if include_disabled else [j for j in store.jobs if j.enabled]
        return sorted(jobs, key=lambda j: j.state.next_run_at_ms or float("inf"))

    def add_job(
        self,
        name: str,
        schedule: CronSchedule,
        message: str,
        deliver: bool = False,
        channel: str | None = None,
        to: str | None = None,
        delete_after_run: bool = False,
    ) -> CronJob:
        """Add a new enabled job, persist it and re-arm the timer.

        Returns:
            The created job; its id is the first 8 characters of a UUID4.
        """
        store = self._load_store()
        now = _now_ms()

        job = CronJob(
            id=str(uuid.uuid4())[:8],
            name=name,
            enabled=True,
            schedule=schedule,
            payload=CronPayload(
                kind="agent_turn",
                message=message,
                deliver=deliver,
                channel=channel,
                to=to,
            ),
            state=CronJobState(next_run_at_ms=_compute_next_run(schedule, now)),
            created_at_ms=now,
            updated_at_ms=now,
            delete_after_run=delete_after_run,
        )

        store.jobs.append(job)
        self._save_store()
        self._arm_timer()

        logger.info(f"Cron: added job '{name}' ({job.id})")
        return job

    def remove_job(self, job_id: str) -> bool:
        """Remove a job by ID. Returns True if a job was removed."""
        store = self._load_store()
        before = len(store.jobs)
        store.jobs = [j for j in store.jobs if j.id != job_id]
        removed = len(store.jobs) < before

        if removed:
            self._save_store()
            self._arm_timer()
            logger.info(f"Cron: removed job {job_id}")

        return removed

    def enable_job(self, job_id: str, enabled: bool = True) -> CronJob | None:
        """Enable or disable a job.

        Returns:
            The updated job, or None if no job has that ID.
        """
        store = self._load_store()
        for job in store.jobs:
            if job.id == job_id:
                job.enabled = enabled
                job.updated_at_ms = _now_ms()
                if enabled:
                    job.state.next_run_at_ms = _compute_next_run(job.schedule, _now_ms())
                else:
                    job.state.next_run_at_ms = None
                self._save_store()
                self._arm_timer()
                return job
        return None

    async def run_job(self, job_id: str, force: bool = False) -> bool:
        """Manually run a job.

        Args:
            job_id: ID of the job to run.
            force: Run the job even if it is disabled.

        Returns:
            True if the job was found and executed, False otherwise.
        """
        store = self._load_store()
        for job in store.jobs:
            if job.id == job_id:
                if not force and not job.enabled:
                    return False
                await self._execute_job(job)
                self._save_store()
                self._arm_timer()
                return True
        return False

    def status(self) -> dict:
        """Get service status: running flag, job count and next wake time."""
        store = self._load_store()
        return {
            "enabled": self._running,
            "jobs": len(store.jobs),
            "next_wake_at_ms": self._get_next_wake_ms(),
        }


================================================
FILE: nanobot/nanobot/cron/types.py
================================================
"""Cron types."""

from dataclasses import dataclass, field
from typing import Literal


@dataclass
class CronSchedule:
    """Schedule definition for a cron job.

    ``kind`` selects which of the optional fields is meaningful; the
    others are normally left as ``None``.
    """

    kind: Literal["at", "every", "cron"]
    # For "at": timestamp in ms
    at_ms: int | None = None
    # For "every": interval in ms
    every_ms: int | None = None
    # For "cron": cron expression (e.g. "0 9 * * *")
    expr: str | None = None
    # Timezone for cron expressions
    tz: str | None = None


@dataclass
class CronPayload:
    """What to do when the job runs.

    Carries the message for the job plus optional delivery routing.
    """

    kind: Literal["system_event", "agent_turn"] = "agent_turn"
    message: str = ""
    # Deliver response to channel
    deliver: bool = False
    channel: str | None = None  # e.g. "whatsapp"
    to: str | None = None  # e.g. phone number


@dataclass
class CronJobState:
    """Runtime state of a job.

    All fields start as ``None``. Timestamps are epoch milliseconds, as
    the ``_ms`` suffix indicates.
    """

    next_run_at_ms: int | None = None  # When the job is next due, if scheduled
    last_run_at_ms: int | None = None  # When the job last started running
    last_status: Literal["ok", "error", "skipped"] | None = None
    last_error: str | None = None  # Error text of the last failed run


@dataclass
class CronJob:
    """A scheduled job.

    Combines identity (``id``, ``name``), a schedule, a payload and mutable
    runtime state. Only ``id`` and ``name`` are required.
    """

    id: str
    name: str
    enabled: bool = True
    # Default is an "every" schedule with no interval set.
    schedule: CronSchedule = field(default_factory=lambda: CronSchedule(kind="every"))
    payload: CronPayload = field(default_factory=CronPayload)
    state: CronJobState = field(default_factory=CronJobState)
    created_at_ms: int = 0
    updated_at_ms: int = 0
    delete_after_run: bool = False  # Flag for removing the job once it has run


@dataclass
class CronStore:
    """Persistent store for cron jobs.

    Holds a format ``version`` number and the list of jobs.
    """

    version: int = 1
    jobs: list[CronJob] = field(default_factory=list)


================================================
FILE: nanobot/nanobot/heartbeat/__init__.py
================================================
"""Heartbeat service for periodic agent wake-ups."""

from nanobot.heartbeat.service import HeartbeatService

# Names re-exported as the public interface of the heartbeat package.
__all__ = ["HeartbeatService"]


================================================
FILE: nanobot/nanobot/heartbeat/service.py
================================================
"""Heartbeat service - periodic agent wake-up to check for tasks."""

import asyncio
from pathlib import Path
from typing import Any, Callable, Coroutine

from loguru import logger

# Default interval between heartbeats: 30 minutes, expressed in seconds.
DEFAULT_HEARTBEAT_INTERVAL_S = 30 * 60

# The prompt sent to the agent on every heartbeat. It asks for a reply of
# exactly HEARTBEAT_OK when there is nothing to do.
HEARTBEAT_PROMPT = """Read HEARTBEAT.md in your workspace (if it exists).
Follow any instructions or tasks listed there.
If nothing needs attention, reply with just: HEARTBEAT_OK"""

# Token in the agent's reply that indicates "nothing to do".
HEARTBEAT_OK_TOKEN = "HEARTBEAT_OK"


def _is_heartbeat_empty(content: str | None) -> bool:
    """Check if HEARTBEAT.md has no actionable content."""
    if not content:
        return True

    # Lines to skip: empty, headers, HTML comments, empty checkboxes
    skip_patterns = {"- [ ]", "* [ ]", "- [x]", "* [x]"}

    for line in content.split("\n"):
        line = line.strip()
        if not line or line.startswith("#") or line.startswith("<!--") or line in skip_patterns:
            continue
        return False  # Found actionable content

    return True


class HeartbeatService:
    """
    Periodic heartbeat service that wakes the agent to check for tasks.

    Every ``interval_s`` seconds the service reads HEARTBEAT.md from the
    workspace. If the file has actionable content, the heartbeat prompt is
    sent to ``on_heartbeat``; a reply containing the HEARTBEAT_OK token
    means nothing needed attention.
    """

    def __init__(
        self,
        workspace: Path,
        on_heartbeat: Callable[[str], Coroutine[Any, Any, str]] | None = None,
        interval_s: int = DEFAULT_HEARTBEAT_INTERVAL_S,
        enabled: bool = True,
    ):
        """Create the service.

        Args:
            workspace: Directory that contains HEARTBEAT.md.
            on_heartbeat: Async callback that receives the heartbeat prompt
                and returns the agent's reply.
            interval_s: Seconds between heartbeats.
            enabled: When False, ``start`` does nothing.
        """
        self.workspace = workspace
        self.on_heartbeat = on_heartbeat
        self.interval_s = interval_s
        self.enabled = enabled
        self._running = False
        self._task: asyncio.Task | None = None

    @property
    def heartbeat_file(self) -> Path:
        """Path of HEARTBEAT.md inside the workspace."""
        return self.workspace / "HEARTBEAT.md"

    def _read_heartbeat_file(self) -> str | None:
        """Read HEARTBEAT.md content.

        Returns:
            The file text, or None if the file is missing or unreadable.
        """
        path = self.heartbeat_file
        if not path.exists():
            return None
        try:
            # Markdown task files are UTF-8; do not depend on the locale
            # encoding, which would garble or reject non-ASCII tasks.
            return path.read_text(encoding="utf-8")
        except Exception as e:
            # Still best-effort, but leave a trace instead of silently
            # treating an unreadable file as "no tasks".
            logger.warning(f"Heartbeat: could not read {path}: {e}")
            return None

    async def start(self) -> None:
        """Start the heartbeat service.

        Does nothing when the service is disabled or its loop is already
        running.
        """
        if not self.enabled:
            logger.info("Heartbeat disabled")
            return

        # Avoid spawning a second loop if start() is called twice.
        if self._task is not None and not self._task.done():
            logger.debug("Heartbeat already running")
            return

        self._running = True
        self._task = asyncio.create_task(self._run_loop())
        logger.info(f"Heartbeat started (every {self.interval_s}s)")

    def stop(self) -> None:
        """Stop the heartbeat service and cancel its loop task."""
        self._running = False
        if self._task:
            self._task.cancel()
            self._task = None

    async def _run_loop(self) -> None:
        """Main heartbeat loop: sleep, tick, repeat until stopped."""
        while self._running:
            try:
                await asyncio.sleep(self.interval_s)
                if self._running:
                    await self._tick()
            except asyncio.CancelledError:
                break
            except Exception as e:
                # Keep the loop alive; one failed tick must not end it.
                logger.error(f"Heartbeat error: {e}")

    async def _tick(self) -> None:
        """Execute a single heartbeat tick."""
        content = self._read_heartbeat_file()

        # Skip if HEARTBEAT.md is empty or doesn't exist
        if _is_heartbeat_empty(content):
            logger.debug("Heartbeat: no tasks (HEARTBEAT.md empty)")
            return

        logger.info("Heartbeat: checking for tasks...")

        if self.on_heartbeat:
            try:
                response = await self.on_heartbeat(HEARTBEAT_PROMPT)

                # Compare case-insensitively and ignoring underscores, so
                # variants such as "heartbeat ok"-style replies without the
                # underscore still match. A missing reply counts as a
                # non-OK answer rather than an execution failure.
                normalized = (response or "").upper().replace("_", "")

                # Check if agent said "nothing to do"
                if HEARTBEAT_OK_TOKEN.replace("_", "") in normalized:
                    logger.info("Heartbeat: OK (no action needed)")
                else:
                    logger.info("Heartbeat: completed task")

            except Exception as e:
                logger.error(f"Heartbeat execution failed: {e}")

    async def trigger_now(self) -> str | None:
        """Manually trigger a heartbeat.

        Sends the heartbeat prompt straight to ``on_heartbeat`` without
        checking HEARTBEAT.md first.

        Returns:
            The callback's reply, or None when no callback is configured.
        """
        if self.on_heartbeat:
            return await self.on_heartbeat(HEARTBEAT_PROMPT)
        return None


================================================
FILE: nanobot/nanobot/providers/__init__.py
================================================
"""LLM provider abstraction module."""

from nanobot.providers.base import LLMProvider, LLMResponse
from nanobot.providers.litellm_provider import LiteLLMProvider

__all__ = ["LLMProvider", "LLMResponse", "LiteLLMProvider"]


================================================
FILE: nanobot/nanobot/providers/base.py
================================================
"""Base LLM provider interface."""

from abc import ABC, abstractmethod
from dataclasses import dataclass, field
from typing import Any


@dataclass
class ToolCallRequest:
    """A single tool invocation requested by the LLM.

    Attributes:
        id: Identifier of the tool call as reported by the provider.
        name: Name of the tool/function to invoke.
        arguments: Arguments for the tool, keyed by parameter name.
    """

    id: str
    name: str
    arguments: dict[str, Any]


@dataclass
class LLMResponse:
    """Provider-independent result of one chat completion.

    Attributes:
        content: Text of the reply, or None when the model produced no text.
        tool_calls: Tool invocations requested by the model (empty by default).
        finish_reason: Why generation ended; defaults to "stop".
        usage: Token counters reported by the provider (empty by default).
        reasoning_content: Optional reasoning text exposed by some models.
    """

    content: str | None
    tool_calls: list[ToolCallRequest] = field(default_factory=list)
    finish_reason: str = "stop"
    usage: dict[str, int] = field(default_factory=dict)
    reasoning_content: str | None = None  # Kimi, DeepSeek-R1 etc.

    @property
    def has_tool_calls(self) -> bool:
        """True when at least one tool call is attached to this response."""
        return bool(self.tool_calls)


class LLMProvider(ABC):
    """
    Common interface every LLM backend must implement.

    Subclasses deal with the details of a particular provider's API and
    expose the same two operations: ``chat`` and ``get_default_model``.
    """

    def __init__(self, api_key: str | None = None, api_base: str | None = None):
        """Remember the credentials/endpoint for use by the concrete provider."""
        self.api_key, self.api_base = api_key, api_base

    @abstractmethod
    async def chat(
        self,
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
        max_tokens: int = 4096,
        temperature: float = 0.7,
    ) -> LLMResponse:
        """
        Send a chat completion request.

        Args:
            messages: List of message dicts with 'role' and 'content'.
            tools: Optional list of tool definitions.
            model: Model identifier (provider-specific).
            max_tokens: Maximum tokens in response.
            temperature: Sampling temperature.

        Returns:
            LLMResponse with content and/or tool calls.
        """

    @abstractmethod
    def get_default_model(self) -> str:
        """Return the model identifier used when the caller does not pass one."""


================================================
FILE: nanobot/nanobot/providers/litellm_provider.py
================================================
"""LiteLLM provider implementation for multi-provider support."""

import json
import os
from typing import Any

import litellm
from litellm import acompletion

from nanobot.providers.base import LLMProvider, LLMResponse, ToolCallRequest
from nanobot.providers.registry import find_by_model, find_gateway


class LiteLLMProvider(LLMProvider):
    """
    Multi-provider LLM backend built on LiteLLM.

    Requests for OpenRouter, Anthropic, OpenAI, Gemini and other providers all
    go through one interface. Provider-specific behaviour (environment
    variables, model prefixes, parameter overrides) is read from the registry
    in providers/registry.py instead of being hard-coded here.
    """

    def __init__(
        self,
        api_key: str | None = None,
        api_base: str | None = None,
        default_model: str = "anthropic/claude-opus-4-5",
        extra_headers: dict[str, str] | None = None,
        provider_name: str | None = None,
    ):
        """
        Configure the provider and LiteLLM's module-level settings.

        Args:
            api_key: API key; when given, provider env vars are populated.
            api_base: Custom endpoint; when given, also set on the litellm module.
            default_model: Model used when ``chat`` is called without one.
            extra_headers: Extra HTTP headers sent with every request.
            provider_name: Config key of the provider, used for gateway detection.
        """
        super().__init__(api_key, api_base)
        self.default_model = default_model
        self.extra_headers = extra_headers if extra_headers else {}

        # provider_name (the config key) is the primary gateway/local signal;
        # api_key and api_base act as fallbacks for auto-detection.
        self._gateway = find_gateway(provider_name, api_key, api_base)

        if api_key:
            self._setup_env(api_key, api_base, default_model)

        if api_base:
            litellm.api_base = api_base

        # Keep LiteLLM quiet, and let it drop parameters a provider rejects
        # (e.g., gpt-5 rejects some params).
        litellm.suppress_debug_info = True
        litellm.drop_params = True

    def _setup_env(self, api_key: str, api_base: str | None, model: str) -> None:
        """Export the API key (and any extra variables) for the detected provider.

        The spec is the detected gateway if there is one, otherwise the
        standard provider matched from ``model``. Nothing happens when neither
        is found.
        """
        gateway = self._gateway
        spec = gateway if gateway else find_by_model(model)
        if not spec:
            return

        if gateway:
            # Gateway/local deployments take over the variable unconditionally.
            os.environ[spec.env_key] = api_key
        else:
            # Standard providers leave an already-exported key alone.
            os.environ.setdefault(spec.env_key, api_key)

        # Placeholders in env_extras values:
        #   {api_key}  -> the user's API key
        #   {api_base} -> the user's api_base, else spec.default_api_base
        base_url = api_base or spec.default_api_base
        for var_name, template in spec.env_extras:
            value = template.replace("{api_key}", api_key).replace("{api_base}", base_url)
            os.environ.setdefault(var_name, value)

    def _resolve_model(self, model: str) -> str:
        """Return ``model`` with the gateway or provider prefix LiteLLM expects."""
        gateway = self._gateway
        if not gateway:
            # Standard mode: prefix known providers unless a skip prefix is present.
            spec = find_by_model(model)
            if spec and spec.litellm_prefix:
                already_routed = model.startswith(tuple(spec.skip_prefixes))
                if not already_routed:
                    model = f"{spec.litellm_prefix}/{model}"
            return model

        # Gateway mode: only the gateway prefix applies.
        if gateway.strip_model_prefix:
            model = model.rpartition("/")[2]
        gateway_prefix = gateway.litellm_prefix
        if gateway_prefix and not model.startswith(f"{gateway_prefix}/"):
            model = f"{gateway_prefix}/{model}"
        return model

    def _apply_model_overrides(self, model: str, kwargs: dict[str, Any]) -> None:
        """Merge the first matching registry override for ``model`` into ``kwargs``.

        ``kwargs`` is modified in place; at most one override entry is applied.
        """
        spec = find_by_model(model)
        if not spec:
            return

        lowered = model.lower()
        matched = next(
            (overrides for pattern, overrides in spec.model_overrides if pattern in lowered),
            None,
        )
        if matched is not None:
            kwargs.update(matched)

    async def chat(
        self,
        messages: list[dict[str, Any]],
        tools: list[dict[str, Any]] | None = None,
        model: str | None = None,
        max_tokens: int = 4096,
        temperature: float = 0.7,
    ) -> LLMResponse:
        """
        Send a chat completion request via LiteLLM.

        Args:
            messages: List of message dicts with 'role' and 'content'.
            tools: Optional list of tool definitions in OpenAI format.
            model: Model identifier (e.g., 'anthropic/claude-sonnet-4-5').
            max_tokens: Maximum tokens in response.
            temperature: Sampling temperature.

        Returns:
            LLMResponse with content and/or tool calls. Any exception raised
            by the call or by response parsing is reported as an LLMResponse
            with ``finish_reason="error"`` instead of being raised.
        """
        resolved = self._resolve_model(model or self.default_model)

        request: dict[str, Any] = dict(
            model=resolved,
            messages=messages,
            max_tokens=max_tokens,
            temperature=temperature,
        )

        # Registry overrides (e.g. kimi-k2.5 temperature) go in before the
        # endpoint/header/tool settings below.
        self._apply_model_overrides(resolved, request)

        if self.api_base:
            request["api_base"] = self.api_base

        if self.extra_headers:
            # e.g. APP-Code for AiHubMix
            request["extra_headers"] = self.extra_headers

        if tools:
            request.update(tools=tools, tool_choice="auto")

        try:
            return self._parse_response(await acompletion(**request))
        except Exception as exc:
            # Surface the failure as content so callers can handle it gracefully.
            return LLMResponse(
                content=f"Error calling LLM: {str(exc)}",
                finish_reason="error",
            )

    def _parse_response(self, response: Any) -> LLMResponse:
        """Convert a LiteLLM response object into an LLMResponse.

        Only the first choice is used. Tool-call arguments given as a string
        are JSON-decoded; a string that is not valid JSON is kept under the
        "raw" key.
        """
        choice = response.choices[0]
        message = choice.message

        parsed_calls = []
        for call in getattr(message, "tool_calls", None) or []:
            arguments = call.function.arguments
            if isinstance(arguments, str):
                try:
                    arguments = json.loads(arguments)
                except json.JSONDecodeError:
                    arguments = {"raw": arguments}
            parsed_calls.append(
                ToolCallRequest(id=call.id, name=call.function.name, arguments=arguments)
            )

        usage = {}
        reported = getattr(response, "usage", None)
        if reported:
            usage = {
                counter: getattr(reported, counter)
                for counter in ("prompt_tokens", "completion_tokens", "total_tokens")
            }

        return LLMResponse(
            content=message.content,
            tool_calls=parsed_calls,
            finish_reason=choice.finish_reason or "stop",
            usage=usage,
            reasoning_content=getattr(message, "reasoning_content", None),
        )

    def get_default_model(self) -> str:
        """Return the model used when ``chat`` is called without ``model``."""
        return self.default_model


================================================
FILE: nanobot/nanobot/providers/registry.py
================================================
"""
Provider Registry — single source of truth for LLM provider metadata.

Adding a new provider:
  1. Add a ProviderSpec to PROVIDERS below.
  2. Add a field to ProvidersConfig in config/schema.py.
  Done. Env vars, prefixing, config matching, status display all derive from here.

Order matters — it controls match priority and fallback. Gateways first.
Every entry writes out all fields so you can copy-paste as a template.
"""

from __future__ import annotations

from dataclasses import dataclass
from typing import Any


@dataclass(frozen=True)
class ProviderSpec:
    """Immutable description of one LLM provider; PROVIDERS holds the real entries.

    env_extras values may contain these placeholders:
      {api_key}  - replaced with the user's API key
      {api_base} - replaced with api_base from config, or default_api_base
    """

    # --- identity ---
    name: str  # config field name, e.g. "dashscope"
    keywords: tuple[str, ...]  # lowercase substrings looked for in the model name
    env_key: str  # env var LiteLLM reads the key from, e.g. "DASHSCOPE_API_KEY"
    display_name: str = ""  # human-readable name for `nanobot status`

    # --- model prefixing ---
    litellm_prefix: str = ""  # "dashscope" turns the model into "dashscope/{model}"
    skip_prefixes: tuple[str, ...] = ()  # leave the model alone if it starts with one of these

    # --- additional env vars, e.g. (("ZHIPUAI_API_KEY", "{api_key}"),) ---
    env_extras: tuple[tuple[str, str], ...] = ()

    # --- gateway / local detection ---
    is_gateway: bool = False  # can route any model (OpenRouter, AiHubMix)
    is_local: bool = False  # local deployment (vLLM, Ollama)
    detect_by_key_prefix: str = ""  # api_key prefix that identifies it, e.g. "sk-or-"
    detect_by_base_keyword: str = ""  # substring of api_base that identifies it
    default_api_base: str = ""  # base URL used when config gives none

    # --- gateway behavior ---
    strip_model_prefix: bool = False  # drop "provider/" before adding litellm_prefix

    # --- per-model param overrides, e.g. (("kimi-k2.5", {"temperature": 1.0}),) ---
    model_overrides: tuple[tuple[str, dict[str, Any]], ...] = ()

    @property
    def label(self) -> str:
        """Name to show to users: display_name if set, else the title-cased name."""
        if self.display_name:
            return self.display_name
        return self.name.title()


# ---------------------------------------------------------------------------
# PROVIDERS — the registry. Order = priority. Copy any entry as template.
# ---------------------------------------------------------------------------

# Ordered registry of every known provider. The lookup helpers defined after
# this tuple (find_by_model, find_gateway, find_by_name) scan it front to back
# and return the first match, so earlier entries take precedence.
PROVIDERS: tuple[ProviderSpec, ...] = (
    # === Gateways (detected by api_key / api_base, not model name) =========
    # Gateways can route any model, so they win in fallback.
    # OpenRouter: global gateway, keys start with "sk-or-"
    ProviderSpec(
        name="openrouter",
        keywords=("openrouter",),
        env_key="OPENROUTER_API_KEY",
        display_name="OpenRouter",
        litellm_prefix="openrouter",  # claude-3 → openrouter/claude-3
        skip_prefixes=(),
        env_extras=(),
        is_gateway=True,
        is_local=False,
        detect_by_key_prefix="sk-or-",
        detect_by_base_keyword="openrouter",
        default_api_base="https://openrouter.ai/api/v1",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # AiHubMix: global gateway, OpenAI-compatible interface.
    # strip_model_prefix=True: it doesn't understand "anthropic/claude-3",
    # so we strip to bare "claude-3" then re-prefix as "openai/claude-3".
    ProviderSpec(
        name="aihubmix",
        keywords=("aihubmix",),
        env_key="OPENAI_API_KEY",  # OpenAI-compatible
        display_name="AiHubMix",
        litellm_prefix="openai",  # → openai/{model}
        skip_prefixes=(),
        env_extras=(),
        is_gateway=True,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="aihubmix",
        default_api_base="https://aihubmix.com/v1",
        strip_model_prefix=True,  # anthropic/claude-3 → claude-3 → openai/claude-3
        model_overrides=(),
    ),
    # === Standard providers (matched by model-name keywords) ===============
    # Anthropic: LiteLLM recognizes "claude-*" natively, no prefix needed.
    ProviderSpec(
        name="anthropic",
        keywords=("anthropic", "claude"),
        env_key="ANTHROPIC_API_KEY",
        display_name="Anthropic",
        litellm_prefix="",
        skip_prefixes=(),
        env_extras=(),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # OpenAI: LiteLLM recognizes "gpt-*" natively, no prefix needed.
    ProviderSpec(
        name="openai",
        keywords=("openai", "gpt"),
        env_key="OPENAI_API_KEY",
        display_name="OpenAI",
        litellm_prefix="",
        skip_prefixes=(),
        env_extras=(),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # DeepSeek: needs "deepseek/" prefix for LiteLLM routing.
    ProviderSpec(
        name="deepseek",
        keywords=("deepseek",),
        env_key="DEEPSEEK_API_KEY",
        display_name="DeepSeek",
        litellm_prefix="deepseek",  # deepseek-chat → deepseek/deepseek-chat
        skip_prefixes=("deepseek/",),  # avoid double-prefix
        env_extras=(),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # Gemini: needs "gemini/" prefix for LiteLLM.
    ProviderSpec(
        name="gemini",
        keywords=("gemini",),
        env_key="GEMINI_API_KEY",
        display_name="Gemini",
        litellm_prefix="gemini",  # gemini-pro → gemini/gemini-pro
        skip_prefixes=("gemini/",),  # avoid double-prefix
        env_extras=(),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # Zhipu: LiteLLM uses "zai/" prefix.
    # Also mirrors key to ZHIPUAI_API_KEY (some LiteLLM paths check that).
    # skip_prefixes: don't add "zai/" when already routed via gateway.
    ProviderSpec(
        name="zhipu",
        keywords=("zhipu", "glm", "zai"),
        env_key="ZAI_API_KEY",
        display_name="Zhipu AI",
        litellm_prefix="zai",  # glm-4 → zai/glm-4
        skip_prefixes=("zhipu/", "zai/", "openrouter/", "hosted_vllm/"),
        env_extras=(("ZHIPUAI_API_KEY", "{api_key}"),),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # DashScope: Qwen models, needs "dashscope/" prefix.
    ProviderSpec(
        name="dashscope",
        keywords=("qwen", "dashscope"),
        env_key="DASHSCOPE_API_KEY",
        display_name="DashScope",
        litellm_prefix="dashscope",  # qwen-max → dashscope/qwen-max
        skip_prefixes=("dashscope/", "openrouter/"),
        env_extras=(),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # Moonshot: Kimi models, needs "moonshot/" prefix.
    # LiteLLM requires MOONSHOT_API_BASE env var to find the endpoint.
    # Kimi K2.5 API enforces temperature >= 1.0.
    ProviderSpec(
        name="moonshot",
        keywords=("moonshot", "kimi"),
        env_key="MOONSHOT_API_KEY",
        display_name="Moonshot",
        litellm_prefix="moonshot",  # kimi-k2.5 → moonshot/kimi-k2.5
        skip_prefixes=("moonshot/", "openrouter/"),
        env_extras=(("MOONSHOT_API_BASE", "{api_base}"),),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="https://api.moonshot.ai/v1",  # intl; use api.moonshot.cn for China
        strip_model_prefix=False,
        model_overrides=(("kimi-k2.5", {"temperature": 1.0}),),
    ),
    # === Local deployment (matched by config key, NOT by api_base) =========
    # vLLM / any OpenAI-compatible local server.
    # Detected when config key is "vllm" (provider_name="vllm").
    ProviderSpec(
        name="vllm",
        keywords=("vllm",),
        env_key="HOSTED_VLLM_API_KEY",
        display_name="vLLM/Local",
        litellm_prefix="hosted_vllm",  # Llama-3-8B → hosted_vllm/Llama-3-8B
        skip_prefixes=(),
        env_extras=(),
        is_gateway=False,
        is_local=True,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",  # user must provide in config
        strip_model_prefix=False,
        model_overrides=(),
    ),
    # === Auxiliary (not a primary LLM provider) ============================
    # Groq: mainly used for Whisper voice transcription, also usable for LLM.
    # Needs "groq/" prefix for LiteLLM routing. Placed last — it rarely wins fallback.
    ProviderSpec(
        name="groq",
        keywords=("groq",),
        env_key="GROQ_API_KEY",
        display_name="Groq",
        litellm_prefix="groq",  # llama3-8b-8192 → groq/llama3-8b-8192
        skip_prefixes=("groq/",),  # avoid double-prefix
        env_extras=(),
        is_gateway=False,
        is_local=False,
        detect_by_key_prefix="",
        detect_by_base_keyword="",
        default_api_base="",
        strip_model_prefix=False,
        model_overrides=(),
    ),
)


# ---------------------------------------------------------------------------
# Lookup helpers
# ---------------------------------------------------------------------------


def find_by_model(model: str) -> ProviderSpec | None:
    """Return the first standard provider whose keyword occurs in ``model``.

    Matching is case-insensitive. Gateway and local specs are never returned
    here; find_gateway handles those from api_key/api_base instead. Returns
    None when no keyword matches.
    """
    needle = model.lower()
    standard_matches = (
        spec
        for spec in PROVIDERS
        if not (spec.is_gateway or spec.is_local)
        and any(keyword in needle for keyword in spec.keywords)
    )
    return next(standard_matches, None)


def find_gateway(
    provider_name: str | None = None,
    api_key: str | None = None,
    api_base: str | None = None,
) -> ProviderSpec | None:
    """Detect gateway/local provider.

    Priority:
      1. provider_name — if it maps to a gateway/local spec, use it directly.
      2. api_key prefix — e.g. "sk-or-" → OpenRouter.
      3. api_base keyword — e.g. "aihubmix" in URL → AiHubMix
         (matched case-insensitively).

    Steps 2 and 3 are separate passes over PROVIDERS so that any api_key
    prefix match outranks every api_base keyword match, as listed above.

    A standard provider with a custom api_base (e.g. DeepSeek behind a proxy)
    will NOT be mistaken for vLLM — the old fallback is gone.

    Args:
        provider_name: Config key of the provider, if known.
        api_key: API key used for prefix detection.
        api_base: Endpoint URL used for keyword detection.

    Returns:
        The matching ProviderSpec, or None when nothing is detected.
    """
    # 1. Direct match by config key
    if provider_name:
        spec = find_by_name(provider_name)
        if spec and (spec.is_gateway or spec.is_local):
            return spec

    # 2. Auto-detect by api_key prefix
    if api_key:
        for spec in PROVIDERS:
            if spec.detect_by_key_prefix and api_key.startswith(spec.detect_by_key_prefix):
                return spec

    # 3. Auto-detect by api_base keyword. Lower-case both sides: the host part
    #    of a URL is case-insensitive, so "https://AiHubMix.com" must match too.
    if api_base:
        base_lower = api_base.lower()
        for spec in PROVIDERS:
            keyword = spec.detect_by_base_keyword
            if keyword and keyword.lower() in base_lower:
                return spec

    return None


def find_by_name(name: str) -> ProviderSpec | None:
    """Look up a provider spec by its config field name (e.g. "dashscope").

    Returns the first spec whose ``name`` equals ``name`` exactly, or None.
    """
    return next((spec for spec in PROVIDERS if spec.name == name), None)


================================================
FILE: nanobot/nanobot/providers/transcription.py
================================================
"""Voice transcription provider using Groq."""

import os
from pathlib import Path

import httpx
from loguru import logger


class GroqTranscriptionProvider:
    """
    Voice transcription provider using Groq's Whisper API.

    Groq offers extremely fast transcription with a generous free tier.
    """

    def __init__(self, api_key: str | None = None):
        self.api_key = api_key or os.environ.get("GROQ_API_KEY")
        self.api_url = "https://api.groq.com/openai/v1/audio/transcriptions"

    async def transcribe(self, file_path: str | Path) -> str:
        """
        Transcribe an audio file using Groq.

        Args:
            file_path: Path to the audio file.

        Returns:
            Transcribed text.
        """
        if not self.api_key:
            logger.warning("Groq API key not configured for transcription")
            return ""

        path = Path(file_path)
        if not path.exists():
            logger.error(f"Audio file not found: {file_path}")
            return ""

        try:
            async with httpx.AsyncClient() as client:
                with open(path, "rb") as f:
                    files = {
                        "file": (path.name, f),
                        "model": (None, "whisper-large-v3"),
                    }
                    headers = {
                        "Authorization": f"Bearer {self.api_key}",
                    }

                    response = await client.post(
                        self.api_url, headers=headers, files=files, timeout=60.0
                    )

                    response.raise_for_status()
                    data = response.json()
                    return data.get("text", "")

        except Exception as e:
            logger.error(f"Groq transcription error: {e}")
            return ""


================================================
FILE: nanobot/nanobot/session/__init__.py
================================================
"""Session management module."""

from nanobot.session.manager import Session, SessionManager

__all__ = ["SessionManager", "Session"]


================================================
FILE: nanobot/nanobot/session/manager.py
================================================
"""Session management for conversation history."""

import json
from dataclasses import dataclass, field
from datetime import datetime
from pathlib import Path
from typing import Any

from loguru import logger

from nanobot.utils.helpers import ensure_dir, safe_filename


@dataclass
class Session:
    """
    A conversation session.

    Stores messages in JSONL format for easy reading and persistence.

    Attributes:
        key: Session identifier, in the form ``channel:chat_id``.
        messages: Message dicts in chronological order.
        created_at: When the session object was created.
        updated_at: When the session was last modified.
        metadata: Free-form extra data attached to the session.
    """

    key: str  # channel:chat_id
    messages: list[dict[str, Any]] = field(default_factory=list)
    created_at: datetime = field(default_factory=datetime.now)
    updated_at: datetime = field(default_factory=datetime.now)
    metadata: dict[str, Any] = field(default_factory=dict)

    def add_message(self, role: str, content: str, **kwargs: Any) -> None:
        """Append a message and bump ``updated_at``.

        Args:
            role: Message role (e.g. "user" or "assistant").
            content: Message text.
            **kwargs: Extra fields stored on the message dict as-is.
        """
        msg = {"role": role, "content": content, "timestamp": datetime.now().isoformat(), **kwargs}
        self.messages.append(msg)
        self.updated_at = datetime.now()

    def get_history(self, max_messages: int = 50) -> list[dict[str, Any]]:
        """
        Get message history for LLM context.

        Args:
            max_messages: Maximum messages to return. Zero or a negative
                value yields an empty history.

        Returns:
            The most recent messages, oldest first, reduced to just
            ``role`` and ``content``.
        """
        # Guard non-positive limits explicitly: messages[-0:] is the whole
        # list, so a limit of 0 would otherwise return everything.
        if max_messages <= 0:
            return []

        # Slicing already copes with lists shorter than the limit.
        recent = self.messages[-max_messages:]

        # Convert to LLM format (just role and content)
        return [{"role": m["role"], "content": m["content"]} for m in recent]

    def clear(self) -> None:
        """Clear all messages in the session and bump ``updated_at``."""
        self.messages = []
        self.updated_at = datetime.now()


class SessionManager:
    """
    Manages conversation sessions.

    Sessions are stored as JSONL files in the sessions directory: the first
    line is a metadata record (``"_type": "metadata"``), every following line
    is one message. Loaded and saved sessions are kept in an in-memory cache.
    """

    def __init__(self, workspace: Path):
        """Remember ``workspace`` and prepare the sessions directory.

        Note that the sessions directory is ``~/.nanobot/sessions`` and is
        not derived from ``workspace``.
        """
        self.workspace = workspace
        self.sessions_dir = ensure_dir(Path.home() / ".nanobot" / "sessions")
        self._cache: dict[str, Session] = {}

    def _get_session_path(self, key: str) -> Path:
        """Get the file path for a session.

        The mapping is lossy (":" becomes "_" before sanitising), which is why
        ``save`` also records the original key inside the file.
        """
        safe_key = safe_filename(key.replace(":", "_"))
        return self.sessions_dir / f"{safe_key}.jsonl"

    def get_or_create(self, key: str) -> Session:
        """
        Get an existing session or create a new one.

        Args:
            key: Session key (usually channel:chat_id).

        Returns:
            The cached session if present, otherwise the one loaded from disk,
            otherwise a fresh empty session. The result is cached.
        """
        # Check cache
        if key in self._cache:
            return self._cache[key]

        # Try to load from disk
        session = self._load(key)
        if session is None:
            session = Session(key=key)

        self._cache[key] = session
        return session

    def _load(self, key: str) -> Session | None:
        """Load a session from disk.

        Returns:
            The session, or None when the file is missing or cannot be parsed
            (the failure is logged as a warning).
        """
        path = self._get_session_path(key)

        if not path.exists():
            return None

        try:
            messages = []
            metadata = {}
            created_at = None

            with open(path, encoding="utf-8") as f:
                for line in f:
                    line = line.strip()
                    if not line:
                        continue

                    data = json.loads(line)

                    if data.get("_type") == "metadata":
                        metadata = data.get("metadata", {})
                        created_at = (
                            datetime.fromisoformat(data["created_at"])
                            if data.get("created_at")
                            else None
                        )
                    else:
                        messages.append(data)

            return Session(
                key=key,
                messages=messages,
                created_at=created_at or datetime.now(),
                metadata=metadata,
            )
        except Exception as e:
            logger.warning(f"Failed to load session {key}: {e}")
            return None

    def save(self, session: Session) -> None:
        """Save a session to disk and refresh the cache entry.

        Raises:
            TypeError / ValueError: If the session contains data that cannot
                be serialised to JSON. The existing file is left untouched in
                that case.
        """
        path = self._get_session_path(session.key)

        # The original key is stored because it cannot be recovered reliably
        # from the sanitised filename.
        metadata_line = {
            "_type": "metadata",
            "key": session.key,
            "created_at": session.created_at.isoformat(),
            "updated_at": session.updated_at.isoformat(),
            "metadata": session.metadata,
        }

        # Serialise everything BEFORE opening the file for writing: opening
        # with "w" truncates, so a failure halfway through would otherwise
        # leave a corrupt, partially written session behind.
        lines = [json.dumps(metadata_line)]
        lines.extend(json.dumps(msg) for msg in session.messages)

        with open(path, "w", encoding="utf-8") as f:
            f.write("\n".join(lines) + "\n")

        self._cache[session.key] = session

    def delete(self, key: str) -> bool:
        """
        Delete a session.

        Args:
            key: Session key.

        Returns:
            True if deleted, False if not found.
        """
        # Remove from cache
        self._cache.pop(key, None)

        # Remove file
        path = self._get_session_path(key)
        if path.exists():
            path.unlink()
            return True
        return False

    def list_sessions(self) -> list[dict[str, Any]]:
        """
        List all sessions.

        Only the first (metadata) line of each file is read. Files that are
        empty, unreadable, or do not start with a metadata record are skipped.

        Returns:
            List of session info dicts (``key``, ``created_at``,
            ``updated_at``, ``path``), most recently updated first.
        """
        sessions = []

        for path in self.sessions_dir.glob("*.jsonl"):
            try:
                # Read just the metadata line
                with open(path, encoding="utf-8") as f:
                    first_line = f.readline().strip()
                if not first_line:
                    continue

                data = json.loads(first_line)
                if data.get("_type") != "metadata":
                    continue

                # Prefer the key recorded by save(); files written before the
                # key was stored fall back to guessing it from the filename.
                key = data.get("key") or path.stem.replace("_", ":")
                sessions.append(
                    {
                        "key": key,
                        "created_at": data.get("created_at"),
                        "updated_at": data.get("updated_at"),
                        "path": str(path),
                    }
                )
            except Exception:
                continue

        # "updated_at" may be None for files lacking the field; map it to ""
        # so the sort never compares None with str.
        return sorted(sessions, key=lambda x: str(x.get("updated_at") or ""), reverse=True)


================================================
FILE: nanobot/nanobot/skills/README.md
================================================
# nanobot Skills

This directory contains built-in skills that extend nanobot's capabilities.

## Skill Format

Each skill is a directory containing a `SKILL.md` file with:
- YAML frontmatter (name, description, metadata)
- Markdown instructions for the agent

## Attribution

These skills are adapted from [OpenClaw](https://github.com/openclaw/openclaw)'s skill system.
The skill format and metadata structure follow OpenClaw's conventions to maintain compatibility.

## Available Skills

| Skill | Description |
|-------|-------------|
| `github` | Interact with GitHub using the `gh` CLI |
| `weather` | Get weather info using wttr.in and Open-Meteo |
| `summarize` | Summarize URLs, files, and YouTube videos |
| `tmux` | Remote-control tmux sessions |
| `skill-creator` | Create new skills |
| `cron` | Schedule reminders and recurring tasks |
| `deepcode` | Automated code generation from papers and text requirements (DeepCode integration) |


================================================
FILE: nanobot/nanobot/skills/cron/SKILL.md
================================================
---
name: cron
description: Schedule reminders and recurring tasks.
---

# Cron

Use the `cron` tool to schedule reminders or recurring tasks.

## Two Modes

1. **Reminder** - message is sent directly to user
2. **Task** - message is a task description, agent executes and sends result

## Examples

Fixed reminder:
```
cron(action="add", message="Time to take a break!", every_seconds=1200)
```

Dynamic task (agent executes each time):
```
cron(action="add", message="Check HKUDS/nanobot GitHub stars and report", every_seconds=600)
```

List/remove:
```
cron(action="list")
cron(action="remove", job_id="abc123")
```

## Time Expressions

| User says | Parameters |
|-----------|------------|
| every 20 minutes | every_seconds: 1200 |
| every hour | every_seconds: 3600 |
| every day at 8am | cron_expr: "0 8 * * *" |
| weekdays at 5pm | cron_expr: "0 17 * * 1-5" |


================================================
FILE: nanobot/nanobot/skills/deepcode/SKILL.md
================================================
---
name: deepcode
description: "DeepCode integration - automated code generation from papers and text requirements"
metadata: {"nanobot":{"always":true}}
---

# DeepCode - AI Code Generation Engine

You have access to **DeepCode**, a powerful multi-agent AI code generation engine that can:
- **Paper2Code**: Reproduce research paper algorithms as working code
- **Chat2Code**: Generate complete projects from text descriptions

## Available Tools

| Tool | Purpose |
|------|---------|
| `deepcode_paper2code` | Submit a paper URL or file for code reproduction |
| `deepcode_chat2code` | Submit text requirements for code generation |
| `deepcode_status` | Check task progress and results |
| `deepcode_list_tasks` | List active and recent tasks |
| `deepcode_cancel` | Cancel a running task |
| `deepcode_respond` | Respond to User-in-Loop interactions |

## When to Use DeepCode

### Automatically trigger `deepcode_paper2code` when user:
- Sends an arxiv URL (e.g. `https://arxiv.org/abs/...` or `https://arxiv.org/pdf/...`)
- Sends a paper URL from other academic sites
- Asks to "reproduce", "implement", or "replicate" a paper
- Sends a PDF file and asks for code generation
- Says something like "帮我复现这篇论文" or "把这篇论文的代码跑出来"

### Automatically trigger `deepcode_chat2code` when user:
- Describes a coding project they want to build
- Asks to create a web app, backend service, algorithm implementation, etc.
- Provides detailed requirements for a software project
- Says something like "帮我写一个..." or "生成一个项目..."

## Workflow Guidelines

### 1. Submitting a Task
When the user wants to generate code:
1. Identify if it's a paper (use `deepcode_paper2code`) or requirements (use `deepcode_chat2code`)
2. Submit the task and note the task_id
3. Tell the user the task has been submitted and the estimated wait time (10-60 minutes for papers, 5-30 minutes for chat)
4. Offer to check progress periodically

### 2. Monitoring Progress
- When user asks about progress, use `deepcode_status` with the task_id
- Report the progress percentage and current phase
- If the task is complete, share the result summary

### 3. Handling User-in-Loop Interactions
- Check `deepcode_status` - if status is "waiting_for_input", there's a pending interaction
- Read the interaction details (questions, plan review, etc.)
- Present the questions/plan to the user in a natural conversational way
- Collect the user's response
- Use `deepcode_respond` to submit the response back to DeepCode

### 4. Delivering Results
When a task completes:
- Report the generated file structure
- Mention key files (e.g. model.py, train.py, requirements.txt)
- The generated code is in the shared `deepcode_lab/` directory
- Offer to read specific files if the user wants to review them

## Response Style
- Be concise and informative about task status
- Use progress percentages to show advancement
- When a task completes, provide a brief summary of what was generated
- For Chinese-speaking users, respond in Chinese (follow the user's language)

## Important Notes
- Code generation tasks run in the background and take time (10-60 minutes for papers, 5-30 minutes for chat)
- Do NOT spawn subagents for DeepCode tasks - use the tools directly
- If the DeepCode backend is unreachable, inform the user that the service may not be running
- Generated code is stored in the `/app/deepcode_lab/papers/` directory


================================================
FILE: nanobot/nanobot/skills/github/SKILL.md
================================================
---
name: github
description: "Interact with GitHub using the `gh` CLI. Use `gh issue`, `gh pr`, `gh run`, and `gh api` for issues, PRs, CI runs, and advanced queries."
metadata: {"nanobot":{"emoji":"🐙","requires":{"bins":["gh"]},"install":[{"id":"brew","kind":"brew","formula":"gh","bins":["gh"],"label":"Install GitHub CLI (brew)"},{"id":"apt","kind":"apt","package":"gh","bins":["gh"],"label":"Install GitHub CLI (apt)"}]}}
---

# GitHub Skill

Use the `gh` CLI to interact with GitHub. Always specify `--repo owner/repo` when not in a git directory, or use URLs directly.

## Pull Requests

Check CI status on a PR:
```bash
gh pr checks 55 --repo owner/repo
```

List recent workflow runs:
```bash
gh run list --repo owner/repo --limit 10
```

View a run and see which steps failed:
```bash
gh run view <run-id> --repo owner/repo
```

View logs for failed steps only:
```bash
gh run view <run-id> --repo owner/repo --log-failed
```

## API for Advanced Queries

The `gh api` command is useful for accessing data not available through other subcommands.

Get PR with specific fields:
```bash
gh api repos/owner/repo/pulls/55 --jq '.title, .state, .user.login'
```

## JSON Output

Most commands support `--json` for structured output.  You can use `--jq` to filter:

```bash
gh issue list --repo owner/repo --json number,title --jq '.[] | "\(.number): \(.title)"'
```


================================================
FILE: nanobot/nanobot/skills/skill-creator/SKILL.md
================================================
---
name: skill-creator
description: Create or update AgentSkills. Use when designing, structuring, or packaging skills with scripts, references, and assets.
---

# Skill Creator

This skill provides guidance for creating effective skills.

## About Skills

Skills are modular, self-contained packages that extend the agent's capabilities by providing
specialized knowledge, workflows, and tools. Think of them as "onboarding guides" for specific
domains or tasks—they transform the agent from a general-purpose agent into a specialized agent
equipped with procedural knowledge that no model can fully possess.

### What Skills Provide

1. Specialized workflows - Multi-step procedures for specific domains
2. Tool integrations - Instructions for working with specific file formats or APIs
3. Domain expertise - Company-specific knowledge, schemas, business logic
4. Bundled resources - Scripts, references, and assets for complex and repetitive tasks

## Core Principles

### Concise is Key

The context window is a public good. Skills share the context window with everything else the agent needs: system prompt, conversation history, other Skills' metadata, and the actual user request.

**Default assumption: the agent is already very smart.** Only add context the agent doesn't already have. Challenge each piece of information: "Does the agent really need this explanation?" and "Does this paragraph justify its token cost?"

Prefer concise examples over verbose explanations.

### Set Appropriate Degrees of Freedom

Match the level of specificity to the task's fragility and variability:

**High freedom (text-based instructions)**: Use when multiple approaches are valid, decisions depend on context, or heuristics guide the approach.

**Medium freedom (pseudocode or scripts with parameters)**: Use when a preferred pattern exists, some variation is acceptable, or configuration affects behavior.

**Low freedom (specific scripts, few parameters)**: Use when operations are fragile and error-prone, consistency is critical, or a specific sequence must be followed.

Think of the agent as exploring a path: a narrow bridge with cliffs needs specific guardrails (low freedom), while an open field allows many routes (high freedom).

### Anatomy of a Skill

Every skill consists of a required SKILL.md file and optional bundled resources:

```
skill-name/
├── SKILL.md (required)
│   ├── YAML frontmatter metadata (required)
│   │   ├── name: (required)
│   │   └── description: (required)
│   └── Markdown instructions (required)
└── Bundled Resources (optional)
    ├── scripts/          - Executable code (Python/Bash/etc.)
    ├── references/       - Documentation intended to be loaded into context as needed
    └── assets/           - Files used in output (templates, icons, fonts, etc.)
```

#### SKILL.md (required)

Every SKILL.md consists of:

- **Frontmatter** (YAML): Contains `name` and `description` fields. These are the only fields that the agent reads to determine when the skill gets used, thus it is very important to be clear and comprehensive in describing what the skill is, and when it should be used.
- **Body** (Markdown): Instructions and guidance for using the skill. Only loaded AFTER the skill triggers (if at all).

#### Bundled Resources (optional)

##### Scripts (`scripts/`)

Executable code (Python/Bash/etc.) for tasks that require deterministic reliability or are repeatedly rewritten.

- **When to include**: When the same code is being rewritten repeatedly or deterministic reliability is needed
- **Example**: `scripts/rotate_pdf.py` for PDF rotation tasks
- **Benefits**: Token efficient, deterministic, may be executed without loading into context
- **Note**: Scripts may still need to be read by the agent for patching or environment-specific adjustments

##### References (`references/`)

Documentation and reference material intended to be loaded as needed into context to inform the agent's process and thinking.

- **When to include**: For documentation that the agent should reference while working
- **Examples**: `references/finance.md` for financial schemas, `references/mnda.md` for company NDA template, `references/policies.md` for company policies, `references/api_docs.md` for API specifications
- **Use cases**: Database schemas, API documentation, domain knowledge, company policies, detailed workflow guides
- **Benefits**: Keeps SKILL.md lean, loaded only when the agent determines it's needed
- **Best practice**: If files are large (>10k words), include grep search patterns in SKILL.md
- **Avoid duplication**: Information should live in either SKILL.md or references files, not both. Prefer references files for detailed information unless it's truly core to the skill—this keeps SKILL.md lean while making information discoverable without hogging the context window. Keep only essential procedural instructions and workflow guidance in SKILL.md; move detailed reference material, schemas, and examples to references files.

##### Assets (`assets/`)

Files not intended to be loaded into context, but rather used within the output the agent produces.

- **When to include**: When the skill needs files that will be used in the final output
- **Examples**: `assets/logo.png` for brand assets, `assets/slides.pptx` for PowerPoint templates, `assets/frontend-template/` for HTML/React boilerplate, `assets/font.ttf` for typography
- **Use cases**: Templates, images, icons, boilerplate code, fonts, sample documents that get copied or modified
- **Benefits**: Separates output resources from documentation, enables the agent to use files without loading them into context

#### What Not to Include in a Skill

A skill should only contain essential files that directly support its functionality. Do NOT create extraneous documentation or auxiliary files, including:

- README.md
- INSTALLATION_GUIDE.md
- QUICK_REFERENCE.md
- CHANGELOG.md
- etc.

The skill should only contain the information needed for an AI agent to do the job at hand. It should not contain auxiliary context about the process that went into creating it, setup and testing procedures, user-facing documentation, etc. Creating additional documentation files just adds clutter and confusion.

### Progressive Disclosure Design Principle

Skills use a three-level loading system to manage context efficiently:

1. **Metadata (name + description)** - Always in context (~100 words)
2. **SKILL.md body** - When skill triggers (<5k words)
3. **Bundled resources** - As needed by the agent (Unlimited because scripts can be executed without reading into context window)

#### Progressive Disclosure Patterns

Keep SKILL.md body to the essentials and under 500 lines to minimize context bloat. Split content into separate files when approaching this limit. When splitting out content into other files, it is very important to reference them from SKILL.md and describe clearly when to read them, to ensure the reader of the skill knows they exist and when to use them.

**Key principle:** When a skill supports multiple variations, frameworks, or options, keep only the core workflow and selection guidance in SKILL.md. Move variant-specific details (patterns, examples, configuration) into separate reference files.

**Pattern 1: High-level guide with references**

```markdown
# PDF Processing

## Quick start

Extract text with pdfplumber:
[code example]

## Advanced features

- **Form filling**: See [FORMS.md](FORMS.md) for complete guide
- **API reference**: See [REFERENCE.md](REFERENCE.md) for all methods
- **Examples**: See [EXAMPLES.md](EXAMPLES.md) for common patterns
```

The agent loads FORMS.md, REFERENCE.md, or EXAMPLES.md only when needed.

**Pattern 2: Domain-specific organization**

For Skills with multiple domains, organize content by domain to avoid loading irrelevant context:

```
bigquery-skill/
├── SKILL.md (overview and navigation)
└── references/
    ├── finance.md (revenue, billing metrics)
    ├── sales.md (opportunities, pipeline)
    ├── product.md (API usage, features)
    └── marketing.md (campaigns, attribution)
```

When a user asks about sales metrics, the agent only reads sales.md.

Similarly, for skills supporting multiple frameworks or variants, organize by variant:

```
cloud-deploy/
├── SKILL.md (workflow + provider selection)
└── references/
    ├── aws.md (AWS deployment patterns)
    ├── gcp.md (GCP deployment patterns)
    └── azure.md (Azure deployment patterns)
```

When the user chooses AWS, the agent only reads aws.md.

**Pattern 3: Conditional details**

Show basic content, link to advanced content:

```markdown
# DOCX Processing

## Creating documents

Use docx-js for new documents. See [DOCX-JS.md](DOCX-JS.md).

## Editing documents

For simple edits, modify the XML directly.

**For tracked changes**: See [REDLINING.md](REDLINING.md)
**For OOXML details**: See [OOXML.md](OOXML.md)
```

The agent reads REDLINING.md or OOXML.md only when the user needs those features.

**Important guidelines:**

- **Avoid deeply nested references** - Keep references one level deep from SKILL.md. All reference files should link directly from SKILL.md.
- **Structure longer reference files** - For files longer than 100 lines, include a table of contents at the top so the agent can see the full scope when previewing.

## Skill Creation Process

Skill creation involves these steps:

1. Understand the skill with concrete examples
2. Plan reusable skill contents (scripts, references, assets)
3. Initialize the skill (run init_skill.py)
4. Edit the skill (implement resources and write SKILL.md)
5. Package the skill (run package_skill.py)
6. Iterate based on real usage

Follow these steps in order, skipping only if there is a clear reason why they are not applicable.

### Skill Naming

- Use lowercase letters, digits, and hyphens only; normalize user-provided titles to hyphen-case (e.g., "Plan Mode" -> `plan-mode`).
- When generating names, generate a name under 64 characters (letters, digits, hyphens).
- Prefer short, verb-led phrases that describe the action.
- Namespace by tool when it improves clarity or triggering (e.g., `gh-address-comments`, `linear-address-issue`).
- Name the skill folder exactly after the skill name.

### Step 1: Understanding the Skill with Concrete Examples

Skip this step only when the skill's usage patterns are already clearly understood. It remains valuable even when working with an existing skill.

To create an effective skill, clearly understand concrete examples of how the skill will be used. This understanding can come from either direct user examples or generated examples that are validated with user feedback.

For example, when building an image-editor skill, relevant questions include:

- "What functionality should the image-editor skill support? Editing, rotating, anything else?"
- "Can you give some examples of how this skill would be used?"
- "I can imagine users asking for things like 'Remove the red-eye from this image' or 'Rotate this image'. Are there other ways you imagine this skill being used?"
- "What would a user say that should trigger this skill?"

To avoid overwhelming users, avoid asking too many questions in a single message. Start with the most important questions and follow up as needed for better effectiveness.

Conclude this step when there is a clear sense of the functionality the skill should support.

### Step 2: Planning the Reusable Skill Contents

To turn concrete examples into an effective skill, analyze each example by:

1. Considering how to execute on the example from scratch
2. Identifying what scripts, references, and assets would be helpful when executing these workflows repeatedly

Example: When building a `pdf-editor` skill to handle queries like "Help me rotate this PDF," the analysis shows:

1. Rotating a PDF requires re-writing the same code each time
2. A `scripts/rotate_pdf.py` script would be helpful to store in the skill

Example: When designing a `frontend-webapp-builder` skill for queries like "Build me a todo app" or "Build me a dashboard to track my steps," the analysis shows:

1. Writing a frontend webapp requires the same boilerplate HTML/React each time
2. An `assets/hello-world/` template containing the boilerplate HTML/React project files would be helpful to store in the skill

Example: When building a `big-query` skill to handle queries like "How many users have logged in today?" the analysis shows:

1. Querying BigQuery requires re-discovering the table schemas and relationships each time
2. A `references/schema.md` file documenting the table schemas would be helpful to store in the skill

To establish the skill's contents, analyze each concrete example to create a list of the reusable resources to include: scripts, references, and assets.

### Step 3: Initializing the Skill

At this point, it is time to actually create the skill.

Skip this step only if the skill being developed already exists, and iteration or packaging is needed. In this case, continue to the next step.

When creating a new skill from scratch, always run the `init_skill.py` script. The script conveniently generates a new template skill directory that automatically includes everything a skill requires, making the skill creation process much more efficient and reliable.

Usage:

```bash
scripts/init_skill.py <skill-name> --path <output-directory> [--resources scripts,references,assets] [--examples]
```

Examples:

```bash
scripts/init_skill.py my-skill --path skills/public
scripts/init_skill.py my-skill --path skills/public --resources scripts,references
scripts/init_skill.py my-skill --path skills/public --resources scripts --examples
```

The script:

- Creates the skill directory at the specified path
- Generates a SKILL.md template with proper frontmatter and TODO placeholders
- Optionally creates resource directories based on `--resources`
- Optionally adds example files when `--examples` is set

After initialization, customize the SKILL.md and add resources as needed. If you used `--examples`, replace or delete placeholder files.

### Step 4: Edit the Skill

When editing the (newly-generated or existing) skill, remember that the skill is being created for another instance of the agent to use. Include information that would be beneficial and non-obvious to the agent. Consider what procedural knowledge, domain-specific details, or reusable assets would help another agent instance execute these tasks more effectively.

#### Learn Proven Design Patterns

Consult these helpful guides based on your skill's needs:

- **Multi-step processes**: See references/workflows.md for sequential workflows and conditional logic
- **Specific output formats or quality standards**: See references/output-patterns.md for template and example patterns

These files contain established best practices for effective skill design.

#### Start with Reusable Skill Contents

To begin implementation, start with the reusable resources identified above: `scripts/`, `references/`, and `assets/` files. Note that this step may require user input. For example, when implementing a `brand-guidelines` skill, the user may need to provide brand assets or templates to store in `assets/`, or documentation to store in `references/`.

Added scripts must be tested by actually running them to ensure there are no bugs and that the output matches what is expected. If there are many similar scripts, only a representative sample needs to be tested to ensure confidence that they all work while balancing time to completion.

If you used `--examples`, delete any placeholder files that are not needed for the skill. Only create resource directories that are actually required.

#### Update SKILL.md

**Writing Guidelines:** Always use imperative/infinitive form.

##### Frontmatter

Write the YAML frontmatter with `name` and `description`:

- `name`: The skill name
- `description`: This is the primary triggering mechanism for your skill, and helps the agent understand when to use the skill.
  - Include both what the Skill does and specific triggers/contexts for when to use it.
  - Include all "when to use" information here - Not in the body. The body is only loaded after triggering, so "When to Use This Skill" sections in the body are not helpful to the agent.
  - Example description for a `docx` skill: "Comprehensive document creation, editing, and analysis with support for tracked changes, comments, formatting preservation, and text extraction. Use when the agent needs to work with professional documents (.docx files) for: (1) Creating new documents, (2) Modifying or editing content, (3) Working with tracked changes, (4) Adding comments, or any other document tasks"

Do not include any other fields in YAML frontmatter.

##### Body

Write instructions for using the skill and its bundled resources.

### Step 5: Packaging a Skill

Once development of the skill is complete, it must be packaged into a distributable .skill file that gets shared with the user. The packaging process automatically validates the skill first to ensure it meets all requirements:

```bash
scripts/package_skill.py <path/to/skill-folder>
```

Optional output directory specification:

```bash
scripts/package_skill.py <path/to/skill-folder> ./dist
```

The packaging script will:

1. **Validate** the skill automatically, checking:

   - YAML frontmatter format and required fields
   - Skill naming conventions and directory structure
   - Description completeness and quality
   - File organization and resource references

2. **Package** the skill if validation passes, creating a .skill file named after the skill (e.g., `my-skill.skill`) that includes all files and maintains the proper directory structure for distribution. The .skill file is a zip file with a .skill extension.

If validation fails, the script will report the errors and exit without creating a package. Fix any validation errors and run the packaging command again.

### Step 6: Iterate

After testing the skill, users may request improvements. Often this happens right after using the skill, with fresh context of how the skill performed.

**Iteration workflow:**

1. Use the skill on real tasks
2. Notice struggles or inefficiencies
3. Identify how SKILL.md or bundled resources should be updated
4. Implement changes and test again


================================================
FILE: nanobot/nanobot/skills/summarize/SKILL.md
================================================
---
name: summarize
description: Summarize or extract text/transcripts from URLs, podcasts, and local files (great fallback for “transcribe this YouTube/video”).
homepage: https://summarize.sh
metadata: {"nanobot":{"emoji":"🧾","requires":{"bins":["summarize"]},"install":[{"id":"brew","kind":"brew","formula":"steipete/tap/summarize","bins":["summarize"],"label":"Install summarize (brew)"}]}}
---

# Summarize

Fast CLI to summarize URLs, local files, and YouTube links.

## When to use (trigger phrases)

Use this skill immediately when the user asks any of:
- “use summarize.sh”
- “what’s this link/video about?”
- “summarize this URL/article”
- “transcribe this YouTube/video” (best-effort transcript extraction; no `yt-dlp` needed)

## Quick start

```bash
summarize "https://example.com" --model google/gemini-3-flash-preview
summarize "/path/to/file.pdf" --model google/gemini-3-flash-preview
summarize "https://youtu.be/dQw4w9WgXcQ" --youtube auto
```

## YouTube: summary vs transcript

Best-effort transcript (URLs only):

```bash
summarize "https://youtu.be/dQw4w9WgXcQ" --youtube auto --extract-only
```

If the user asked for a transcript but it’s huge, return a tight summary first, then ask which section/time range to expand.

## Model + keys

Set the API key for your chosen provider:
- OpenAI: `OPENAI_API_KEY`
- Anthropic: `ANTHROPIC_API_KEY`
- xAI: `XAI_API_KEY`
- Google: `GEMINI_API_KEY` (aliases: `GOOGLE_GENERATIVE_AI_API_KEY`, `GOOGLE_API_KEY`)

Default model is `google/gemini-3-flash-preview` if none is set.

## Useful flags

- `--length short|medium|long|xl|xxl|<chars>`
- `--max-output-tokens <count>`
- `--extract-only` (URLs only)
- `--json` (machine readable)
- `--firecrawl auto|off|always` (fallback extraction)
- `--youtube auto` (Apify fallback if `APIFY_API_TOKEN` set)

## Config

Optional config file: `~/.summarize/config.json`

```json
{ "model": "openai/gpt-5.2" }
```

Optional services:
- `FIRECRAWL_API_KEY` for blocked sites
- `APIFY_API_TOKEN` for YouTube fallback


================================================
FILE: nanobot/nanobot/skills/tmux/SKILL.md
================================================
---
name: tmux
description: Remote-control tmux sessions for interactive CLIs by sending keystrokes and scraping pane output.
metadata: {"nanobot":{"emoji":"🧵","os":["darwin","linux"],"requires":{"bins":["tmux"]}}}
---

# tmux Skill

Use tmux only when you need an interactive TTY. Prefer exec background mode for long-running, non-interactive tasks.

## Quickstart (isolated socket, exec tool)

```bash
SOCKET_DIR="${NANOBOT_TMUX_SOCKET_DIR:-${TMPDIR:-/tmp}/nanobot-tmux-sockets}"
mkdir -p "$SOCKET_DIR"
SOCKET="$SOCKET_DIR/nanobot.sock"
SESSION=nanobot-python

tmux -S "$SOCKET" new -d -s "$SESSION" -n shell
tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 -- 'PYTHON_BASIC_REPL=1 python3 -q' Enter
tmux -S "$SOCKET" capture-pane -p -J -t "$SESSION":0.0 -S -200
```

After starting a session, always print monitor commands:

```
To monitor:
  tmux -S "$SOCKET" attach -t "$SESSION"
  tmux -S "$SOCKET" capture-pane -p -J -t "$SESSION":0.0 -S -200
```

## Socket convention

- Use the `NANOBOT_TMUX_SOCKET_DIR` environment variable to choose the socket directory (default: `${TMPDIR:-/tmp}/nanobot-tmux-sockets`).
- Default socket path: `"$NANOBOT_TMUX_SOCKET_DIR/nanobot.sock"`.

## Targeting panes and naming

- Target format: `session:window.pane` (defaults to `:0.0`).
- Keep names short; avoid spaces.
- Inspect: `tmux -S "$SOCKET" list-sessions`, `tmux -S "$SOCKET" list-panes -a`.

## Finding sessions

- List sessions on your socket: `{baseDir}/scripts/find-sessions.sh -S "$SOCKET"`.
- Scan all sockets: `{baseDir}/scripts/find-sessions.sh --all` (uses `NANOBOT_TMUX_SOCKET_DIR`).

## Sending input safely

- Prefer literal sends: `tmux -S "$SOCKET" send-keys -t target -l -- "$cmd"`.
- Control keys: `tmux -S "$SOCKET" send-keys -t target C-c`.

## Watching output

- Capture recent history: `tmux -S "$SOCKET" capture-pane -p -J -t target -S -200`.
- Wait for prompts: `{baseDir}/scripts/wait-for-text.sh -t session:0.0 -p 'pattern'`.
- Attaching is OK; detach with `Ctrl+b d`.

## Spawning processes

- For python REPLs, set `PYTHON_BASIC_REPL=1` (non-basic REPL breaks send-keys flows).

## Windows / WSL

- tmux is supported on macOS/Linux. On Windows, use WSL and install tmux inside WSL.
- This skill is gated to `darwin`/`linux` and requires `tmux` on PATH.

## Orchestrating Coding Agents (Codex, Claude Code)

tmux excels at running multiple coding agents in parallel:

```bash
SOCKET="${TMPDIR:-/tmp}/codex-army.sock"

# Create multiple sessions
for i in 1 2 3 4 5; do
  tmux -S "$SOCKET" new-session -d -s "agent-$i"
done

# Launch agents in different workdirs
tmux -S "$SOCKET" send-keys -t agent-1 "cd /tmp/project1 && codex --yolo 'Fix bug X'" Enter
tmux -S "$SOCKET" send-keys -t agent-2 "cd /tmp/project2 && codex --yolo 'Fix bug Y'" Enter

# Poll for completion (check if prompt returned)
for sess in agent-1 agent-2; do
  if tmux -S "$SOCKET" capture-pane -p -t "$sess" -S -3 | grep -q "❯"; then
    echo "$sess: DONE"
  else
    echo "$sess: Running..."
  fi
done

# Get full output from completed session
tmux -S "$SOCKET" capture-pane -p -t agent-1 -S -500
```

**Tips:**
- Use separate git worktrees for parallel fixes (no branch conflicts)
- `pnpm install` first before running codex in fresh clones
- Check for shell prompt (`❯` or `$`) to detect completion
- Codex needs `--yolo` or `--full-auto` for non-interactive fixes

## Cleanup

- Kill a session: `tmux -S "$SOCKET" kill-session -t "$SESSION"`.
- Kill all sessions on a socket: `tmux -S "$SOCKET" list-sessions -F '#{session_name}' | xargs -r -n1 tmux -S "$SOCKET" kill-session -t`.
- Remove everything on the private socket: `tmux -S "$SOCKET" kill-server`.

## Helper: wait-for-text.sh

`{baseDir}/scripts/wait-for-text.sh` polls a pane for a regex (or fixed string) with a timeout.

```bash
{baseDir}/scripts/wait-for-text.sh -t session:0.0 -p 'pattern' [-F] [-T 20] [-i 0.5] [-l 2000]
```

- `-t`/`--target` pane target (required)
- `-p`/`--pattern` regex to match (required); add `-F` for fixed string
- `-T` timeout seconds (integer, default 15)
- `-i` poll interval seconds (default 0.5)
- `-l` history lines to search (integer, default 1000)


================================================
FILE: nanobot/nanobot/skills/tmux/scripts/find-sessions.sh
================================================
#!/usr/bin/env bash
set -euo pipefail

# Print the command-line help for find-sessions.sh on stdout.
usage() {
  # One argument per output line; printf repeats the format for each of them.
  printf '%s\n' \
    'Usage: find-sessions.sh [-L socket-name|-S socket-path|-A] [-q pattern]' \
    '' \
    'List tmux sessions on a socket (default tmux socket if none provided).' \
    '' \
    'Options:' \
    '  -L, --socket       tmux socket name (passed to tmux -L)' \
    '  -S, --socket-path  tmux socket path (passed to tmux -S)' \
    '  -A, --all          scan all sockets under NANOBOT_TMUX_SOCKET_DIR' \
    '  -q, --query        case-insensitive substring to filter session names' \
    '  -h, --help         show this help'
}

# Parsed command-line state.
socket_name=""   # value of -L/--socket (tmux socket name)
socket_path=""   # value of -S/--socket-path (tmux socket path)
query=""         # value of -q/--query (session filter)
scan_all=false   # true once -A/--all has been seen
# Directory scanned by --all; NANOBOT_TMUX_SOCKET_DIR overrides the default.
socket_dir="${NANOBOT_TMUX_SOCKET_DIR:-${TMPDIR:-/tmp}/nanobot-tmux-sockets}"

# Abort with a clear message when a value-taking option is the last argument.
# Without this check `shift 2` fails and `set -e` ends the script with no
# diagnostic at all.
# Args: the remaining command line ("$@"), with the option itself first.
require_value() {
  if [[ $# -lt 2 ]]; then
    echo "Missing value for option: $1" >&2
    usage
    exit 1
  fi
}

while [[ $# -gt 0 ]]; do
  case "$1" in
    -L|--socket)      require_value "$@"; socket_name="$2"; shift 2 ;;
    -S|--socket-path) require_value "$@"; socket_path="$2"; shift 2 ;;
    -A|--all)         scan_all=true; shift ;;
    -q|--query)       require_value "$@"; query="$2"; shift 2 ;;
    -h|--help)        usage; exit 0 ;;
    *) echo "Unknown option: $1" >&2; usage; exit 1 ;;
  esac
done

# --all enumerates the socket directory itself, so an explicit socket
# selection would be contradictory.
if [[ "$scan_all" == true && ( -n "$socket_name" || -n "$socket_path" ) ]]; then
  echo "Cannot combine --all with -L or -S" >&2
  exit 1
fi

# -L (socket name) and -S (socket path) are mutually exclusive.
if [[ -n "$socket_name" && -n "$socket_path" ]]; then
  echo "Use either -L or -S, not both" >&2
  exit 1
fi

# Everything below shells out to tmux, so fail early if it is missing.
if ! command -v tmux >/dev/null 2>&1; then
  echo "tmux not found in PATH" >&2
  exit 1
fi

# Print the sessions of one tmux server as a human-readable list.
#
# Args:
#   $1    label describing the socket; used only in messages
#   $2..  extra arguments placed before the tmux subcommand (e.g. -S <path>)
# Globals:
#   query (read) - when non-empty, only lines containing it are kept
# Returns:
#   1 when `tmux list-sessions` fails (message on stderr), 0 otherwise,
#   including the case where no session survives the filter.
list_sessions() {
  local label="$1"; shift
  local tmux_cmd=(tmux "$@")
  # Kept local so the raw listing does not leak into the caller's scope.
  # Declared on its own line so `local` cannot mask the exit status of the
  # command substitution tested below.
  local sessions

  if ! sessions="$("${tmux_cmd[@]}" list-sessions -F '#{session_name}\t#{session_attached}\t#{session_created_string}' 2>/dev/null)"; then
    echo "No tmux server found on $label" >&2
    return 1
  fi

  if [[ -n "$query" ]]; then
    # -F: treat the query as a literal substring, as the usage text documents,
    # so characters such as '.' or '[' are not interpreted as a regex.
    # NOTE: the match runs against the whole formatted line, not only the
    # session-name field.
    # `|| true` keeps a no-match grep from tripping `set -e`/pipefail.
    sessions="$(printf '%s\n' "$sessions" | grep -iF -- "$query" || true)"
  fi

  if [[ -z "$sessions" ]]; then
    echo "No sessions found on $label"
    return 0
  fi

  echo "Sessions on $label:"
  printf '%s\n' "$sessions" | while IFS=$'\t' read -r name attached created; do
    if [[ "$attached" == "1" ]]; then
      attached_label="attached"
    else
      attached_label="detached"
    fi
    printf '  - %s (%s, started %s)\n' "$name" "$attached_label" "$created"
  done
}

# --all mode: probe every socket file found in $socket_dir, report each server,
# and exit with the status of the last listing that failed (0 if none did).
if [[ "$scan_all" == true ]]; then
  [[ -d "$socket_dir" ]] || {
    echo "Socket directory not found: $socket_dir" >&2
    exit 1
  }

  # nullglob makes an empty directory expand to an empty array, not a literal "*".
  shopt -s nullglob
  candidates=("$socket_dir"/*)
  shopt -u nullglob

  if (( ${#candidates[@]} == 0 )); then
    echo "No sockets found under $socket_dir" >&2
    exit 1
  fi

  status=0
  for candidate in "${candidates[@]}"; do
    # Entries that are not sockets are skipped.
    [[ -S "$candidate" ]] || continue
    list_sessions "socket path '$candidate'" -S "$candidate" || status=$?
  done
  exit "$status"
fi

# Single-server mode: start from the bare command and append the selector, if any.
base_cmd=(tmux)
socket_label="default socket"

if [[ -n "$socket_name" ]]; then
  socket_label="socket name '$socket_name'"
  base_cmd+=(-L "$socket_name")
elif [[ -n "$socket_path" ]]; then
  socket_label="socket path '$socket_path'"
  base_cmd+=(-S "$socket_path")
fi

# Element 0 ("tmux") is dropped because list_sessions prepends the command itself.
list_sessions "$socket_label" "${base_cmd[@]:1}"


================================================
FILE: nanobot/nanobot/skills/tmux/scripts/wait-for-text.sh
================================================
#!/usr/bin/env bash
set -euo pipefail

# Print the command-line help text to stdout.
# The heredoc delimiter is quoted, so the text is emitted verbatim without
# parameter expansion.
usage() {
  cat <<'USAGE'
Usage: wait-for-text.sh -t target -p pattern [options]

Poll a tmux pane for text and exit when found.

Options:
  -t, --target    tmux target (session:window.pane), required
  -p, --pattern   regex pattern to look for, required
  -F, --fixed     treat pattern as a fixed string (grep -F)
  -T, --timeout   seconds to wait (integer, default: 15)
  -i, --interval  poll interval in seconds (default: 0.5)
  -l, --lines     number of history lines to inspect (integer, default: 1000)
  -h, --help      show this help
USAGE
}

# Option defaults; each may be overridden on the command line.
target=""
pattern=""
grep_flag="-E"   # extended regex unless -F/--fixed is given
timeout=15
interval=0.5
lines=1000

# require_value OPTION [VALUE...]
# Abort with a usage message when OPTION is the last argument. A bare `shift 2`
# would otherwise fail on the single remaining argument and, under `set -e`,
# end the script without any diagnostic.
require_value() {
  if [[ $# -lt 2 ]]; then
    echo "Missing value for option: $1" >&2
    usage
    exit 1
  fi
}

while [[ $# -gt 0 ]]; do
  case "$1" in
    -t|--target)   require_value "$@"; target="$2"; shift 2 ;;
    -p|--pattern)  require_value "$@"; pattern="$2"; shift 2 ;;
    -F|--fixed)    grep_flag="-F"; shift ;;
    -T|--timeout)  require_value "$@"; timeout="$2"; shift 2 ;;
    -i|--interval) require_value "$@"; interval="$2"; shift 2 ;;
    -l|--lines)    require_value "$@"; lines="$2"; shift 2 ;;
    -h|--help)     usage; exit 0 ;;
    *) echo "Unknown option: $1" >&2; usage; exit 1 ;;
  esac
done

if [[ -z "$target" || -z "$pattern" ]]; then
  echo "target and pattern are required" >&2
  usage
  exit 1
fi

# timeout feeds shell arithmetic later on, so it must be a plain integer.
if ! [[ "$timeout" =~ ^[0-9]+$ ]]; then
  echo "timeout must be an integer number of seconds" >&2
  exit 1
fi

if ! [[ "$lines" =~ ^[0-9]+$ ]]; then
  echo "lines must be an integer" >&2
  exit 1
fi

if ! command -v tmux >/dev/null 2>&1; then
  echo "tmux not found in PATH" >&2
  exit 1
fi

# End time in epoch seconds (integer, good enough for polling)
start_epoch=$(date +%s)
deadline=$((start_epoch + timeout))

# Poll until the pattern shows up (exit 0) or the deadline passes (exit 1).
# The pane is always inspected before the deadline check, so at least one
# capture happens even with a timeout of 0.
while true; do
  # -J joins wrapped lines, -S uses negative index to read last N lines
  # `|| true` keeps a failing capture from aborting the script under `set -e`;
  # the pane text is then whatever (possibly nothing) tmux printed.
  pane_text="$(tmux capture-pane -p -J -t "$target" -S "-${lines}" 2>/dev/null || true)"

  # Only grep's exit status matters; its output and errors are discarded.
  # NOTE(review): presumably the redirect is used instead of `grep -q` so grep
  # reads all input and printf cannot fail with SIGPIPE under pipefail — confirm.
  if printf '%s\n' "$pane_text" | grep $grep_flag -- "$pattern" >/dev/null 2>&1; then
    exit 0
  fi

  now=$(date +%s)
  if (( now >= deadline )); then
    # On timeout, dump the last captured pane text to stderr for debugging.
    echo "Timed out after ${timeout}s waiting for pattern: $pattern" >&2
    echo "Last ${lines} lines from $target:" >&2
    printf '%s\n' "$pane_text" >&2
    exit 1
  fi

  sleep "$interval"
done


================================================
FILE: nanobot/nanobot/skills/weather/SKILL.md
================================================
---
name: weather
description: Get current weather and forecasts (no API key required).
homepage: https://wttr.in/:help
metadata: {"nanobot":{"emoji":"🌤️","requires":{"bins":["curl"]}}}
---

# Weather

Two free services, no API keys needed.

## wttr.in (primary)

Quick one-liner:
```bash
curl -s "wttr.in/London?format=3"
# Output: London: ⛅️ +8°C
```

Compact format:
```bash
curl -s "wttr.in/London?format=%l:+%c+%t+%h+%w"
# Output: London: ⛅️ +8°C 71% ↙5km/h
```

Full forecast:
```bash
curl -s "wttr.in/London?T"
```

Format codes: `%c` condition · `%t` temp · `%h` humidity · `%w` wind · `%l` location · `%m` moon

Tips:
- URL-encode spaces: `wttr.in/New+York`
- Airport codes: `wttr.in/JFK`
- Units: `?m` (metric) `?u` (USCS)
- Today only: `?1` · Current only: `?0`
- PNG: `curl -s "wttr.in/Berlin.png" -o /tmp/weather.png`

## Open-Meteo (fallback, JSON)

Free, no key, good for programmatic use:
```bash
curl -s "https://api.open-meteo.com/v1/forecast?latitude=51.5&longitude=-0.12&current_weather=true"
```

Find coordinates for a city, then query. Returns JSON with temp, windspeed, weathercode.

Docs: https://open-meteo.com/en/docs


================================================
FILE: nanobot/nanobot/utils/__init__.py
================================================
"""Utility functions for nanobot."""

from nanobot.utils.helpers import ensure_dir, get_data_path, get_workspace_path

__all__ = ["ensure_dir", "get_workspace_path", "get_data_path"]


================================================
FILE: nanobot/nanobot/utils/helpers.py
================================================
"""Utility functions for nanobot."""

from datetime import datetime
from pathlib import Path


def ensure_dir(path: Path) -> Path:
    """Create ``path`` together with any missing parents and hand it back.

    Args:
        path: Directory to create; an existing directory is left untouched.

    Returns:
        The very same ``path`` object that was passed in.
    """
    path.mkdir(exist_ok=True, parents=True)
    return path


def get_data_path() -> Path:
    """Return the nanobot data directory (``~/.nanobot``), creating it if absent."""
    data_dir = Path.home() / ".nanobot"
    return ensure_dir(data_dir)


def get_workspace_path(workspace: str | None = None) -> Path:
    """
    Resolve the workspace directory and make sure it exists.

    Args:
        workspace: Optional workspace location; a leading ``~`` is expanded.
            When empty or omitted, ``~/.nanobot/workspace`` is used.

    Returns:
        The workspace path, created on disk if it was missing.
    """
    default_location = Path.home() / ".nanobot" / "workspace"
    chosen = Path(workspace).expanduser() if workspace else default_location
    return ensure_dir(chosen)


def get_sessions_path() -> Path:
    """Return the ``sessions`` directory inside the data directory, creating it if absent."""
    sessions_dir = get_data_path() / "sessions"
    return ensure_dir(sessions_dir)


def get_memory_path(workspace: Path | None = None) -> Path:
    """Return the ``memory`` directory of a workspace, creating it if absent.

    Args:
        workspace: Workspace root; the default workspace is used when omitted.
    """
    if not workspace:
        workspace = get_workspace_path()
    return ensure_dir(workspace / "memory")


def get_skills_path(workspace: Path | None = None) -> Path:
    """Return the ``skills`` directory of a workspace, creating it if absent.

    Args:
        workspace: Workspace root; the default workspace is used when omitted.
    """
    if not workspace:
        workspace = get_workspace_path()
    return ensure_dir(workspace / "skills")


def today_date() -> str:
    """Return the current local date formatted as YYYY-MM-DD."""
    now = datetime.now()
    # The format spec is forwarded to strftime.
    return f"{now:%Y-%m-%d}"


def timestamp() -> str:
    """Return the current local time as an ISO 8601 string (no UTC offset)."""
    moment = datetime.now()
    return moment.isoformat()


def truncate_string(s: str, max_len: int = 100, suffix: str = "...") -> str:
    """Shorten ``s`` so that the result never exceeds ``max_len`` characters.

    Args:
        s: Text to shorten.
        max_len: Maximum length of the returned string.
        suffix: Marker appended when text was cut off; it counts towards
            ``max_len``.

    Returns:
        ``s`` unchanged when it already fits. Otherwise the leading part of
        ``s`` followed by ``suffix``. When ``max_len`` is too small to hold
        the suffix, ``s`` is cut to ``max_len`` characters without a suffix.
    """
    if len(s) <= max_len:
        return s
    if max_len < len(suffix):
        # No room for the marker: a negative slice bound would cut from the
        # wrong end and return more than max_len characters.
        return s[: max(max_len, 0)]
    return s[: max_len - len(suffix)] + suffix


def safe_filename(name: str) -> str:
    """Return ``name`` with filename-unsafe characters replaced by underscores.

    Each of ``< > : " / \\ | ? *`` becomes ``_``; surrounding whitespace is
    stripped afterwards.
    """
    replacements = str.maketrans({ch: "_" for ch in '<>:"/\\|?*'})
    return name.translate(replacements).strip()


def parse_session_key(key: str) -> tuple[str, str]:
    """
    Split a session key at its first colon.

    Args:
        key: Session key written as "channel:chat_id". Only the first colon
            separates the parts; later colons stay in the chat id.

    Returns:
        Tuple of (channel, chat_id)

    Raises:
        ValueError: If ``key`` contains no colon.
    """
    channel, separator, chat_id = key.partition(":")
    if not separator:
        raise ValueError(f"Invalid session key: {key}")
    return channel, chat_id


================================================
FILE: nanobot/pyproject.toml
================================================
[project]
name = "nanobot-ai"
version = "0.1.3.post5"
description = "A lightweight personal AI assistant framework"
requires-python = ">=3.11"
license = {text = "MIT"}
authors = [
    {name = "nanobot contributors"}
]
keywords = ["ai", "agent", "chatbot"]
classifiers = [
    "Development Status :: 3 - Alpha",
    "Intended Audience :: Developers",
    "License :: OSI Approved :: MIT License",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
]

dependencies = [
    "typer>=0.9.0",
    "litellm>=1.0.0",
    "pydantic>=2.0.0",
    "pydantic-settings>=2.0.0",
    "websockets>=12.0",
    "websocket-client>=1.6.0",
    "httpx[socks]>=0.25.0",
    "loguru>=0.7.0",
    "readability-lxml>=0.8.0",
    "rich>=13.0.0",
    "croniter>=2.0.0",
    "dingtalk-stream>=0.4.0",
    "python-telegram-bot[socks]>=21.0",
    "lark-oapi>=1.0.0",
    "socksio>=1.0.0",
    "slack-sdk>=3.26.0",
    "qq-botpy>=1.0.0",
]

[project.optional-dependencies]
dev = [
    "pytest>=7.0.0",
    "pytest-asyncio>=0.21.0",
    "ruff>=0.1.0",
]

[project.scripts]
nanobot = "nanobot.cli.commands:app"

[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"

[tool.hatch.build.targets.wheel]
packages = ["nanobot"]

[tool.hatch.build.targets.wheel.sources]
"nanobot" = "nanobot"

# Include non-Python files in skills
[tool.hatch.build]
include = [
    "nanobot/**/*.py",
    "nanobot/skills/**/*.md",
    "nanobot/skills/**/*.sh",
]

[tool.hatch.build.targets.sdist]
include = [
    "nanobot/",
    "bridge/",
    "README.md",
    "LICENSE",
]

[tool.hatch.build.targets.wheel.force-include]
"bridge" = "nanobot/bridge"

[tool.ruff]
line-length = 100
target-version = "py311"

[tool.ruff.lint]
select = ["E", "F", "I", "N", "W"]
ignore = ["E501"]

[tool.pytest.ini_options]
asyncio_mode = "auto"
testpaths = ["tests"]


================================================
FILE: nanobot/run_nanobot.sh
================================================
#!/bin/bash
# ============================================================
# Nanobot + DeepCode one-step launcher
# Checks the environment and configuration, builds the Docker images
# and starts the services.
# Provides the full Feishu <-> Nanobot <-> DeepCode communication chain.
# ============================================================

# Abort on the first command that fails.
set -e

# Paths are resolved from this script's location: the project root is the
# script's parent directory and the compose file lives under deepcode_docker/.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_ROOT="$(cd "$SCRIPT_DIR/.." && pwd)"
COMPOSE_FILE="$PROJECT_ROOT/deepcode_docker/docker-compose.yml"

# Color definitions (ANSI escape sequences, printed with `echo -e`)
RED='\033[0;31m'
GREEN='\033[0;32m'
BLUE='\033[0;34m'
YELLOW='\033[1;33m'
CYAN='\033[0;36m'
NC='\033[0m'

# Run `docker compose` against this project's compose file, forwarding every
# argument unchanged.
dc() {
    local compose_opts=(-f "$COMPOSE_FILE")
    docker compose "${compose_opts[@]}" "$@"
}

# Print the startup banner, framed by one blank line above and below.
print_banner() {
    # Quoted delimiter: the banner is emitted verbatim.
    cat <<'BANNER'

╔══════════════════════════════════════════════╗
║   Nanobot + DeepCode  一键启动脚本          ║
║   飞书 <-> Nanobot <-> DeepCode             ║
╚══════════════════════════════════════════════╝

BANNER
}

# ============ Check the Docker environment ============
# Exit with status 1 unless the docker CLI is on PATH and `docker info` succeeds.
check_docker() {
    echo -e "${BLUE}[1/5] 检查 Docker 环境...${NC}"

    # The CLI must be installed ...
    command -v docker >/dev/null 2>&1 || {
        echo -e "${RED}❌ 未检测到 Docker，请先安装 Docker Desktop${NC}"
        echo "   下载地址: https://www.docker.com/products/docker-desktop"
        exit 1
    }

    # ... and `docker info` must succeed.
    docker info >/dev/null 2>&1 || {
        echo -e "${RED}❌ Docker 服务未运行，请先启动 Docker Desktop${NC}"
        exit 1
    }

    echo -e "${GREEN}   ✓ Docker 环境正常${NC}"
}

# ============ Check the DeepCode configuration files ============
# Require mcp_agent.config.yaml and mcp_agent.secrets.yaml in the project root.
# A missing secrets file is created from the .example template when one exists;
# the script then exits with status 1 so the user can fill in the API key.
check_deepcode_config() {
    local config_file="$PROJECT_ROOT/mcp_agent.config.yaml"
    local secrets_file="$PROJECT_ROOT/mcp_agent.secrets.yaml"
    local secrets_template="$PROJECT_ROOT/mcp_agent.secrets.yaml.example"

    echo -e "${BLUE}[2/5] 检查 DeepCode 配置文件...${NC}"

    # mcp_agent.config.yaml
    if [ ! -f "$config_file" ]; then
        echo -e "${RED}   ❌ 缺少 mcp_agent.config.yaml${NC}"
        echo -e "      请确保项目根目录下存在 mcp_agent.config.yaml"
        exit 1
    fi
    echo -e "${GREEN}   ✓ mcp_agent.config.yaml${NC}"

    # mcp_agent.secrets.yaml
    if [ ! -f "$secrets_file" ]; then
        if [ ! -f "$secrets_template" ]; then
            echo -e "${RED}   ❌ 缺少 mcp_agent.secrets.yaml 且无模板文件${NC}"
            exit 1
        fi
        echo -e "${YELLOW}   ⚠ 未找到 mcp_agent.secrets.yaml，从模板创建...${NC}"
        cp "$secrets_template" "$secrets_file"
        echo -e "${YELLOW}   ⚡ 请编辑 mcp_agent.secrets.yaml 填入你的 API Key，然后重新运行${NC}"
        echo -e "      文件路径: $PROJECT_ROOT/mcp_agent.secrets.yaml"
        exit 1
    fi
    echo -e "${GREEN}   ✓ mcp_agent.secrets.yaml${NC}"
}

# ============ Check the Nanobot configuration file ============
# Require nanobot_config.json in the project root. A missing file is created
# from the .example template when one exists; the script then exits with
# status 1 so the user can edit it. If the Feishu app id is still the template
# placeholder, the user is asked whether to continue anyway.
check_nanobot_config() {
    local config_file="$PROJECT_ROOT/nanobot_config.json"
    local config_template="$PROJECT_ROOT/nanobot_config.json.example"

    echo -e "${BLUE}[3/5] 检查 Nanobot 配置文件 (飞书等渠道)...${NC}"

    if [ ! -f "$config_file" ]; then
        if [ ! -f "$config_template" ]; then
            echo -e "${RED}   ❌ 缺少 nanobot_config.json 且无模板文件${NC}"
            exit 1
        fi
        echo -e "${YELLOW}   ⚠ 未找到 nanobot_config.json，从模板创建...${NC}"
        cp "$config_template" "$config_file"
        echo -e "${YELLOW}   ⚡ 请编辑 nanobot_config.json 填入以下信息后重新运行:${NC}"
        echo -e "      - 飞书 appId 和 appSecret"
        echo -e "      - LLM Provider API Key (如 OpenRouter)"
        echo -e "      文件路径: $PROJECT_ROOT/nanobot_config.json"
        exit 1
    fi

    # Check whether the Feishu settings are still the template placeholder.
    if grep -q '"your_feishu_app_id"' "$config_file" 2>/dev/null; then
        echo -e "${YELLOW}   ⚠ nanobot_config.json 中飞书配置仍为占位符${NC}"
        echo -e "      请编辑 $PROJECT_ROOT/nanobot_config.json"
        echo -e "      填入真实的 appId 和 appSecret"
        echo ""
        read -p "   是否已配置好，继续启动? [y/N] " confirm
        # Anything other than a single y/Y aborts the launch.
        [[ "$confirm" =~ ^[Yy]$ ]] || exit 1
    fi

    echo -e "${GREEN}   ✓ nanobot_config.json${NC}"
}

# ============ Create the required directories ============
# Make sure deepcode_lab/, uploads/ and logs/ exist under the project root.
ensure_dirs() {
    local data_dirs=(
        "$PROJECT_ROOT/deepcode_lab"
        "$PROJECT_ROOT/uploads"
        "$PROJECT_ROOT/logs"
    )

    echo -e "${BLUE}[4/5] 检查数据目录...${NC}"
    mkdir -p "${data_dirs[@]}"
    echo -e "${GREEN}   ✓ deepcode_lab/ uploads/ logs/ 已就绪${NC}"
}

# ============ Check for and build the Docker images ============
# Decide whether `docker compose up` needs --build and store the answer in the
# global BUILD_FLAG ("--build" or empty). A build is requested when FORCE_BUILD
# is true, or when no local image repository name contains "deepcode" or
# "nanobot".
check_and_build() {
    echo -e "${BLUE}[5/5] 检查 Docker 镜像...${NC}"

    local deepcode_missing=false
    local nanobot_missing=false

    # Does a deepcode image exist? (substring match on repository names)
    docker images --format '{{.Repository}}' | grep -q "deepcode" || deepcode_missing=true

    # Does a nanobot image exist?
    docker images --format '{{.Repository}}' | grep -q "nanobot" || nanobot_missing=true

    if [ "$FORCE_BUILD" = true ]; then
        echo -e "${YELLOW}   强制重新构建所有镜像...${NC}"
        BUILD_FLAG="--build"
        return 0
    fi

    if [ "$deepcode_missing" = false ] && [ "$nanobot_missing" = false ]; then
        echo -e "${GREEN}   ✓ deepcode 镜像已存在，跳过构建${NC}"
        echo -e "${GREEN}   ✓ nanobot 镜像已存在，跳过构建${NC}"
        BUILD_FLAG=""
        return 0
    fi

    # At least one image is missing: report which ones and request a build.
    echo -e "${YELLOW}   检测到缺少镜像，首次构建中...${NC}"
    if [ "$deepcode_missing" = true ]; then
        echo -e "${YELLOW}   - deepcode 镜像需要构建${NC}"
    fi
    if [ "$nanobot_missing" = true ]; then
        echo -e "${YELLOW}   - nanobot 镜像需要构建${NC}"
    fi
    BUILD_FLAG="--build"
}

# ============ Start the services ============
# Run `docker compose up` with the build/detach flags chosen earlier. In
# detached mode, poll the DeepCode health endpoint up to 30 times, two seconds
# apart, and print the access information once it answers.
start_services() {
    echo ""
    echo -e "${BLUE}🚀 启动 DeepCode + Nanobot 服务...${NC}"
    echo ""

    # Both flags are left unquoted on purpose: an empty value must add no argument.
    dc up $BUILD_FLAG $DETACH_FLAG

    # Without a detach flag there is nothing to wait for once `up` has returned.
    [ -n "$DETACH_FLAG" ] || return 0

    echo ""
    echo -e "${YELLOW}⏳ 等待服务启动...${NC}"
    local attempt
    for attempt in {1..30}; do
        if ! curl -sf http://localhost:8000/health > /dev/null 2>&1; then
            sleep 2
            continue
        fi

        echo ""
        echo "╔══════════════════════════════════════════════╗"
        echo -e "║  ${GREEN}✓ DeepCode + Nanobot 已启动!${NC}               ║"
        echo "╠══════════════════════════════════════════════╣"
        echo "║                                              ║"
        echo "║  DeepCode API:  http://localhost:8000        ║"
        echo "║  DeepCode Docs: http://localhost:8000/docs   ║"
        echo "║  Nanobot 网关:  http://localhost:18790       ║"
        echo "║                                              ║"
        echo "║  飞书机器人已通过 WebSocket 长连接接入       ║"
        echo "║  现在可以在飞书中与机器人对话了!             ║"
        echo "║                                              ║"
        echo -e "║  查看日志: ${CYAN}$0 logs${NC}                       ║"
        echo -e "║  停止服务: ${CYAN}$0 stop${NC}                       ║"
        echo "╚══════════════════════════════════════════════╝"
        echo ""
        return 0
    done

    # The health endpoint never answered within the polling window.
    echo -e "${YELLOW}⚠ 服务仍在启动中，请稍后检查${NC}"
    echo -e "   使用 ${CYAN}$0 logs${NC} 查看启动日志"
}

# ============ Help text ============
# Print the supported options and a few example invocations to stdout.
usage() {
    # Unquoted delimiter so that $0 expands to the script name.
    cat <<HELP
用法: $0 [选项]

选项:
  (无参数)      检查环境并启动所有服务 (前台运行)
  -d, --detach  后台运行
  --build       强制重新构建 Docker 镜像
  stop          停止所有服务
  restart       重启所有服务
  logs          查看实时日志
  status        查看服务状态
  clean         停止并删除容器和镜像
  -h, --help    显示帮助信息

示例:
  $0              # 首次运行: 检查配置 → 构建镜像 → 启动
  $0              # 再次运行: 跳过构建 → 直接启动
  $0 -d           # 后台启动
  $0 --build      # 强制重新构建后启动
  $0 stop         # 停止服务
  $0 logs         # 查看日志
HELP
}

# ============ Parse the command-line arguments ============
# Defaults: start the services in the foreground without forcing a rebuild.
ACTION="up"
BUILD_FLAG=""
DETACH_FLAG=""
FORCE_BUILD=false

while [[ $# -gt 0 ]]; do
    case "$1" in
        --build)
            FORCE_BUILD=true
            ;;
        -d|--detach)
            DETACH_FLAG="-d"
            ;;
        stop|restart|logs|status|clean)
            # The sub-command word doubles as the action name.
            ACTION="$1"
            ;;
        -h|--help)
            usage
            exit 0
            ;;
        *)
            echo -e "${RED}未知参数: $1${NC}"
            usage
            exit 1
            ;;
    esac
    shift
done

# ============ Main flow ============
# Dispatch on the action selected during argument parsing.
case "$ACTION" in
    up)
        # Full startup: run every check, then bring the stack up.
        print_banner
        check_docker
        check_deepcode_config
        check_nanobot_config
        ensure_dirs
        check_and_build
        start_services
        ;;

    stop)
        check_docker
        echo -e "${BLUE}🛑 停止 DeepCode + Nanobot 服务...${NC}"
        dc down
        echo -e "${GREEN}✓ 所有服务已停止${NC}"
        ;;

    restart)
        # Tear down first, re-run the checks, then start detached.
        check_docker
        echo -e "${BLUE}🔄 重启 DeepCode + Nanobot 服务...${NC}"
        dc down
        check_deepcode_config
        check_nanobot_config
        ensure_dirs
        check_and_build
        dc up -d $BUILD_FLAG
        echo -e "${GREEN}✓ 服务已重启${NC}"
        echo -e "   DeepCode: http://localhost:8000"
        echo -e "   Nanobot:  http://localhost:18790"
        ;;

    logs)
        check_docker
        echo -e "${BLUE}📋 服务日志 (Ctrl+C 退出):${NC}"
        echo ""
        dc logs -f
        ;;

    status)
        check_docker
        echo -e "${BLUE}📊 服务状态:${NC}"
        echo ""
        dc ps
        echo ""
        # DeepCode health check
        if ! curl -sf http://localhost:8000/health > /dev/null 2>&1; then
            echo -e "${YELLOW}⚠ DeepCode 未响应${NC}"
        else
            echo -e "${GREEN}✓ DeepCode 运行正常 (http://localhost:8000)${NC}"
        fi
        # Nanobot port check: an HTTP answer or merely an open port both count.
        if curl -sf http://localhost:18790 > /dev/null 2>&1 || \
           nc -z localhost 18790 2>/dev/null; then
            echo -e "${GREEN}✓ Nanobot 网关运行中 (http://localhost:18790)${NC}"
        else
            echo -e "${YELLOW}⚠ Nanobot 网关未响应${NC}"
        fi
        ;;

    clean)
        check_docker
        echo -e "${YELLOW}⚠ 即将停止并删除 DeepCode + Nanobot 容器和镜像${NC}"
        echo -e "${YELLOW}  (数据目录 deepcode_lab/, uploads/, logs/ 不会被删除)${NC}"
        read -p "确认? [y/N] " confirm
        # Only a single y/Y confirms; anything else cancels.
        if [[ ! "$confirm" =~ ^[Yy]$ ]]; then
            echo "已取消"
        else
            dc down --rmi local --remove-orphans -v
            echo -e "${GREEN}✓ 已清理完成${NC}"
        fi
        ;;
esac


================================================
FILE: nanobot/workspace/AGENTS.md
================================================
# Agent Instructions

You are a helpful AI assistant. Be concise, accurate, and friendly.

## Guidelines

- Always explain what you're doing before taking actions
- Ask for clarification when the request is ambiguous
- Use tools to help accomplish tasks
- Remember important information in your memory files

## Tools Available

You have access to:
- File operations (read, write, edit, list)
- Shell commands (exec)
- Web access (search, fetch)
- Messaging (message)
- Background tasks (spawn)

## Memory

- Use `memory/` directory for daily notes
- Use `MEMORY.md` for long-term information

## Scheduled Reminders

When the user asks for a reminder at a specific time, use `exec` to run:
```
nanobot cron add --name "reminder" --message "Your message" --at "YYYY-MM-DDTHH:MM:SS" --deliver --to "USER_ID" --channel "CHANNEL"
```
Get USER_ID and CHANNEL from the current session (e.g., `8281248569` and `telegram` from `telegram:8281248569`).

**Do NOT just write reminders to MEMORY.md** — that won't trigger actual notifications.

## Heartbeat Tasks

`HEARTBEAT.md` is checked every 30 minutes. You can manage periodic tasks by editing this file:

- **Add a task**: Use `edit_file` to append new tasks to `HEARTBEAT.md`
- **Remove a task**: Use `edit_file` to remove completed or obsolete tasks
- **Rewrite tasks**: Use `write_file` to completely rewrite the task list

Task format examples:
```
- [ ] Check calendar and remind of upcoming events
- [ ] Scan inbox for urgent emails
- [ ] Check weather forecast for today
```

When the user asks you to add a recurring/periodic task, update `HEARTBEAT.md` instead of creating a one-time reminder. Keep the file small to minimize token usage.


================================================
FILE: nanobot/workspace/HEARTBEAT.md
================================================
# Heartbeat Tasks

This file is checked every 30 minutes by your nanobot agent.
Add tasks below that you want the agent to work on periodically.

If this file has no tasks (only headers and comments), the agent will skip the heartbeat.

## Active Tasks

<!-- Add your periodic tasks below this line -->


## Completed

<!-- Move completed tasks here or delete them -->


================================================
FILE: nanobot/workspace/SOUL.md
================================================
# Soul

I am nanobot 🐈, a personal AI assistant.

## Personality

- Helpful and friendly
- Concise and to the point
- Curious and eager to learn

## Values

- Accuracy over speed
- User privacy and safety
- Transparency in actions

## Communication Style

- Be clear and direct
- Explain reasoning when helpful
- Ask clarifying questions when needed


================================================
FILE: nanobot/workspace/TOOLS.md
================================================
# Available Tools

This document describes the tools available to nanobot.

## File Operations

### read_file
Read the contents of a file.
```
read_file(path: str) -> str
```

### write_file
Write content to a file (creates parent directories if needed).
```
write_file(path: str, content: str) -> str
```

### edit_file
Edit a file by replacing specific text.
```
edit_file(path: str, old_text: str, new_text: str) -> str
```

### list_dir
List contents of a directory.
```
list_dir(path: str) -> str
```

## Shell Execution

### exec
Execute a shell command and return output.
```
exec(command: str, working_dir: str = None) -> str
```

**Safety Notes:**
- Commands have a configurable timeout (default 60s)
- Dangerous commands are blocked (rm -rf, format, dd, shutdown, etc.)
- Output is truncated at 10,000 characters
- Optional `restrictToWorkspace` config to limit paths

## Web Access

### web_search
Search the web using Brave Search API.
```
web_search(query: str, count: int = 5) -> str
```

Returns search results with titles, URLs, and snippets. Requires `tools.web.search.apiKey` in config.

### web_fetch
Fetch and extract main content from a URL.
```
web_fetch(url: str, extractMode: str = "markdown", maxChars: int = 50000) -> str
```

**Notes:**
- Content is extracted using readability
- Supports markdown or plain text extraction
- Output is truncated at 50,000 characters by default

## Communication

### message
Send a message to the user (used internally).
```
message(content: str, channel: str = None, chat_id: str = None) -> str
```

## Background Tasks

### spawn
Spawn a subagent to handle a task in the background.
```
spawn(task: str, label: str = None) -> str
```

Use for complex or time-consuming tasks that can run independently. The subagent will complete the task and report back when done.

## Scheduled Reminders (Cron)

Use the `exec` tool to create scheduled reminders with `nanobot cron add`:

### Set a recurring reminder
```bash
# Every day at 9am
nanobot cron add --name "morning" --message "Good morning! ☀️" --cron "0 9 * * *"

# Every 2 hours
nanobot cron add --name "water" --message "Drink water! 💧" --every 7200
```

### Set a one-time reminder
```bash
# At a specific time (ISO format)
nanobot cron add --name "meeting" --message "Meeting starts now!" --at "2025-01-31T15:00:00"
```

### Manage reminders
```bash
nanobot cron list              # List all jobs
nanobot cron remove <job_id>   # Remove a job
```

## Heartbeat Task Management

The `HEARTBEAT.md` file in the workspace is checked every 30 minutes.
Use file operations to manage periodic tasks:

### Add a heartbeat task
```python
# Append a new task
edit_file(
    path="HEARTBEAT.md",
    old_text="## Completed",
    new_text="- [ ] New periodic task here\n\n## Completed"
)
```

### Remove a heartbeat task
```python
# Remove a specific task
edit_file(
    path="HEARTBEAT.md",
    old_text="- [ ] Task to remove\n",
    new_text=""
)
```

### Rewrite all tasks
```python
# Replace the entire file
write_file(
    path="HEARTBEAT.md",
    content="# Heartbeat Tasks\n\n- [ ] Task 1\n- [ ] Task 2\n"
)
```

---

## Adding Custom Tools

To add custom tools:
1. Create a class that extends `Tool` in `nanobot/agent/tools/`
2. Implement `name`, `description`, `parameters`, and `execute`
3. Register it in `AgentLoop._register_default_tools()`


================================================
FILE: nanobot/workspace/USER.md
================================================
# User Profile

Information about the user to help personalize interactions.

## Basic Information

- **Name**: (your name)
- **Timezone**: (your timezone, e.g., UTC+8)
- **Language**: (preferred language)

## Preferences

### Communication Style

- [ ] Casual
- [ ] Professional
- [ ] Technical

### Response Length

- [ ] Brief and concise
- [ ] Detailed explanations
- [ ] Adaptive based on question

### Technical Level

- [ ] Beginner
- [ ] Intermediate
- [ ] Expert

## Work Context

- **Primary Role**: (your role, e.g., developer, researcher)
- **Main Projects**: (what you're working on)
- **Tools You Use**: (IDEs, languages, frameworks)

## Topics of Interest

-
-
-

## Special Instructions

(Any specific instructions for how the assistant should behave)

---

*Edit this file to customize nanobot's behavior for your needs.*


================================================
FILE: nanobot/workspace/memory/MEMORY.md
================================================
# Long-term Memory

This file stores important information that should persist across sessions.

## User Information

(Important facts about the user)

## Preferences

(User preferences learned over time)

## Project Context

(Information about ongoing projects)

## Important Notes

(Things to remember)

---

*This file is automatically updated by nanobot when important information should be remembered.*


================================================
FILE: nanobot_config.json.example
================================================
{
  "_comment": "nanobot configuration for DeepCode integration. Copy to nanobot_config.json and fill in your keys.",
  "channels": {
    "feishu": {
      "enabled": true,
      "appId": "your_feishu_app_id",
      "appSecret": "your_feishu_app_secret",
      "encryptKey": "",
      "verificationToken": "",
      "allowFrom": []
    },
    "telegram": {
      "enabled": false,
      "token": "your_telegram_bot_token",
      "allowFrom": []
    },
    "discord": {
      "enabled": false,
      "token": "your_discord_bot_token",
      "allowFrom": []
    }
  },
  "providers": {
    "openrouter": {
      "apiKey": "sk-or-v1-your_openrouter_key"
    }
  },
  "agents": {
    "defaults": {
      "model": "anthropic/claude-sonnet-4-20250514",
      "workspace": "/root/.nanobot/workspace",
      "maxTokens": 8192,
      "temperature": 0.7
    }
  },
  "gateway": {
    "host": "0.0.0.0",
    "port": 18790
  },
  "tools": {
    "web": {
      "search": {
        "apiKey": "your_brave_search_api_key",
        "maxResults": 5
      }
    },
    "exec": {
      "timeout": 120
    },
    "restrictToWorkspace": false
  }
}


================================================
FILE: new_ui/README.md
================================================
# DeepCode New UI

Modern, intelligent UI for DeepCode - AI-powered code generation platform.

## Technology Stack

- **Backend**: FastAPI (Python)
- **Frontend**: React 18 + TypeScript + Vite
- **Styling**: Tailwind CSS + shadcn/ui
- **State Management**: Zustand
- **Real-time Communication**: WebSocket
- **Workflow Visualization**: React Flow
- **Code Display**: Monaco Editor

## Features

### Intelligent Features

1. **Real-time Streaming Output** - Watch code generation in real-time, like ChatGPT
2. **Smart Context Awareness** - Remembers conversation history, provides intelligent suggestions
3. **Adaptive Interface** - Layout adjusts based on task type
4. **Visual Workflow** - Draggable flow-chart style task visualization

### Design Style

- Clean, modern design inspired by Notion/Linear
- Light theme with blue accent colors
- Inter font for text, JetBrains Mono for code

## Project Structure

```
new_ui/
├── backend/                    # FastAPI Backend
│   ├── main.py                # Entry point
│   ├── config.py              # Configuration
│   ├── api/
│   │   ├── routes/            # REST API endpoints
│   │   └── websockets/        # WebSocket handlers
│   ├── services/              # Business logic
│   └── models/                # Pydantic models
│
├── frontend/                   # React Frontend
│   ├── src/
│   │   ├── components/        # React components
│   │   ├── pages/             # Page components
│   │   ├── hooks/             # Custom hooks
│   │   ├── stores/            # Zustand stores
│   │   ├── services/          # API client
│   │   └── types/             # TypeScript types
│   ├── package.json
│   └── vite.config.ts
│
└── scripts/
    ├── start_dev.sh           # Development startup
    └── build.sh               # Production build
```

## Quick Start

### Prerequisites

- Python 3.10+
- Node.js 18+
- npm or yarn

### Development

1. **Start both backend and frontend:**

```bash
cd new_ui
chmod +x scripts/start_dev.sh
./scripts/start_dev.sh
```

2. **Or start separately:**

Backend:
```bash
cd new_ui/backend
pip install -r requirements.txt  # First time only
uvicorn main:app --reload --port 8000
```

Frontend:
```bash
cd new_ui/frontend
npm install  # First time only
npm run dev
```

3. **Access the application:**
   - Frontend: http://localhost:5173
   - Backend API: http://localhost:8000
   - API Documentation: http://localhost:8000/docs

### Production Build

```bash
cd new_ui
chmod +x scripts/build.sh
./scripts/build.sh
```

## API Endpoints

### REST API

| Method | Endpoint | Description |
|--------|----------|-------------|
| POST | `/api/v1/workflows/paper-to-code` | Start paper-to-code workflow |
| POST | `/api/v1/workflows/chat-planning` | Start chat-based planning |
| GET | `/api/v1/workflows/status/{task_id}` | Get workflow status |
| POST | `/api/v1/requirements/questions` | Generate guiding questions |
| POST | `/api/v1/requirements/summarize` | Summarize requirements |
| POST | `/api/v1/files/upload` | Upload file |
| GET | `/api/v1/config/settings` | Get settings |

### WebSocket Endpoints

| Endpoint | Description |
|----------|-------------|
| `/ws/workflow/{task_id}` | Real-time workflow progress |
| `/ws/code-stream/{task_id}` | Streaming code output |
| `/ws/logs/{session_id}` | Live log streaming |

## Configuration

The new UI reads configuration from the existing DeepCode config files:

- `mcp_agent.config.yaml` - LLM provider, models, MCP server settings
- `mcp_agent.secrets.yaml` - API keys

## Integration

The new UI integrates with existing DeepCode components:

- `workflows/agent_orchestration_engine.py` - Core workflow execution
- `workflows/agents/` - Specialized agents
- `utils/llm_utils.py` - LLM provider management

## Browser Support

- Chrome (recommended)
- Firefox
- Safari
- Edge

## License

MIT License - see main DeepCode license.


================================================
FILE: new_ui/backend/__init__.py
================================================
"""
DeepCode New UI Backend
FastAPI-based backend for the new DeepCode UI
"""

__version__ = "1.0.0"


================================================
FILE: new_ui/backend/api/__init__.py
================================================
"""API package"""


================================================
FILE: new_ui/backend/api/routes/__init__.py
================================================
"""API Routes"""


================================================
FILE: new_ui/backend/api/routes/config.py
================================================
"""
Configuration API Routes
Handles LLM provider and settings management
"""

from fastapi import APIRouter, HTTPException
import yaml

from settings import (
    load_mcp_config,
    load_secrets,
    get_llm_provider,
    get_llm_models,
    is_indexing_enabled,
    CONFIG_PATH,
)
from models.requests import LLMProviderUpdateRequest
from models.responses import ConfigResponse, SettingsResponse


# Router on which this module's configuration endpoints are registered.
router = APIRouter()


@router.get("/settings", response_model=SettingsResponse)
async def get_settings():
    """Report the active LLM provider, its models and related feature flags.

    Returns:
        SettingsResponse holding the current provider, the models resolved
        for that provider, the indexing flag, and the
        ``document_segmentation`` section of the MCP config (an empty dict
        when the section is absent).
    """
    mcp_config = load_mcp_config()
    active_provider = get_llm_provider()

    return SettingsResponse(
        llm_provider=active_provider,
        models=get_llm_models(active_provider),
        indexing_enabled=is_indexing_enabled(),
        document_segmentation=mcp_config.get("document_segmentation", {}),
    )


@router.get("/llm-providers", response_model=ConfigResponse)
async def get_llm_providers():
    """Get available LLM providers and their configurations.

    A provider counts as available when the secrets data holds a non-empty
    ``api_key`` for it.

    Returns:
        ConfigResponse with the current provider, the list of providers that
        have an API key, the current provider's models and the indexing flag.
    """
    secrets = load_secrets() or {}

    # ``secrets.get(name) or {}`` also covers a provider section that is
    # present but empty (parsed as None), which would otherwise raise
    # AttributeError on the chained ``.get``.
    available_providers = [
        provider
        for provider in ("google", "anthropic", "openai")
        if (secrets.get(provider) or {}).get("api_key")
    ]

    current_provider = get_llm_provider()
    models = get_llm_models(current_provider)

    return ConfigResponse(
        llm_provider=current_provider,
        available_providers=available_providers,
        models=models,
        indexing_enabled=is_indexing_enabled(),
    )


@router.put("/llm-provider")
async def set_llm_provider(request: LLMProviderUpdateRequest):
    """Update the preferred LLM provider.

    The provider is accepted only if the secrets data contains an API key for
    it; the choice is then written to the ``llm_provider`` key of the config
    file at ``CONFIG_PATH``.

    Returns:
        Dict with ``status``, a human-readable ``message`` and ``provider``.

    Raises:
        HTTPException: 400 when the provider has no API key configured,
            500 when the configuration cannot be loaded or written.
    """
    secrets = load_secrets() or {}

    # Verify provider has an API key. ``or {}`` guards against a provider
    # section that exists but is empty (None).
    if not (secrets.get(request.provider) or {}).get("api_key"):
        raise HTTPException(
            status_code=400,
            detail=f"Provider '{request.provider}' does not have an API key configured",
        )

    # Update config file
    try:
        config = load_mcp_config()
        config["llm_provider"] = request.provider

        with open(CONFIG_PATH, "w", encoding="utf-8") as f:
            # sort_keys=False keeps the existing key order instead of
            # rewriting the user's config alphabetically.
            yaml.dump(config, f, default_flow_style=False, sort_keys=False)

    except Exception as e:
        # Boundary handler: report any load/write failure as a 500 while
        # keeping the original exception as the cause.
        raise HTTPException(
            status_code=500,
            detail=f"Failed to update configuration: {str(e)}",
        ) from e

    return {
        "status": "success",
        "message": f"LLM provider updated to '{request.provider}'",
        "provider": request.provider,
    }


================================================
FILE: new_ui/backend/api/routes/files.py
================================================
"""
Files API Routes
Handles file upload and download operations
"""

import uuid
import shutil
from pathlib import Path

from fastapi import APIRouter, File, UploadFile, HTTPException
from fastapi.responses import FileResponse

from settings import settings


# Router on which this module's file endpoints are registered.
router = APIRouter()

# In-memory file registry (in production, use a database).
# Maps a generated file ID to the metadata dict recorded by upload_file;
# entries live only in this process's memory.
_file_registry: dict = {}


@router.post("/upload")
async def upload_file(file: UploadFile = File(...)):
    """Upload a file (PDF, markdown, etc.).

    The upload is stored under ``settings.upload_dir`` using a generated
    UUID-based name (the client-supplied name is never used as a path) and
    recorded in the in-memory registry.

    Returns:
        Dict with ``file_id``, the original ``filename``, the stored ``path``
        and the ``size`` in bytes.

    Raises:
        HTTPException: 400 for a disallowed extension or an upload larger
            than ``settings.max_upload_size``; 500 when saving fails.
    """
    # Validate file type. The client may omit the filename entirely, in which
    # case the extension is empty and the upload is rejected below.
    allowed_types = {".pdf", ".md", ".txt", ".markdown"}
    file_ext = Path(file.filename or "").suffix.lower()

    if file_ext not in allowed_types:
        raise HTTPException(
            status_code=400,
            detail=f"File type '{file_ext}' not allowed. Allowed: {', '.join(sorted(allowed_types))}",
        )

    # Generate unique file ID
    file_id = str(uuid.uuid4())
    safe_filename = f"{file_id}{file_ext}"
    file_path = Path(settings.upload_dir) / safe_filename

    max_size = settings.max_upload_size
    chunk_size = 1024 * 1024
    file_size = 0

    try:
        # Ensure upload directory exists
        file_path.parent.mkdir(parents=True, exist_ok=True)

        # Stream to disk in chunks and enforce the limit while writing, so an
        # oversized upload is rejected before it is stored in full.
        with open(file_path, "wb") as buffer:
            while True:
                chunk = await file.read(chunk_size)
                if not chunk:
                    break
                file_size += len(chunk)
                if file_size > max_size:
                    raise HTTPException(
                        status_code=400,
                        detail=f"File size exceeds limit of {settings.max_upload_size // (1024*1024)}MB",
                    )
                buffer.write(chunk)

    except HTTPException:
        # Drop the partially written (oversized) file.
        file_path.unlink(missing_ok=True)
        raise
    except Exception as e:
        # Do not leave a truncated file behind when saving fails.
        file_path.unlink(missing_ok=True)
        raise HTTPException(
            status_code=500,
            detail=f"Failed to upload file: {str(e)}",
        ) from e

    # Register file
    _file_registry[file_id] = {
        "id": file_id,
        "original_name": file.filename,
        "path": str(file_path),
        "size": file_size,
        "type": file_ext,
    }

    return {
        "file_id": file_id,
        "filename": file.filename,
        "path": str(file_path),
        "size": file_size,
    }


@router.get("/download/{file_id}")
async def download_file(file_id: str):
    """Send a previously uploaded file back to the client.

    The file is looked up in the in-memory registry and returned under its
    original name as ``application/octet-stream``.

    Raises:
        HTTPException: 404 when the ID is unknown or the stored file is gone.
    """
    record = _file_registry.get(file_id)
    if not record:
        raise HTTPException(status_code=404, detail="File not found")

    stored_path = Path(record["path"])
    if stored_path.exists():
        return FileResponse(
            path=str(stored_path),
            filename=record["original_name"],
            media_type="application/octet-stream",
        )

    raise HTTPException(status_code=404, detail="File no longer exists")


@router.delete("/delete/{file_id}")
async def delete_file(file_id: str):
    """Delete an uploaded file.

    Removes the stored file (if it still exists) and its registry entry.

    Returns:
        Dict with ``status`` set to ``"deleted"`` and the ``file_id``.

    Raises:
        HTTPException: 404 when the ID is unknown, 500 when the file cannot
            be removed from disk.
    """
    file_info = _file_registry.get(file_id)

    if not file_info:
        raise HTTPException(status_code=404, detail="File not found")

    try:
        # missing_ok avoids the exists()/unlink() race: a file that vanished
        # in the meantime is simply treated as already deleted.
        Path(file_info["path"]).unlink(missing_ok=True)
    except OSError as e:
        raise HTTPException(
            status_code=500,
            detail=f"Failed to delete file: {str(e)}",
        ) from e

    # pop() tolerates a concurrent request having removed the entry already.
    _file_registry.pop(file_id, None)

    return {"status": "deleted", "file_id": file_id}


@router.get("/info/{file_id}")
async def get_file_info(file_id: str):
    """Return the registry record stored for ``file_id``.

    Raises:
        HTTPException: 404 when no record exists for the ID.
    """
    record = _file_registry.get(file_id)
    if record:
        return record

    raise HTTPException(status_code=404, detail="File not found")


================================================
FILE: new_ui/backend/api/routes/requirements.py
================================================
"""
Requirements API Routes
Handles requirement analysis operations
"""

from fastapi import APIRouter, HTTPException

from services.requirement_service import requirement_service
from models.requests import (
    GenerateQuestionsRequest,
    SummarizeRequirementsRequest,
    ModifyRequirementsRequest,
)
from models.responses import QuestionsResponse, RequirementsSummaryResponse


# Router on which this module's requirement endpoints are registered.
router = APIRouter()


@router.post("/questions", response_model=QuestionsResponse)
async def generate_questions(request: GenerateQuestionsRequest):
    """Produce guiding questions for the user's initial requirement.

    Delegates to ``requirement_service.generate_questions`` and wraps its
    ``questions`` in a QuestionsResponse.

    Raises:
        HTTPException: 500 when the service reports a non-success status;
            the detail is the service's ``error`` text if provided.
    """
    outcome = await requirement_service.generate_questions(request.initial_requirement)

    if outcome["status"] == "success":
        return QuestionsResponse(
            questions=outcome["questions"],
            status="success",
        )

    raise HTTPException(
        status_code=500,
        detail=outcome.get("error", "Failed to generate questions"),
    )


@router.post("/summarize", response_model=RequirementsSummaryResponse)
async def summarize_requirements(request: SummarizeRequirementsRequest):
    """Condense the initial requirement and the user's answers into a summary.

    Delegates to ``requirement_service.summarize_requirements`` and wraps its
    ``summary`` in a RequirementsSummaryResponse.

    Raises:
        HTTPException: 500 when the service reports a non-success status;
            the detail is the service's ``error`` text if provided.
    """
    outcome = await requirement_service.summarize_requirements(
        request.initial_requirement,
        request.user_answers,
    )

    if outcome["status"] == "success":
        return RequirementsSummaryResponse(
            summary=outcome["summary"],
            status="success",
        )

    raise HTTPException(
        status_code=500,
        detail=outcome.get("error", "Failed to summarize requirements"),
    )


@router.put("/modify", response_model=RequirementsSummaryResponse)
async def modify_requirements(request: ModifyRequirementsRequest):
    """Revise the current requirements according to the user's feedback.

    Delegates to ``requirement_service.modify_requirements`` and wraps its
    ``summary`` in a RequirementsSummaryResponse.

    Raises:
        HTTPException: 500 when the service reports a non-success status;
            the detail is the service's ``error`` text if provided.
    """
    outcome = await requirement_service.modify_requirements(
        request.current_requirements,
        request.modification_feedback,
    )

    if outcome["status"] == "success":
        return RequirementsSummaryResponse(
            summary=outcome["summary"],
            status="success",
        )

    raise HTTPException(
        status_code=500,
        detail=outcome.get("error", "Failed to modify requirements"),
    )


================================================
FILE: new_ui/backend/api/routes/workflows.py
================================================
"""
Workflows API Routes
Handles paper-to-code and chat-based planning workflows
"""

from fastapi import APIRouter, BackgroundTasks, HTTPException

from services.workflow_service import workflow_service
from models.requests import (
    PaperToCodeRequest,
    ChatPlanningRequest,
    InteractionResponseRequest,
)
from models.responses import TaskResponse


# Router on which this module's workflow endpoints are registered.
router = APIRouter()


@router.post("/paper-to-code", response_model=TaskResponse)
async def start_paper_to_code(
    request: PaperToCodeRequest,
    background_tasks: BackgroundTasks,
):
    """
    Kick off a paper-to-code workflow.

    A task is created first, then the workflow is scheduled as a background
    task; the response carries the task ID so the caller can follow progress
    (e.g. via WebSocket).
    """
    task = workflow_service.create_task()

    # Positional arguments handed to the background workflow, in call order.
    job_args = (
        task.task_id,
        request.input_source,
        request.input_type,
        request.enable_indexing,
    )
    background_tasks.add_task(workflow_service.execute_paper_to_code, *job_args)

    return TaskResponse(
        task_id=task.task_id,
        status="started",
        message="Paper-to-code workflow started",
    )


@router.post("/chat-planning", response_model=TaskResponse)
async def start_chat_planning(
    request: ChatPlanningRequest,
    background_tasks: BackgroundTasks,
):
    """
    Kick off a chat-based planning workflow.

    A task is created first, then the workflow is scheduled as a background
    task; the response carries the task ID so the caller can follow progress
    (e.g. via WebSocket).
    """
    task = workflow_service.create_task()

    # Positional arguments handed to the background workflow, in call order.
    job_args = (
        task.task_id,
        request.requirements,
        request.enable_indexing,
    )
    background_tasks.add_task(workflow_service.execute_chat_planning, *job_args)

    return TaskResponse(
        task_id=task.task_id,
        status="started",
        message="Chat planning workflow started",
    )


@router.get("/status/{task_id}")
async def get_workflow_status(task_id: str):
    """Report the current state of a workflow task.

    Timestamps are returned as ISO-8601 strings (or None when unset). While
    the task is waiting for user input and has a pending interaction, that
    interaction is included under ``pending_interaction``.

    Raises:
        HTTPException: 404 when the task ID is unknown.
    """
    task = workflow_service.get_task(task_id)
    if not task:
        raise HTTPException(status_code=404, detail="Task not found")

    started = task.started_at.isoformat() if task.started_at else None
    finished = task.completed_at.isoformat() if task.completed_at else None

    payload = {
        "task_id": task.task_id,
        "status": task.status,
        "progress": task.progress,
        "message": task.message,
        "result": task.result,
        "error": task.error,
        "started_at": started,
        "completed_at": finished,
    }

    awaiting_user = task.status == "waiting_for_input" and task.pending_interaction
    if awaiting_user:
        payload["pending_interaction"] = task.pending_interaction

    return payload


@router.post("/cancel/{task_id}")
async def cancel_workflow(task_id: str):
    """Ask the workflow service to cancel a task.

    Raises:
        HTTPException: 400 when the service reports that the task could not
            be cancelled (unknown task or not cancellable).
    """
    if workflow_service.cancel_task(task_id):
        return {"status": "cancelled", "task_id": task_id}

    raise HTTPException(
        status_code=400,
        detail="Task not found or cannot be cancelled",
    )


@router.post("/respond/{task_id}")
async def respond_to_interaction(task_id: str, request: InteractionResponseRequest):
    """
    Submit user's response to a pending interaction.

    This is used for User-in-Loop functionality where the workflow
    pauses to ask the user for input (e.g., requirement questions,
    plan confirmation).

    Returns:
        Dict with ``status`` "ok", the ``task_id`` and the submitted ``action``.

    Raises:
        HTTPException: 404 for an unknown task; 400 when the task is not
            waiting for input or has no pending interaction; 501 when the
            workflow service has no plugin integration.
    """
    task = workflow_service.get_task(task_id)

    if not task:
        raise HTTPException(status_code=404, detail="Task not found")

    if task.status != "waiting_for_input":
        raise HTTPException(
            status_code=400,
            detail=f"Task is not waiting for input (current status: {task.status})",
        )

    # Check if plugin integration is available. getattr + None check also
    # covers an attribute that exists but was left as None, which a bare
    # hasattr() would let through and then crash on the method call.
    plugin_integration = getattr(workflow_service, "_plugin_integration", None)
    if plugin_integration is None:
        raise HTTPException(
            status_code=501, detail="User-in-Loop plugin system not enabled"
        )

    success = plugin_integration.submit_response(
        task_id=task_id,
        action=request.action,
        data=request.data,
        skipped=request.skipped,
    )

    if not success:
        raise HTTPException(
            status_code=400, detail="No pending interaction for this task"
        )

    return {
        "status": "ok",
        "task_id": task_id,
        "action": request.action,
    }


@router.get("/interaction/{task_id}")
async def get_pending_interaction(task_id: str):
    """
    Look up the interaction a task is currently waiting on, if any.

    The response always carries ``has_interaction``, ``task_id`` and
    ``status``; ``interaction`` is added only when the task is waiting for
    input and a pending interaction is recorded.
    """
    task = workflow_service.get_task(task_id)
    if not task:
        raise HTTPException(status_code=404, detail="Task not found")

    has_interaction = task.status == "waiting_for_input" and bool(
        task.pending_interaction
    )

    payload = {
        "has_interaction": has_interaction,
        "task_id": task_id,
        "status": task.status,
    }
    if has_interaction:
        payload["interaction"] = task.pending_interaction

    return payload


@router.get("/active")
async def get_active_tasks():
    """
    List the tasks the workflow service reports as active.

    Each entry carries the task's ID, status, progress, message and start
    time. Useful for recovering tasks after page refresh.
    """
    summaries = []
    for task in workflow_service.get_active_tasks():
        summaries.append(
            {
                "task_id": task.task_id,
                "status": task.status,
                "progress": task.progress,
                "message": task.message,
                "started_at": task.started_at,
            }
        )

    return {"tasks": summaries}


@router.get("/recent")
async def get_recent_tasks(limit: int = 10):
    """
    List recent tasks as returned by the workflow service.

    ``limit`` is passed straight to ``workflow_service.get_recent_tasks``.
    Each entry carries the task's ID, status, progress, message, result,
    error and start/completion times. Useful for task history.
    """
    summaries = []
    for task in workflow_service.get_recent_tasks(limit):
        summaries.append(
            {
                "task_id": task.task_id,
                "status": task.status,
                "progress": task.progress,
                "message": task.message,
                "result": task.result,
                "error": task.error,
                "started_at": task.started_at,
                "completed_at": task.completed_at,
            }
        )

    return {"tasks": summaries}


================================================
FILE: new_ui/backend/api/websockets/__init__.py
================================================
"""WebSocket handlers"""


================================================
FILE: new_ui/backend/api/websockets/code_stream_ws.py
================================================
"""
Code Stream WebSocket Handler
Provides real-time streaming of generated code
"""

import asyncio
from datetime import datetime
from fastapi import APIRouter, WebSocket, WebSocketDisconnect

from services.workflow_service import workflow_service


# Router on which this module's code-stream WebSocket endpoint is registered.
router = APIRouter()


@router.websocket("/code-stream/{task_id}")
async def code_stream_websocket(websocket: WebSocket, task_id: str):
    """
    WebSocket endpoint for real-time code streaming.

    Streams generated code as it's being written, similar to ChatGPT.
    Progress messages whose text contains "Creating file:" or "Writing:" are
    additionally turned into file_start/file_end events; a heartbeat is sent
    whenever no message arrives for 60 seconds. The connection is closed
    after a "complete" or "error" message has been forwarded.

    Message format:
    {
        "type": "code_chunk" | "file_start" | "file_end" | "complete",
        "task_id": str,
        "content": str,  # Code content for code_chunk
        "filename": str | null,  # For file_start/file_end
        "timestamp": str
    }
    """
    await websocket.accept()

    def timestamp() -> str:
        return datetime.utcnow().isoformat()

    async def send_file_event(event_type: str, filename: str) -> None:
        # Emit a file_start / file_end marker for ``filename``.
        await websocket.send_json(
            {
                "type": event_type,
                "task_id": task_id,
                "filename": filename,
                "timestamp": timestamp(),
            }
        )

    queue = None
    try:
        task = workflow_service.get_task(task_id)
        # Subscribe to get our own queue for this task
        queue = workflow_service.subscribe(task_id)

        # The whole handler, including this early exit, runs inside the
        # try/finally so the subscription is always released.
        if not task:
            await websocket.send_json(
                {
                    "type": "error",
                    "task_id": task_id,
                    "error": "Task not found",
                    "timestamp": timestamp(),
                }
            )
            await websocket.close()
            return

        if not queue:
            return

        # Track current file being streamed
        current_file = None

        while True:
            try:
                message = await asyncio.wait_for(queue.get(), timeout=60.0)
            except asyncio.TimeoutError:
                await websocket.send_json(
                    {
                        "type": "heartbeat",
                        "task_id": task_id,
                        "timestamp": timestamp(),
                    }
                )
                continue

            msg_type = message.get("type")

            # Transform progress messages into code stream format
            if msg_type == "progress":
                msg_text = message.get("message", "")

                # Detect file creation events
                if "Creating file:" in msg_text or "Writing:" in msg_text:
                    filename = msg_text.split(":")[-1].strip()
                    if current_file:
                        await send_file_event("file_end", current_file)
                    current_file = filename
                    await send_file_event("file_start", filename)

                # Forward progress message
                await websocket.send_json(
                    {
                        "type": "progress",
                        "task_id": task_id,
                        "progress": message.get("progress", 0),
                        "message": msg_text,
                        "timestamp": timestamp(),
                    }
                )

            elif msg_type == "code_chunk":
                # Direct code chunk forwarding
                await websocket.send_json(
                    {
                        "type": "code_chunk",
                        "task_id": task_id,
                        "content": message.get("content", ""),
                        "filename": message.get("filename"),
                        "timestamp": timestamp(),
                    }
                )

            elif msg_type in ("complete", "error"):
                print(
                    f"[CodeStreamWS] Workflow finished: task={task_id[:8]}... type={msg_type}"
                )
                if current_file:
                    await send_file_event("file_end", current_file)
                await websocket.send_json(message)
                # Wait a bit before closing to ensure frontend processes the message
                await asyncio.sleep(0.5)
                await websocket.close()
                break

    except WebSocketDisconnect:
        pass
    finally:
        # Unsubscribe from task updates
        if queue:
            workflow_service.unsubscribe(task_id, queue)


================================================
FILE: new_ui/backend/api/websockets/logs_ws.py
================================================
"""
Logs WebSocket Handler
Provides real-time log streaming
"""

import asyncio
import json
from datetime import datetime
from fastapi import APIRouter, WebSocket, WebSocketDisconnect

from settings import PROJECT_ROOT


# Router on which this module's log-streaming WebSocket endpoint is registered.
router = APIRouter()


def _newest_log_file(logs_dir):
    """Return the most recently modified ``*.jsonl`` file in ``logs_dir``, or None."""
    if not logs_dir.exists():
        return None

    candidates = []
    for path in logs_dir.glob("*.jsonl"):
        try:
            candidates.append((path.stat().st_mtime, path))
        except OSError:
            # File disappeared between glob() and stat(); ignore it.
            continue

    if not candidates:
        return None
    return max(candidates, key=lambda item: item[0])[1]


def _read_new_log_lines(log_path, position):
    """Read the complete, non-empty lines appended to ``log_path`` after byte ``position``.

    Returns ``(lines, new_position)``. A trailing line that is not yet
    newline-terminated is left unread so it is delivered whole on a later
    poll; a file that shrank below ``position`` is re-read from the start.
    """
    with open(log_path, "rb") as f:
        size = f.seek(0, 2)
        if size < position:
            position = 0
        f.seek(position)
        chunk = f.read()

    complete = chunk.rfind(b"\n") + 1
    if complete == 0:
        return [], position

    # errors="replace" keeps one badly encoded line from blocking the stream.
    text = chunk[:complete].decode("utf-8", errors="replace")
    lines = [line for line in (raw.strip() for raw in text.split("\n")) if line]
    return lines, position + complete


def _log_line_to_message(line):
    """Convert one log line into the WebSocket ``log`` message dict."""
    try:
        entry = json.loads(line)
    except json.JSONDecodeError:
        entry = None

    if isinstance(entry, dict):
        return {
            "type": "log",
            "level": entry.get("level", "INFO"),
            "message": entry.get("message", ""),
            "namespace": entry.get("namespace", ""),
            "timestamp": entry.get(
                "timestamp",
                datetime.utcnow().isoformat(),
            ),
        }

    # Raw text log (or JSON that is not an object)
    return {
        "type": "log",
        "level": "INFO",
        "message": line,
        "namespace": "",
        "timestamp": datetime.utcnow().isoformat(),
    }


@router.websocket("/logs/{session_id}")
async def logs_websocket(websocket: WebSocket, session_id: str):
    """
    WebSocket endpoint for real-time log streaming.

    Streams log entries from the logs directory: every 0.5 seconds the most
    recently modified ``*.jsonl`` file is checked and any new complete lines
    are sent. ``session_id`` is part of the route but is not used to filter
    entries.

    Message format:
    {
        "type": "log",
        "level": "INFO" | "WARNING" | "ERROR" | "DEBUG",
        "message": str,
        "namespace": str,
        "timestamp": str
    }
    """
    await websocket.accept()

    logs_dir = PROJECT_ROOT / "logs"
    last_position = 0
    current_log_file = None

    try:
        while True:
            try:
                newest_log = _newest_log_file(logs_dir)

                if newest_log is not None:
                    # Check if we switched to a new log file
                    if current_log_file != newest_log:
                        current_log_file = newest_log
                        last_position = 0

                    # Only file access is guarded here, so a failing send is
                    # not misreported as a log-reading error.
                    try:
                        new_lines, last_position = _read_new_log_lines(
                            current_log_file, last_position
                        )
                    except OSError as e:
                        new_lines = []
                        await websocket.send_json(
                            {
                                "type": "error",
                                "message": f"Error reading log file: {str(e)}",
                                "timestamp": datetime.utcnow().isoformat(),
                            }
                        )

                    for line in new_lines:
                        await websocket.send_json(_log_line_to_message(line))

                # Wait before checking for more logs
                await asyncio.sleep(0.5)

            except asyncio.CancelledError:
                # Handler task was cancelled; stop streaming.
                break

    except WebSocketDisconnect:
        pass


================================================
FILE: new_ui/backend/api/websockets/workflow_ws.py
================================================
"""
Workflow WebSocket Handler
Provides real-time progress updates for running workflows
"""

import asyncio
from datetime import datetime
from fastapi import APIRouter, WebSocket, WebSocketDisconnect

from services.workflow_service import workflow_service


# Router on which this module's workflow WebSocket endpoint is registered.
router = APIRouter()


class ConnectionManager:
    """Manages WebSocket connections for workflow updates.

    Connections are grouped per task ID in ``active_connections``; a task's
    entry is removed as soon as its last connection is dropped.
    """

    def __init__(self):
        # task_id -> sockets currently registered for that task
        self.active_connections: dict[str, list[WebSocket]] = {}

    async def connect(self, websocket: WebSocket, task_id: str):
        """Accept ``websocket`` and register it under ``task_id``."""
        await websocket.accept()
        self.active_connections.setdefault(task_id, []).append(websocket)

    def disconnect(self, websocket: WebSocket, task_id: str):
        """Unregister ``websocket`` from ``task_id``; unknown pairs are ignored."""
        connections = self.active_connections.get(task_id)
        if connections is None:
            return
        if websocket in connections:
            connections.remove(websocket)
        if not connections:
            del self.active_connections[task_id]

    async def broadcast(self, task_id: str, message: dict):
        """Send ``message`` as JSON to every socket registered for ``task_id``.

        Delivery is best-effort: a failing socket does not stop the others.
        """
        # Iterate over a snapshot: disconnect() may run while we are awaiting
        # a send, and mutating the live list mid-iteration would skip sockets.
        for connection in list(self.active_connections.get(task_id, ())):
            try:
                await connection.send_json(message)
            except Exception:
                # Deliberately ignored; the socket's own handler is
                # responsible for unregistering it.
                pass


# Module-level manager instance used by the workflow WebSocket endpoint.
manager = ConnectionManager()


@router.websocket("/workflow/{task_id}")
async def workflow_websocket(websocket: WebSocket, task_id: str):
    """
    WebSocket endpoint for real-time workflow progress updates.

    Connect to receive:
    - progress: Workflow step progress updates
    - complete: Workflow completion notification
    - error: Error notifications

    On connect the current task status is sent first, followed by any
    pending interaction. A task that is already completed, failed or
    cancelled gets its final message (if any) and the socket is closed.
    Otherwise queued messages are forwarded, with a heartbeat whenever no
    message arrives for 60 seconds.

    Message format:
    {
        "type": "progress" | "complete" | "error",
        "task_id": str,
        "progress": int,  # 0-100
        "message": str,
        "timestamp": str,
        "result": dict | null,  # Only for complete type
        "error": str | null  # Only for error type
    }
    """
    await manager.connect(websocket, task_id)
    print(f"[WorkflowWS] Connected: task={task_id[:8]}...")

    queue = None
    # Everything after registration runs inside try/finally so that the
    # manager entry and the subscription are released on every exit path,
    # including "task not found" and a disconnect during the initial sends.
    try:
        # Subscribe to get our own queue for this task
        queue = workflow_service.subscribe(task_id)
        task = workflow_service.get_task(task_id)
        print(
            f"[WorkflowWS] Subscribed: task={task_id[:8]}... queue={queue is not None} task={task is not None}"
        )

        if not task:
            await websocket.send_json(
                {
                    "type": "error",
                    "task_id": task_id,
                    "error": "Task not found",
                    "timestamp": datetime.utcnow().isoformat(),
                }
            )
            await websocket.close()
            return

        # Send current status
        await websocket.send_json(
            {
                "type": "status",
                "task_id": task_id,
                "status": task.status,
                "progress": task.progress,
                "message": task.message,
                "timestamp": datetime.utcnow().isoformat(),
            }
        )

        # Send pending interaction if any (fixes race condition where interaction_required
        # was broadcast before WebSocket connected)
        if task.pending_interaction:
            print(
                f"[WorkflowWS] Sending missed pending interaction: task={task_id[:8]}..."
            )
            await websocket.send_json(
                {
                    "type": "interaction_required",
                    "task_id": task_id,
                    "interaction_type": task.pending_interaction.get("type"),
                    "title": task.pending_interaction.get("title"),
                    "description": task.pending_interaction.get("description"),
                    "data": task.pending_interaction.get("data"),
                    "options": task.pending_interaction.get("options"),
                    "required": task.pending_interaction.get("required"),
                    "timestamp": datetime.utcnow().isoformat(),
                }
            )

        # If task is already completed, send final status and close
        if task.status in ("completed", "error", "cancelled"):
            if task.status == "completed":
                await websocket.send_json(
                    {
                        "type": "complete",
                        "task_id": task_id,
                        "result": task.result,
                        "timestamp": datetime.utcnow().isoformat(),
                    }
                )
            elif task.status == "error":
                await websocket.send_json(
                    {
                        "type": "error",
                        "task_id": task_id,
                        "error": task.error,
                        "timestamp": datetime.utcnow().isoformat(),
                    }
                )
            # Close WebSocket (don't cleanup immediately - keep task for status queries)
            await websocket.close()
            return

        # Stream progress updates
        if queue:
            while True:
                try:
                    # Wait for progress update with timeout
                    message = await asyncio.wait_for(queue.get(), timeout=60.0)
                except asyncio.TimeoutError:
                    # Send heartbeat
                    await websocket.send_json(
                        {
                            "type": "heartbeat",
                            "task_id": task_id,
                            "timestamp": datetime.utcnow().isoformat(),
                        }
                    )
                    continue

                msg_type = message.get("type")
                print(f"[WorkflowWS] Sending: task={task_id[:8]}... type={msg_type}")
                await websocket.send_json(message)

                # Check if workflow is complete
                if msg_type in ("complete", "error"):
                    print(
                        f"[WorkflowWS] Workflow finished: task={task_id[:8]}... type={msg_type}"
                    )
                    # Wait a bit before closing to ensure frontend processes the message
                    await asyncio.sleep(0.5)
                    await websocket.close()
                    break

    except WebSocketDisconnect:
        pass
    finally:
        manager.disconnect(websocket, task_id)
        # Unsubscribe from task updates
        if queue:
            workflow_service.unsubscribe(task_id, queue)


================================================
FILE: new_ui/backend/app_utils/__init__.py
================================================
"""Utils package"""


================================================
FILE: new_ui/backend/main.py
================================================
"""
DeepCode New UI - FastAPI Backend Entry Point

Supports two modes:
  - Development: Frontend runs on Vite dev server (port 5173), proxied to backend
  - Production/Docker: FastAPI serves the frontend static build directly
"""

import os
import sys
from pathlib import Path

# ============================================================
# Path Setup - Critical for avoiding module naming conflicts
# ============================================================
# Directory layout:
#   PROJECT_ROOT/              <- DeepCode root (config/, utils/, workflows/, prompts/, tools/)
#   PROJECT_ROOT/new_ui/
#   PROJECT_ROOT/new_ui/backend/  <- This file's directory (api/, models/, services/, settings.py)
#
# IMPORTANT: Backend modules (settings, models, services, api) must NOT shadow
# DeepCode modules (config, utils, workflows, prompts, tools).
# We renamed: config.py -> settings.py, utils/ -> app_utils/
# ============================================================

# Absolute locations derived from this file's own path, so they do not depend
# on the current working directory of the process.
BACKEND_DIR = Path(__file__).resolve().parent
NEW_UI_DIR = BACKEND_DIR.parent
PROJECT_ROOT = NEW_UI_DIR.parent

# PROJECT_ROOT must be first so DeepCode modules (config, utils, etc.) are found correctly
# BACKEND_DIR must also be present so local modules (settings, api, models, services) are found
# Since there are no naming conflicts after renaming, order is safe
# NOTE: each entry is only inserted when it is not already on sys.path; an
# entry that is already present keeps its existing position.
if str(PROJECT_ROOT) not in sys.path:
    sys.path.insert(0, str(PROJECT_ROOT))
if str(BACKEND_DIR) not in sys.path:
    sys.path.insert(1, str(BACKEND_DIR))

from contextlib import asynccontextmanager
from fastapi import FastAPI, Request
from fastapi.middleware.cors import CORSMiddleware
from fastapi.staticfiles import StaticFiles
from fastapi.responses import FileResponse

from settings import settings
from api.routes import workflows, requirements, config as config_routes, files
from api.websockets import workflow_ws, code_stream_ws, logs_ws

# Check if running in Docker/production mode
# The environment variable is read once, at import time, and must equal the
# exact string "docker"; any other value (or no value) means development mode.
IS_DOCKER = os.environ.get("DEEPCODE_ENV") == "docker"
# Directory expected to hold the built frontend (index.html plus assets/).
FRONTEND_DIST = NEW_UI_DIR / "frontend" / "dist"


@asynccontextmanager
async def lifespan(app: FastAPI):
    """Run startup and shutdown work around the application's lifetime.

    Before yielding, prints a startup banner (paths, run mode and, in Docker
    mode, the state of the frontend build) and makes sure the upload directory
    exists. After the yield, prints a shutdown notice. The ``app`` argument is
    accepted but not used.
    """
    mode_label = "Docker/Production" if IS_DOCKER else "Development"
    banner = (
        "Starting DeepCode New UI Backend...",
        f"  Project root: {PROJECT_ROOT}",
        f"  Backend dir:  {BACKEND_DIR}",
        f"  Mode:         {mode_label}",
    )
    for line in banner:
        print(line)

    # The frontend build is only relevant (and only probed) in Docker mode.
    if IS_DOCKER:
        if FRONTEND_DIST.exists():
            print(f"  Frontend:     Serving static files from {FRONTEND_DIST}")
        else:
            print(f"  ⚠️  Frontend dist not found at {FRONTEND_DIST}")

    # Create the upload directory (and any missing parents) up front.
    Path(settings.upload_dir).mkdir(parents=True, exist_ok=True)

    yield

    print("Shutting down DeepCode New UI Backend...")


# The ASGI application object; uvicorn loads it through the "main:app" import
# string. Startup/shutdown work is delegated to the lifespan context manager.
app = FastAPI(
    title="DeepCode New UI API",
    description="Modern API backend for DeepCode - AI-powered code generation platform",
    version="1.0.0",
    lifespan=lifespan,
)

# CORS middleware
# Allowed origins come from settings.cors_origins; every method and header is
# permitted and credentials are allowed for those origins.
app.add_middleware(
    CORSMiddleware,
    allow_origins=settings.cors_origins,
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)

# Include REST API routes
# All REST routers are mounted under the versioned /api/v1 prefix.
app.include_router(workflows.router, prefix="/api/v1/workflows", tags=["Workflows"])
app.include_router(
    requirements.router, prefix="/api/v1/requirements", tags=["Requirements"]
)
app.include_router(
    config_routes.router, prefix="/api/v1/config", tags=["Configuration"]
)
app.include_router(files.router, prefix="/api/v1/files", tags=["Files"])

# Include WebSocket routes
# The three WebSocket routers share the /ws prefix.
app.include_router(workflow_ws.router, prefix="/ws", tags=["WebSocket"])
app.include_router(code_stream_ws.router, prefix="/ws", tags=["WebSocket"])
app.include_router(logs_ws.router, prefix="/ws", tags=["WebSocket"])


# ============================================================
# Static file serving for Docker/production mode
# In development, Vite dev server handles this via proxy
# ============================================================
if IS_DOCKER and FRONTEND_DIST.exists():
    # Serve static assets (JS, CSS, images, etc.)
    app.mount(
        "/assets",
        StaticFiles(directory=str(FRONTEND_DIST / "assets")),
        name="static-assets",
    )

    @app.get("/health")
    async def health_check():
        """Health check endpoint"""
        return {"status": "healthy"}

    # Catch-all: serve index.html for SPA client-side routing
    # This must be registered AFTER all API/WS routes
    @app.get("/{full_path:path}")
    async def serve_spa(request: Request, full_path: str):
        """Serve a file from the frontend build, falling back to index.html.

        ``full_path`` is taken verbatim from the request URL and is therefore
        untrusted. It is only honoured when, after resolution, it names a
        regular file located inside ``FRONTEND_DIST``; every other request
        (unknown path, directory, traversal attempt) receives ``index.html``
        so that client-side routing keeps working.
        """
        static_file = None
        if full_path:
            try:
                dist_root = FRONTEND_DIST.resolve()
                # Joining an absolute segment ("/etc/passwd") discards the
                # left-hand side, and ".." segments climb out of the build
                # directory, so resolve first and then verify containment.
                resolved = (dist_root / full_path).resolve()
                if dist_root in resolved.parents and resolved.is_file():
                    static_file = resolved
            except (OSError, ValueError):
                # Unresolvable paths (e.g. embedded NUL bytes, symlink loops)
                # are treated like any other unknown route.
                static_file = None

        if static_file is not None:
            return FileResponse(static_file)
        # Otherwise return index.html (SPA routing)
        return FileResponse(FRONTEND_DIST / "index.html")
else:
    # Development mode endpoints
    @app.get("/")
    async def root():
        """Root endpoint (dev mode)"""
        return {
            "name": "DeepCode New UI API",
            "version": "1.0.0",
            "status": "running",
            "mode": "development",
        }

    @app.get("/health")
    async def health_check_dev():
        """Health check endpoint"""
        return {"status": "healthy"}


# Direct execution (``python main.py``): start the server in-process.
if __name__ == "__main__":
    import uvicorn

    # The app is passed as an import string ("module:attribute") rather than
    # as an object; host, port and auto-reload are taken from settings, with
    # reload following the ``debug`` flag.
    uvicorn.run(
        "main:app",
        host=settings.host,
        port=settings.port,
        reload=settings.debug,
    )


================================================
FILE: new_ui/backend/models/__init__.py
================================================
"""Models package"""

from .requests import (
    PaperToCodeRequest,
    ChatPlanningRequest,
    GenerateQuestionsRequest,
    SummarizeRequirementsRequest,
    ModifyRequirementsRequest,
    LLMProviderUpdateRequest,
    FileUploadResponse,
    InteractionResponseRequest,
)
from .responses import (
    TaskResponse,
    WorkflowStatusResponse,
    QuestionsResponse,
    RequirementsSummaryResponse,
    ConfigResponse,
    SettingsResponse,
    ErrorResponse,
)

__all__ = [
    # Requests
    "PaperToCodeRequest",
    "ChatPlanningRequest",
    "GenerateQuestionsRequest",
    "SummarizeRequirementsRequest",
    "ModifyRequirementsRequest",
    "LLMProviderUpdateRequest",
    "FileUploadResponse",
    "InteractionResponseRequest",
    # Responses
    "TaskResponse",
    "WorkflowStatusResponse",
    "QuestionsResponse",
    "RequirementsSummaryResponse",
    "ConfigResponse",
    "SettingsResponse",
    "ErrorResponse",
]


================================================
FILE: new_ui/backend/models/requests.py
================================================
"""Request models for API endpoints"""

from typing import Dict, Any
from pydantic import BaseModel, Field


class PaperToCodeRequest(BaseModel):
    """Request model for paper-to-code workflow"""

    # Required. Declared as a plain ``str``: this model does not itself check
    # that the value is an existing path or a well-formed URL.
    input_source: str = Field(..., description="Path to paper file or URL")
    # Required. Also a plain ``str``, so values other than the "file"/"url"
    # named in the description are not rejected by this model.
    input_type: str = Field(..., description="Type of input: file, url")
    # Optional flag; False when omitted.
    enable_indexing: bool = Field(default=False, description="Enable code indexing")


class ChatPlanningRequest(BaseModel):
    """Request model for chat-based planning workflow"""

    # Required free-form text; no length or content constraints are declared.
    requirements: str = Field(..., description="User requirements text")
    # Optional flag; False when omitted.
    enable_indexing: bool = Field(default=False, description="Enable code indexing")


class GenerateQuestionsRequest(BaseModel):
    """Request model for generating guiding questions"""

    # Required free-form text; the only field of this request.
    initial_requirement: str = Field(..., description="Initial requirement text")


class SummarizeRequirementsRequest(BaseModel):
    """Request model for summarizing requirements"""

    # Required free-form text.
    initial_requirement: str = Field(..., description="Initial requirement text")
    # Optional string-to-string mapping; a fresh empty dict is created for
    # each instance when the field is omitted.
    # NOTE(review): the meaning of the keys (question id vs. question text)
    # is not visible here - confirm against the caller.
    user_answers: Dict[str, str] = Field(
        default_factory=dict, description="User answers to guiding questions"
    )


class ModifyRequirementsRequest(BaseModel):
    """Request model for modifying requirements"""

    # Both fields are required free-form text.
    current_requirements: str = Field(..., description="Current requirements document")
    modification_feedback: str = Field(..., description="User's modification feedback")


class LLMProviderUpdateRequest(BaseModel):
    """Request model for updating LLM provider"""

    # Required. Typed as a plain ``str``, so the provider names listed in the
    # description are documentation only and are not enforced by this model.
    provider: str = Field(
        ..., description="LLM provider name: google, anthropic, openai"
    )


class FileUploadResponse(BaseModel):
    """Response model for file upload"""

    # All four fields are required (no defaults are declared).
    # Despite living in the requests module, this is a response payload.
    file_id: str
    filename: str
    path: str
    # NOTE(review): presumably the size in bytes - confirm against the
    # upload route that fills it in.
    size: int


class InteractionResponseRequest(BaseModel):
    """Request model for responding to user-in-loop interactions"""

    # Required. Plain ``str``: the action names in the description are not
    # enforced by this model.
    action: str = Field(
        ..., description="User action: submit, confirm, modify, skip, cancel"
    )
    # Optional free-form payload; a fresh empty dict per instance when omitted.
    data: Dict[str, Any] = Field(
        default_factory=dict,
        description="Response data (e.g., answers to questions, modification feedback)",
    )
    # Optional flag; False when omitted. It is independent of ``action`` as
    # far as this model is concerned (no cross-field validation is declared).
    skipped: bool = Field(default=False, description="Whether user chose to skip")


================================================
FILE: new_ui/backend/models/responses.py
================================================
"""Response models for API endpoints"""

from typing import Optional, Dict, Any, List
from datetime import datetime
from pydantic import BaseModel, Field


class TaskResponse(BaseModel):
    """Response model for task creation"""

    # Required identifier of the created task.
    task_id: str
    # Defaults describe the "just created" case and may be overridden.
    status: str = "created"
    message: str = "Task created successfully"
    # Filled with a naive UTC timestamp (datetime.utcnow) at the moment the
    # response object is instantiated, unless a value is passed explicitly.
    created_at: datetime = Field(default_factory=datetime.utcnow)


class WorkflowStatusResponse(BaseModel):
    """Response model for workflow status"""

    # Required fields.
    task_id: str
    status: str
    # Optional fields; defaults represent "nothing reported yet".
    # NOTE(review): progress looks like a 0-100 percentage, but no range is
    # enforced here - confirm against the producer.
    progress: int = 0
    message: str = ""
    result: Optional[Dict[str, Any]] = None
    error: Optional[str] = None
    started_at: Optional[datetime] = None
    completed_at: Optional[datetime] = None


class QuestionsResponse(BaseModel):
    """Response model for generated questions"""

    # Required list of free-form dicts; the per-question schema is not
    # constrained by this model.
    questions: List[Dict[str, Any]]
    status: str = "success"


class RequirementsSummaryResponse(BaseModel):
    """Response model for requirements summary"""

    # Required summary text.
    summary: str
    status: str = "success"


class ConfigResponse(BaseModel):
    """Response model for configuration"""

    # All fields are required (no defaults are declared).
    llm_provider: str
    available_providers: List[str]
    # String-to-string mapping.
    # NOTE(review): presumably role name -> model name; confirm against the
    # config route that builds it.
    models: Dict[str, str]
    indexing_enabled: bool


class SettingsResponse(BaseModel):
    """Response model for settings"""

    # All fields are required (no defaults are declared).
    llm_provider: str
    models: Dict[str, str]
    indexing_enabled: bool
    # Free-form mapping; its structure is not defined by this model.
    document_segmentation: Dict[str, Any]


class ErrorResponse(BaseModel):
    """Response model for errors"""

    # Required short error message.
    error: str
    # Optional extras; both default to None when not supplied.
    detail: Optional[str] = None
    code: Optional[str] = None


================================================
FILE: new_ui/backend/services/__init__.py
================================================
"""Services package"""


================================================
FILE: new_ui/backend/services/requirement_service.py
================================================
"""
Requirement Analysis Service
Integration with existing requirement analysis workflow

NOTE: This module uses lazy imports for DeepCode modules.
sys.path is configured in main.py at startup.
"""

import json
from typing import Dict, Any


class RequirementService:
    """Service for requirement analysis operations.

    Every public coroutine returns a plain dict and does not raise: failures
    (including import errors of the lazily imported DeepCode modules) are
    reported as ``{"status": "error", "error": <message>}``.
    """

    async def generate_questions(self, initial_requirement: str) -> Dict[str, Any]:
        """Generate guiding questions based on initial requirements.

        Args:
            initial_requirement: Free-form requirement text from the user.

        Returns:
            ``{"status": "success", "questions": <parsed JSON>}`` when the
            workflow reports success, otherwise an error dict.
        """
        try:
            # Lazy import - DeepCode module found via sys.path set in main.py
            from workflows.agent_orchestration_engine import (
                execute_requirement_analysis_workflow,
            )

            result = await execute_requirement_analysis_workflow(
                user_input=initial_requirement,
                analysis_mode="generate_questions",
                user_answers=None,
                logger=None,
                progress_callback=None,
            )

            if result.get("status") != "success":
                return {
                    "status": "error",
                    "error": result.get("error", "Failed to generate questions"),
                }

            # The workflow hands the questions back as a JSON string.
            return {
                "status": "success",
                "questions": json.loads(result.get("result", "[]")),
            }

        except Exception as e:
            return {
                "status": "error",
                "error": str(e),
            }

    async def summarize_requirements(
        self,
        initial_requirement: str,
        user_answers: Dict[str, str],
    ) -> Dict[str, Any]:
        """Summarize requirements based on initial input and user answers.

        Args:
            initial_requirement: Free-form requirement text from the user.
            user_answers: Answers collected for the guiding questions.

        Returns:
            ``{"status": "success", "summary": <text>}`` when the workflow
            reports success, otherwise an error dict.
        """
        try:
            # Lazy import - DeepCode module found via sys.path set in main.py
            from workflows.agent_orchestration_engine import (
                execute_requirement_analysis_workflow,
            )

            result = await execute_requirement_analysis_workflow(
                user_input=initial_requirement,
                analysis_mode="summarize_requirements",
                user_answers=user_answers,
                logger=None,
                progress_callback=None,
            )

            if result.get("status") != "success":
                return {
                    "status": "error",
                    "error": result.get("error", "Failed to summarize requirements"),
                }

            return {
                "status": "success",
                "summary": result.get("result", ""),
            }

        except Exception as e:
            return {
                "status": "error",
                "error": str(e),
            }

    async def modify_requirements(
        self,
        current_requirements: str,
        modification_feedback: str,
    ) -> Dict[str, Any]:
        """Modify requirements based on user feedback.

        Args:
            current_requirements: The requirements document to revise.
            modification_feedback: The user's requested changes.

        Returns:
            ``{"status": "success", "summary": <agent result>}`` on success,
            otherwise an error dict.
        """
        try:
            # Lazy import - DeepCode module found via sys.path set in main.py
            from workflows.agents.requirement_analysis_agent import (
                RequirementAnalysisAgent,
            )

            agent = RequirementAnalysisAgent()
            await agent.initialize()

            try:
                result = await agent.modify_requirements(
                    current_requirements=current_requirements,
                    modification_feedback=modification_feedback,
                )
            finally:
                # Release the initialized agent even when the call above
                # fails; otherwise a failing request would leak it.
                await agent.cleanup()

            return {
                "status": "success",
                "summary": result,
            }

        except Exception as e:
            return {
                "status": "error",
                "error": str(e),
            }


# Global service instance
requirement_service = RequirementService()


================================================
FILE: new_ui/backend/services/session_service.py
================================================
"""
Session Service
Manages user sessions and conversation history
"""

import uuid
from datetime import datetime, timedelta
from typing import Optional, Dict, Any, List
from dataclasses import dataclass, field


@dataclass
class Session:
    """Represents a user session.

    Both timestamps are naive UTC datetimes produced by ``datetime.utcnow``.
    """

    session_id: str
    created_at: datetime = field(default_factory=datetime.utcnow)
    # Refreshed by SessionService.get_session on every successful lookup and
    # compared against the service timeout to decide expiry.
    last_activity: datetime = field(default_factory=datetime.utcnow)
    # Entries are dicts with "role", "content", "timestamp" and "metadata".
    conversation_history: List[Dict[str, Any]] = field(default_factory=list)
    active_tasks: List[str] = field(default_factory=list)
    preferences: Dict[str, Any] = field(default_factory=dict)


class SessionService:
    """Service for managing user sessions.

    Sessions live in an in-process dict keyed by session id. A session expires
    once it has been idle for longer than the configured timeout; expiry is
    enforced lazily on lookup and in bulk by ``cleanup_expired_sessions``.
    """

    def __init__(self, timeout_minutes: int = 60):
        """Create an empty registry with the given idle timeout in minutes."""
        self._sessions: Dict[str, Session] = {}
        self._timeout = timedelta(minutes=timeout_minutes)

    def create_session(self) -> Session:
        """Create, register and return a new session with a random UUID id."""
        session = Session(session_id=str(uuid.uuid4()))
        self._sessions[session.session_id] = session
        return session

    def get_session(self, session_id: str) -> Optional[Session]:
        """Return the live session for ``session_id`` or ``None``.

        An expired session is deleted and reported as ``None``; a live one has
        its ``last_activity`` refreshed before being returned.
        """
        session = self._sessions.get(session_id)
        if session is None:
            return None

        now = datetime.utcnow()
        if now - session.last_activity > self._timeout:
            self.delete_session(session_id)
            return None

        session.last_activity = now
        return session

    def delete_session(self, session_id: str):
        """Delete a session; unknown ids are ignored."""
        self._sessions.pop(session_id, None)

    def add_to_history(
        self,
        session_id: str,
        role: str,
        content: str,
        metadata: Optional[Dict[str, Any]] = None,
    ):
        """Append a message to the session's history; no-op if it is missing."""
        session = self.get_session(session_id)
        if session is None:
            return
        session.conversation_history.append(
            {
                "role": role,
                "content": content,
                "timestamp": datetime.utcnow().isoformat(),
                "metadata": metadata or {},
            }
        )

    def get_history(self, session_id: str, limit: int = 50) -> List[Dict[str, Any]]:
        """Return up to ``limit`` most recent history entries, oldest first.

        Returns an empty list for an unknown/expired session and for a
        non-positive ``limit``.
        """
        # Look the session up first so the activity refresh / expiry side
        # effects happen regardless of ``limit``.
        session = self.get_session(session_id)
        if session is None or limit <= 0:
            # ``history[-0:]`` would be the whole list and a negative limit
            # would slice from the front, so handle both explicitly.
            return []
        return session.conversation_history[-limit:]

    def add_active_task(self, session_id: str, task_id: str):
        """Record ``task_id`` as active for the session (no duplicates)."""
        session = self.get_session(session_id)
        if session is not None and task_id not in session.active_tasks:
            session.active_tasks.append(task_id)

    def remove_active_task(self, session_id: str, task_id: str):
        """Remove ``task_id`` from the session's active tasks if present."""
        session = self.get_session(session_id)
        if session is not None and task_id in session.active_tasks:
            session.active_tasks.remove(task_id)

    def update_preferences(self, session_id: str, preferences: Dict[str, Any]):
        """Merge ``preferences`` into the session's stored preferences."""
        session = self.get_session(session_id)
        if session is not None:
            session.preferences.update(preferences)

    def cleanup_expired_sessions(self):
        """Remove all sessions idle for longer than the timeout."""
        now = datetime.utcnow()
        # Collect ids first: the dict must not change size while iterated.
        expired = [
            sid
            for sid, session in self._sessions.items()
            if now - session.last_activity > self._timeout
        ]
        for sid in expired:
            del self._sessions[sid]


# Global service instance
session_service = SessionService()


================================================
FILE: new_ui/backend/services/workflow_service.py
================================================
"""
Workflow Service - Integration with existing DeepCode workflows

NOTE: This module uses lazy imports for DeepCode modules (workflows, mcp_agent).
sys.path is configured in main.py at startup. Background tasks share the same
sys.path, so DeepCode modules will be found correctly as long as there are
no naming conflicts (config.py -> settings.py, utils/ -> app_utils/).
"""

import asyncio
import uuid
import os
from datetime import datetime
from typing import Optional, Dict, Any, Callable, List
from dataclasses import dataclass, field

from settings import CONFIG_PATH, PROJECT_ROOT


@dataclass
class WorkflowTask:
    """Represents a running workflow task"""

    task_id: str
    # pending | running | waiting_for_input | completed | error | cancelled
    status: str = "pending"
    progress: int = 0
    message: str = ""
    result: Optional[Dict[str, Any]] = None
    error: Optional[str] = None
    started_at: Optional[datetime] = None
    completed_at: Optional[datetime] = None
    # Set by WorkflowService.cancel_task.
    cancel_event: asyncio.Event = field(default_factory=asyncio.Event)
    # User-in-Loop support: current interaction request waiting for the user
    pending_interaction: Optional[Dict[str, Any]] = None


class WorkflowService:
    """Service for managing workflow execution.

    Keeps an in-memory registry of tasks and, per task, a list of subscriber
    queues to which progress / completion / error messages are broadcast.
    """

    def __init__(self):
        self._tasks: Dict[str, WorkflowTask] = {}
        # Each task can have multiple subscriber queues
        self._subscribers: Dict[str, List[asyncio.Queue]] = {}
        # User-in-Loop plugin integration (lazy loaded)
        self._plugin_integration = None
        self._plugin_enabled = True  # Can be disabled via config
        # Strong references to in-flight fire-and-forget broadcast tasks. The
        # event loop only keeps weak references, so an unreferenced task may
        # be garbage-collected before it has run.
        self._background_tasks = set()

    def _get_plugin_integration(self):
        """Lazy load the plugin integration system.

        Returns ``None`` when the plugin package cannot be imported; in that
        case plugins are disabled so the import is not retried.
        """
        if self._plugin_integration is None and self._plugin_enabled:
            try:
                from workflows.plugins.integration import WorkflowPluginIntegration

                self._plugin_integration = WorkflowPluginIntegration(self)
                print("[WorkflowService] Plugin integration initialized")
            except ImportError as e:
                print(f"[WorkflowService] Plugin system not available: {e}")
                self._plugin_enabled = False
        return self._plugin_integration

    def create_task(self) -> WorkflowTask:
        """Create and register a new task with an empty subscriber list."""
        task_id = str(uuid.uuid4())
        task = WorkflowTask(task_id=task_id)
        self._tasks[task_id] = task
        self._subscribers[task_id] = []
        return task

    def get_task(self, task_id: str) -> Optional[WorkflowTask]:
        """Get task by ID"""
        return self._tasks.get(task_id)

    def subscribe(self, task_id: str) -> Optional[asyncio.Queue]:
        """Subscribe to a task's progress updates.

        Returns a new queue dedicated to this subscriber, or ``None`` when the
        task is unknown.
        """
        if task_id not in self._subscribers:
            print(f"[Subscribe] Failed: task={task_id[:8]}... not found in subscribers")
            return None
        queue = asyncio.Queue()
        self._subscribers[task_id].append(queue)
        print(
            f"[Subscribe] Success: task={task_id[:8]}... total_subscribers={len(self._subscribers[task_id])}"
        )
        return queue

    def unsubscribe(self, task_id: str, queue: asyncio.Queue):
        """Unsubscribe from a task's progress updates."""
        if task_id in self._subscribers and queue in self._subscribers[task_id]:
            self._subscribers[task_id].remove(queue)
            print(
                f"[Unsubscribe] task={task_id[:8]}... remaining={len(self._subscribers[task_id])}"
            )

    async def _broadcast(self, task_id: str, message: Dict[str, Any]):
        """Broadcast a message to all subscribers of a task."""
        if task_id in self._subscribers:
            subscriber_count = len(self._subscribers[task_id])
            print(
                f"[Broadcast] task={task_id[:8]}... type={message.get('type')} subscribers={subscriber_count}"
            )
            for queue in self._subscribers[task_id]:
                try:
                    await queue.put(message)
                except Exception as e:
                    print(f"[Broadcast] Failed to send to queue: {e}")
        else:
            print(
                f"[Broadcast] No subscribers for task={task_id[:8]}... type={message.get('type')}"
            )

    def get_progress_queue(self, task_id: str) -> Optional[asyncio.Queue]:
        """Get progress queue for a task (deprecated, use subscribe instead)"""
        # For backwards compatibility, create a subscriber queue
        return self.subscribe(task_id)

    async def _create_progress_callback(
        self, task_id: str
    ) -> Callable[[int, str], None]:
        """Create a progress callback that broadcasts to all subscribers.

        The returned callback is synchronous: it updates the task record (when
        the task exists) and schedules the broadcast on the running event
        loop, so it must be invoked from within that loop.
        """
        task = self._tasks.get(task_id)

        def callback(progress: int, message: str):
            if task:
                task.progress = progress
                task.message = message

            # Broadcast to all subscribers
            pending = asyncio.create_task(
                self._broadcast(
                    task_id,
                    {
                        "type": "progress",
                        "task_id": task_id,
                        "progress": progress,
                        "message": message,
                        "timestamp": datetime.utcnow().isoformat(),
                    },
                )
            )
            # Keep the task alive until it finishes, then drop the reference.
            self._background_tasks.add(pending)
            pending.add_done_callback(self._background_tasks.discard)

        return callback

    async def _finish_success(
        self, task: WorkflowTask, task_id: str, repo_result: Any
    ) -> Dict[str, Any]:
        """Record a successful run, notify subscribers and return the result."""
        task.status = "completed"
        task.progress = 100
        task.result = {
            "status": "success",
            "repo_result": repo_result,
        }
        task.completed_at = datetime.utcnow()

        # Broadcast completion signal to all subscribers
        await self._broadcast(
            task_id,
            {
                "type": "complete",
                "task_id": task_id,
                "status": "success",
                "result": task.result,
            },
        )
        # Give WebSocket handlers time to receive the completion message
        await asyncio.sleep(0.5)

        return task.result

    async def _finish_error(
        self, task: WorkflowTask, task_id: str, exc: Exception
    ) -> Dict[str, Any]:
        """Record a failed run, notify subscribers and return an error dict."""
        task.status = "error"
        task.error = str(exc)
        task.completed_at = datetime.utcnow()

        # Broadcast error signal to all subscribers
        await self._broadcast(
            task_id,
            {
                "type": "error",
                "task_id": task_id,
                "error": str(exc),
            },
        )

        return {"status": "error", "error": str(exc)}

    async def execute_paper_to_code(
        self,
        task_id: str,
        input_source: str,
        input_type: str,
        enable_indexing: bool = False,
    ) -> Dict[str, Any]:
        """Execute paper-to-code workflow.

        Args:
            task_id: Id of a task previously created with ``create_task``.
            input_source: Paper path or URL handed to the research pipeline.
            input_type: Accepted for interface compatibility; not used here.
            enable_indexing: Forwarded to the pipeline.

        Returns:
            The task result dict on success, or ``{"status": "error", ...}``.
            Failures are also recorded on the task and broadcast.
        """
        task = self._tasks.get(task_id)
        if not task:
            return {"status": "error", "error": "Task not found"}

        task.status = "running"
        task.started_at = datetime.utcnow()

        # Bound before the try block so the finally clause is always safe.
        original_cwd = None
        try:
            # Lazy imports - DeepCode modules found via sys.path set in main.py
            # Done inside the try so an import failure is reported to
            # subscribers instead of leaving the task stuck.
            from mcp_agent.app import MCPApp
            from workflows.agent_orchestration_engine import (
                execute_multi_agent_research_pipeline,
            )

            progress_callback = await self._create_progress_callback(task_id)

            # Change to project root directory for MCP server paths to work correctly
            original_cwd = os.getcwd()
            os.chdir(PROJECT_ROOT)

            # Create MCP app context with explicit config path
            app = MCPApp(name="paper_to_code", settings=str(CONFIG_PATH))

            async with app.run() as agent_app:
                logger = agent_app.logger
                context = agent_app.context

                # Add current working directory to filesystem server args
                context.config.mcp.servers["filesystem"].args.extend([os.getcwd()])

                # Execute the pipeline
                result = await execute_multi_agent_research_pipeline(
                    input_source,
                    logger,
                    progress_callback,
                    enable_indexing=enable_indexing,
                )

                return await self._finish_success(task, task_id, result)

        except Exception as e:
            return await self._finish_error(task, task_id, e)

        finally:
            # Restore original working directory (only if it was changed)
            if original_cwd is not None:
                os.chdir(original_cwd)

    async def execute_chat_planning(
        self,
        task_id: str,
        requirements: str,
        enable_indexing: bool = False,
        enable_user_interaction: bool = True,  # Enable User-in-Loop by default
    ) -> Dict[str, Any]:
        """Execute chat-based planning workflow.

        Args:
            task_id: Id of a task previously created with ``create_task``.
            requirements: User requirement text.
            enable_indexing: Forwarded to the pipeline and plugin context.
            enable_user_interaction: When true and the plugin system is
                available, the BEFORE_PLANNING hook runs first and may
                replace the requirements or cancel the workflow.

        Returns:
            The task result dict on success, ``{"status": "cancelled", ...}``
            when a plugin cancels, or ``{"status": "error", ...}``.
        """
        task = self._tasks.get(task_id)
        if not task:
            return {"status": "error", "error": "Task not found"}

        task.status = "running"
        task.started_at = datetime.utcnow()

        # Bound before the try block so the finally clause is always safe.
        original_cwd = None
        try:
            # Lazy imports - DeepCode modules found via sys.path set in main.py
            # Done inside the try so an import failure is reported to
            # subscribers instead of leaving the task stuck.
            from mcp_agent.app import MCPApp
            from workflows.agent_orchestration_engine import (
                execute_chat_based_planning_pipeline,
            )

            progress_callback = await self._create_progress_callback(task_id)

            # Change to project root directory for MCP server paths to work correctly
            original_cwd = os.getcwd()
            os.chdir(PROJECT_ROOT)

            # Create MCP app context with explicit config path
            app = MCPApp(name="chat_planning", settings=str(CONFIG_PATH))

            async with app.run() as agent_app:
                logger = agent_app.logger
                context = agent_app.context

                # Add current working directory to filesystem server args
                context.config.mcp.servers["filesystem"].args.extend([os.getcwd()])

                # --- User-in-Loop: Before Planning Hook ---
                final_requirements = requirements
                plugin_integration = self._get_plugin_integration()

                if enable_user_interaction and plugin_integration:
                    try:
                        from workflows.plugins import InteractionPoint

                        # Create plugin context
                        plugin_context = plugin_integration.create_context(
                            task_id=task_id,
                            user_input=requirements,
                            requirements=requirements,
                            enable_indexing=enable_indexing,
                        )

                        # Run BEFORE_PLANNING plugins (requirement analysis)
                        plugin_context = await plugin_integration.run_hook(
                            InteractionPoint.BEFORE_PLANNING, plugin_context
                        )

                        # Check if workflow was cancelled by user
                        if plugin_context.get("workflow_cancelled"):
                            task.status = "cancelled"
                            task.completed_at = datetime.utcnow()
                            return {
                                "status": "cancelled",
                                "reason": plugin_context.get(
                                    "cancel_reason", "Cancelled by user"
                                ),
                            }

                        # Use potentially enhanced requirements
                        final_requirements = plugin_context.get(
                            "requirements", requirements
                        )
                        print(
                            f"[WorkflowService] Requirements after plugin: {len(final_requirements)} chars"
                        )

                    except Exception as plugin_error:
                        # Plugins are best-effort: continue without enhancement
                        print(
                            f"[WorkflowService] Plugin error (continuing without): {plugin_error}"
                        )

                # Execute the pipeline with (possibly enhanced) requirements
                result = await execute_chat_based_planning_pipeline(
                    final_requirements,
                    logger,
                    progress_callback,
                    enable_indexing=enable_indexing,
                )

                return await self._finish_success(task, task_id, result)

        except Exception as e:
            return await self._finish_error(task, task_id, e)

        finally:
            # Restore original working directory (only if it was changed)
            if original_cwd is not None:
                os.chdir(original_cwd)

    def cancel_task(self, task_id: str) -> bool:
        """Cancel a running task.

        Sets the task's cancel event and marks it cancelled. Returns ``False``
        when the task is unknown or not currently in the "running" state.
        """
        task = self._tasks.get(task_id)
        if task and task.status == "running":
            task.cancel_event.set()
            task.status = "cancelled"
            return True
        return False

    def cleanup_task(self, task_id: str):
        """Drop the task record and its subscriber list, if present."""
        self._tasks.pop(task_id, None)
        self._subscribers.pop(task_id, None)

    def get_active_tasks(self) -> List[WorkflowTask]:
        """Get all tasks that are currently running"""
        return [task for task in self._tasks.values() if task.status == "running"]

    def get_recent_tasks(self, limit: int = 10) -> List[WorkflowTask]:
        """Get recent tasks sorted by start time (newest first).

        Tasks that have not started yet sort last.
        """
        tasks = list(self._tasks.values())
        # Sort by started_at descending (newest first)
        tasks.sort(key=lambda t: t.started_at or datetime.min, reverse=True)
        return tasks[:limit]


# Global service instance
workflow_service = WorkflowService()


================================================
FILE: new_ui/backend/settings.py
================================================
"""
Configuration management for DeepCode New UI Backend
Reads from existing mcp_agent.config.yaml and mcp_agent.secrets.yaml
"""

from pathlib import Path
from typing import Optional, Dict, Any

import yaml
from pydantic_settings import BaseSettings


# Project paths
# Every location below is derived from this file's resolved path.
BACKEND_DIR = Path(__file__).resolve().parent  # directory containing this file
NEW_UI_DIR = BACKEND_DIR.parent  # one level above the backend directory
PROJECT_ROOT = NEW_UI_DIR.parent  # two levels above the backend directory
CONFIG_PATH = PROJECT_ROOT / "mcp_agent.config.yaml"  # main MCP agent configuration
SECRETS_PATH = PROJECT_ROOT / "mcp_agent.secrets.yaml"  # API secrets


class Settings(BaseSettings):
    """Application settings for the DeepCode New UI backend.

    Fields are populated from environment variables that carry the
    ``DEEPCODE_`` prefix (see ``Config.env_prefix``), e.g. ``DEEPCODE_PORT``;
    the values below are the defaults used when no variable is set.
    """

    # Server settings
    host: str = "0.0.0.0"
    port: int = 8000
    # NOTE(review): debug defaults to on — confirm this is intended outside development
    debug: bool = True

    # Environment: "docker" for production, anything else for development
    env: str = ""

    # CORS settings - in Docker mode, frontend is served by FastAPI (same origin)
    # The defaults are localhost origins on ports 5173, 3000 and 8000.
    cors_origins: list = [
        "http://localhost:5173",
        "http://localhost:3000",
        "http://localhost:8000",
    ]

    # File upload settings
    max_upload_size: int = 100 * 1024 * 1024  # 100MB
    upload_dir: str = str(PROJECT_ROOT / "uploads")  # "uploads" folder under the project root

    # Session settings
    session_timeout: int = 3600  # 1 hour

    class Config:
        # Prefix applied to environment variable names when loading settings
        env_prefix = "DEEPCODE_"


# Module-level settings instance, built once when this module is imported.
settings = Settings()


def _load_yaml_mapping(path: Path) -> Dict[str, Any]:
    """Read ``path`` as YAML and return its top-level mapping.

    Returns an empty dict when the file does not exist, is empty, or its
    top-level node is not a mapping, so callers can always use ``.get``.
    Other I/O errors and YAML syntax errors propagate to the caller.
    """
    try:
        # Open directly instead of checking existence first: the file may
        # disappear between the check and the open.
        with open(path, "r", encoding="utf-8") as f:
            data = yaml.safe_load(f)
    except FileNotFoundError:
        return {}
    return data if isinstance(data, dict) else {}


def load_mcp_config() -> Dict[str, Any]:
    """Load main MCP agent configuration.

    Returns:
        The parsed contents of ``CONFIG_PATH``, or ``{}`` when the file is
        missing, empty, or does not contain a mapping at the top level.
    """
    return _load_yaml_mapping(CONFIG_PATH)


def load_secrets() -> Dict[str, Any]:
    """Load API secrets configuration.

    Returns:
        The parsed contents of ``SECRETS_PATH``, or ``{}`` when the file is
        missing, empty, or does not contain a mapping at the top level.
    """
    return _load_yaml_mapping(SECRETS_PATH)


def get_llm_provider() -> str:
    """Get the preferred LLM provider from config.

    Returns:
        The ``llm_provider`` value from the main configuration, or
        ``"google"`` when the key is absent or has no value.
    """
    config = load_mcp_config()
    # A key written as `llm_provider:` with no value parses to None; treat it
    # like a missing key so the declared `str` return type holds.
    return config.get("llm_provider") or "google"


def get_llm_models(provider: Optional[str] = None) -> Dict[str, str]:
    """Get the model configuration for a provider.

    Args:
        provider: Name of the provider section in the main configuration.
            When omitted or empty, the configured preferred provider is used.

    Returns:
        A dict with the keys ``"default"``, ``"planning"`` and
        ``"implementation"``; a model that is not configured maps to ``""``.
    """
    config = load_mcp_config()
    provider = provider or get_llm_provider()

    provider_config = config.get(provider)
    # A section written as `provider:` with no children parses to None, and a
    # scalar value has no `.get`; treat both as an empty section.
    if not isinstance(provider_config, dict):
        provider_config = {}

    return {
        "default": provider_config.get("default_model") or "",
        "planning": provider_config.get("planning_model") or "",
        "implementation": provider_config.get("implementation_model") or "",
    }


def get_api_key(provider: str) -> Optional[str]:
    """Get API key for a specific provider.

    Args:
        provider: Name of the provider section in the secrets file.

    Returns:
        The section's ``api_key`` value, or None when the section is
        missing, empty, or not a mapping.
    """
    provider_secrets = load_secrets().get(provider)
    # A section written as `provider:` with no children parses to None.
    if not isinstance(provider_secrets, dict):
        return None
    return provider_secrets.get("api_key")


def is_indexing_enabled() -> bool:
    """Check if document indexing is enabled.

    Returns:
        The truthiness of ``document_segmentation.enabled`` in the main
        configuration; False when the section or the key is missing.
    """
    doc_seg = load_mcp_config().get("document_segmentation")
    # A section written with no children parses to None.
    if not isinstance(doc_seg, dict):
        return False
    return bool(doc_seg.get("enabled", False))


================================================
FILE: new_ui/frontend/index.html
================================================
<!DOCTYPE html>
<html lang="en">
  <head>
    <meta charset="UTF-8" />
    <!-- Favicon is loaded from a remote, commit-pinned GitHub URL -->
    <link rel="icon" type="image/svg+xml" href="https://github.com/Zongwei9888/Experiment_Images/raw/43c585dca3d21b8e4b6390d835cdd34dc4b4b23d/DeepCode_images/title_logo.svg" />
    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
    <title>DeepCode - AI-Powered Code Generation</title>
    <!-- Web fonts: Inter (400-700) and JetBrains Mono (400, 500) from Google Fonts -->
    <link rel="preconnect" href="https://fonts.googleapis.com">
    <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
    <link href="https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&family=JetBrains+Mono:wght@400;500&display=swap" rel="stylesheet">
  </head>
  <body>
    <!-- Container element; presumably the mount target used by /src/main.tsx (confirm there) -->
    <div id="root"></div>
    <!-- Application entry point, loaded as an ES module -->
    <script type="module" src="/src/main.tsx"></script>
  </body>
</html>


================================================
FILE: new_ui/frontend/package.json
================================================
{
  "name": "deepcode-new-ui",
  "private": true,
  "version": "1.0.0",
  "type": "module",
  "scripts": {
    "dev": "vite",
    "build": "tsc && vite build",
    "lint": "eslint . --ext ts,tsx --report-unused-disable-directives --max-warnings 0",
    "preview": "vite preview",
    "test": "vitest"
  },
  "dependencies": {
    "@monaco-editor/react": "^4.6.0",
    "@radix-ui/react-dialog": "^1.0.5",
    "@radix-ui/react-dropdown-menu": "^2.0.6",
    "@radix-ui/react-progress": "^1.0.3",
    "@radix-ui/react-tabs": "^1.0.4",
    "@radix-ui/react-toast": "^1.1.5",
    "@tanstack/react-query": "^5.17.0",
    "axios": "^1.6.5",
    "class-variance-authority": "^0.7.0",
    "clsx": "^2.1.0",
    "framer-motion": "^10.18.0",
    "lucide-react": "^0.309.0",
    "react": "^18.2.0",
    "react-dom": "^18.2.0",
    "react-router-dom": "^6.21.2",
    "reactflow": "^11.10.2",
    "tailwind-merge": "^2.2.0",
    "zustand": "^4.4.7"
  },
  "devDependencies": {
    "@types/node": "^20.11.0",
    "@types/react": "^18.2.47",
    "@types/react-dom": "^18.2.18",
    "@typescript-eslint/eslint-plugin": "^6.18.1",
    "@typescript-eslint/parser": "^6.18.1",
    "@vitejs/plugin-react": "^4.2.1",
    "autoprefixer": "^10.4.17",
    "eslint": "^8.56.0",
    "eslint-plugin-react-hooks": "^4.6.0",
    "eslint-plugin-react-refresh": "^0.4.5",
    "postcss": "^8.4.33",
    "tailwindcss": "^3.4.1",
    "typescript": "^5.3.3",
    "vite": "^5.0.11",
    "vitest": "^1.2.0"
  }
}


================================================
FILE: new_ui/frontend/postcss.config.js
================================================
// PostCSS configuration: enables the Tailwind CSS and Autoprefixer plugins,
// each with an empty options object.
export default {
  plugins: {
    tailwindcss: {},
    autoprefixer: {},
  },
}


================================================
FILE: new_ui/frontend/src/App.tsx
================================================
import { BrowserRouter, Routes, Route } from 'react-router-dom'
import { Toaster } from './components/common/Toaster'
import Layout from './components/layout/Layout'
import HomePage from './pages/HomePage'
import PaperToCodePage from './pages/PaperToCodePage'
import ChatPlanningPage from './pages/ChatPlanningPage'
import WorkflowEditorPage from './pages/WorkflowEditorPage'
import SettingsPage from './pages/SettingsPage'

/**
 * Application shell: renders each client-side route's page inside the shared
 * layout and mounts the global toast container next to it.
 */
function App() {
  // Route table: URL path -> page element.
  const pages = [
    { path: '/', element: <HomePage /> },
    { path: '/paper-to-code', element: <PaperToCodePage /> },
    { path: '/chat', element: <ChatPlanningPage /> },
    { path: '/workflow', element: <WorkflowEditorPage /> },
    { path: '/settings', element: <SettingsPage /> },
  ]

  return (
    <BrowserRouter>
      <Layout>
        <Routes>
          {pages.map(({ path, element }) => (
            <Route key={path} path={path} element={element} />
          ))}
        </Routes>
      </Layout>
      <Toaster />
    </BrowserRouter>
  )
}

export default App


================================================
FILE: new_ui/frontend/src/components/common/Button.tsx
================================================
import { ButtonHTMLAttributes, forwardRef } from 'react';
import { clsx } from 'clsx';
import { Loader2 } from 'lucide-react';

/** Props for Button: every native button attribute plus the options below. */
interface ButtonProps extends ButtonHTMLAttributes<HTMLButtonElement> {
  /** Colour scheme; the component defaults to 'primary'. */
  variant?: 'primary' | 'secondary' | 'ghost' | 'danger';
  /** Height, padding and text size preset; the component defaults to 'md'. */
  size?: 'sm' | 'md' | 'lg';
  /** When true the button is disabled and a spinner is rendered before its children. */
  isLoading?: boolean;
}

// Classes shared by every button regardless of variant and size.
const BASE_STYLES =
  'inline-flex items-center justify-center rounded-lg font-medium transition-colors focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-primary-500 focus-visible:ring-offset-2 disabled:pointer-events-none disabled:opacity-50';

// Colour classes per variant.
const VARIANT_STYLES: Record<NonNullable<ButtonProps['variant']>, string> = {
  primary: 'bg-primary-600 text-white hover:bg-primary-700',
  secondary: 'bg-gray-100 text-gray-900 hover:bg-gray-200',
  ghost: 'text-gray-600 hover:bg-gray-100 hover:text-gray-900',
  danger: 'bg-red-600 text-white hover:bg-red-700',
};

// Height, padding and text-size classes per size.
const SIZE_STYLES: Record<NonNullable<ButtonProps['size']>, string> = {
  sm: 'h-8 px-3 text-sm',
  md: 'h-10 px-4 text-sm',
  lg: 'h-12 px-6 text-base',
};

/**
 * Styled button that forwards its ref to the underlying <button> element.
 * While `isLoading` is true the button is disabled and shows a spinner.
 */
const Button = forwardRef<HTMLButtonElement, ButtonProps>((allProps, ref) => {
  const {
    className,
    variant = 'primary',
    size = 'md',
    isLoading = false,
    disabled,
    children,
    ...rest
  } = allProps;

  const classes = clsx(
    BASE_STYLES,
    VARIANT_STYLES[variant],
    SIZE_STYLES[size],
    className
  );
  const spinner = isLoading ? (
    <Loader2 className="mr-2 h-4 w-4 animate-spin" />
  ) : null;

  return (
    <button
      ref={ref}
      className={classes}
      disabled={disabled || isLoading}
      {...rest}
    >
      {spinner}
      {children}
    </button>
  );
});

Button.displayName = 'Button';

export default Button;


================================================
FILE: new_ui/frontend/src/components/common/Card.tsx
================================================
import { ReactNode } from 'react';
import { clsx } from 'clsx';

/** Props for Card. */
interface CardProps {
  /** Content rendered inside the card. */
  children: ReactNode;
  /** Extra classes appended after the card's own classes. */
  className?: string;
  /** Inner padding preset; the component defaults to 'md'. */
  padding?: 'none' | 'sm' | 'md' | 'lg';
}

// Padding class for each `padding` preset ('none' adds no class).
const PADDING_CLASSES: Record<NonNullable<CardProps['padding']>, string> = {
  none: '',
  sm: 'p-4',
  md: 'p-6',
  lg: 'p-8',
};

/** Rounded, bordered white container with a configurable padding preset. */
export default function Card(props: CardProps) {
  const { children, className, padding = 'md' } = props;

  const classes = clsx(
    'rounded-xl border border-gray-200 bg-white shadow-sm',
    PADDING_CLASSES[padding],
    className
  );

  return <div className={classes}>{children}</div>;
}


================================================
FILE: new_ui/frontend/src/components/common/ConfirmDialog.tsx
================================================
/**
 * Confirm Dialog Component
 *
 * A reusable confirmation dialog for destructive or important actions.
 */

import { motion, AnimatePresence } from 'framer-motion';
import { AlertTriangle, X } from 'lucide-react';

/** Props for ConfirmDialog. */
interface ConfirmDialogProps {
  /** Whether the dialog (and its backdrop) is rendered. */
  isOpen: boolean;
  /** Heading text. */
  title: string;
  /** Body text shown under the heading. */
  message: string;
  /** Label of the confirm button; the component defaults to 'Confirm'. */
  confirmLabel?: string;
  /** Label of the cancel button; the component defaults to 'Cancel'. */
  cancelLabel?: string;
  /** Colour scheme of the icon and confirm button; the component defaults to 'warning'. */
  variant?: 'danger' | 'warning' | 'info';
  /** Called when the confirm button is clicked. */
  onConfirm: () => void;
  /** Called when the cancel button, the close button or the backdrop is clicked. */
  onCancel: () => void;
}

/**
 * Modal confirmation dialog with a dimmed backdrop.
 *
 * Renders nothing while `isOpen` is false. Clicking the backdrop, the close
 * button or the cancel button calls `onCancel`; the confirm button calls
 * `onConfirm`. The dialog is exposed to assistive technology as a modal
 * dialog named after `title`.
 */
export function ConfirmDialog({
  isOpen,
  title,
  message,
  confirmLabel = 'Confirm',
  cancelLabel = 'Cancel',
  variant = 'warning',
  onConfirm,
  onCancel,
}: ConfirmDialogProps) {
  // Icon and confirm-button colours per variant.
  const variantStyles = {
    danger: {
      icon: 'bg-red-100 text-red-600',
      button: 'bg-red-600 hover:bg-red-700',
    },
    warning: {
      icon: 'bg-yellow-100 text-yellow-600',
      button: 'bg-yellow-600 hover:bg-yellow-700',
    },
    info: {
      icon: 'bg-blue-100 text-blue-600',
      button: 'bg-blue-600 hover:bg-blue-700',
    },
  };

  const styles = variantStyles[variant];

  return (
    <AnimatePresence>
      {isOpen && (
        <>
          {/* Backdrop */}
          <motion.div
            initial={{ opacity: 0 }}
            animate={{ opacity: 1 }}
            exit={{ opacity: 0 }}
            className="fixed inset-0 bg-black/50 z-50"
            onClick={onCancel}
          />

          {/* Dialog */}
          {/* NOTE(review): framer-motion writes an inline transform for scale/y, which may
              override the Tailwind translate utilities used for centering — verify visually. */}
          <motion.div
            role="dialog"
            aria-modal="true"
            aria-label={title}
            initial={{ opacity: 0, scale: 0.95, y: 20 }}
            animate={{ opacity: 1, scale: 1, y: 0 }}
            exit={{ opacity: 0, scale: 0.95, y: 20 }}
            className="fixed left-1/2 top-1/2 -translate-x-1/2 -translate-y-1/2 z-50 w-full max-w-md"
          >
            <div className="bg-white rounded-xl shadow-xl p-6">
              {/* Close button (icon only, so it needs an explicit accessible name) */}
              <button
                type="button"
                aria-label="Close"
                onClick={onCancel}
                className="absolute top-4 right-4 text-gray-400 hover:text-gray-600"
              >
                <X className="h-5 w-5" />
              </button>

              {/* Icon */}
              <div className={`w-12 h-12 rounded-full ${styles.icon} flex items-center justify-center mb-4`}>
                <AlertTriangle className="h-6 w-6" />
              </div>

              {/* Content */}
              <h3 className="text-lg font-semibold text-gray-900 mb-2">
                {title}
              </h3>
              <p className="text-sm text-gray-600 mb-6">
                {message}
              </p>

              {/* Actions: type="button" keeps them from submitting an enclosing form */}
              <div className="flex space-x-3">
                <button
                  type="button"
                  onClick={onCancel}
                  className="flex-1 px-4 py-2 text-sm font-medium text-gray-700 bg-gray-100 rounded-lg hover:bg-gray-200 transition-colors"
                >
                  {cancelLabel}
                </button>
                <button
                  type="button"
                  onClick={onConfirm}
                  className={`flex-1 px-4 py-2 text-sm font-medium text-white rounded-lg transition-colors ${styles.button}`}
                >
                  {confirmLabel}
                </button>
              </div>
            </div>
          </motion.div>
        </>
      )}
    </AnimatePresence>
  );
}


================================================
FILE: new_ui/frontend/src/components/common/GuardedLink.tsx
================================================
/**
 * Guarded Link Component
 *
 * A Link component that respects the navigation guard.
 * Shows confirmation dialog when trying to navigate away during a running task.
 */

import { Link, LinkProps, useLocation } from 'react-router-dom';
import { useWorkflowStore } from '../../stores/workflowStore';
import { useState } from 'react';
import { ConfirmDialog } from './ConfirmDialog';

/**
 * Props for GuardedLink: the router Link props without `onClick`, which the
 * component supplies itself.
 */
interface GuardedLinkProps extends Omit<LinkProps, 'onClick'> {
  /** Link content. */
  children: React.ReactNode;
}

/**
 * Router link that asks for confirmation before leaving the current page
 * while the workflow store reports a running task. Links to the current
 * path, and all links while no task is running, behave like a plain Link.
 */
export function GuardedLink({ to, children, ...props }: GuardedLinkProps) {
  const { status } = useWorkflowStore();
  const { pathname: currentPath } = useLocation();
  const [showDialog, setShowDialog] = useState(false);

  const destination = typeof to === 'string' ? to : to.pathname;
  const mustConfirm = status === 'running' && destination !== currentPath;

  function handleClick(e: React.MouseEvent<HTMLAnchorElement>) {
    if (!mustConfirm) {
      return;
    }
    // Hold the navigation back until the user has answered the dialog.
    e.preventDefault();
    setShowDialog(true);
  }

  function closeDialog() {
    setShowDialog(false);
  }

  function handleConfirm() {
    setShowDialog(false);
    // Navigate by setting window.location to trigger actual navigation
    let href: string;
    if (typeof to === 'string') {
      href = to;
    } else {
      href = to.pathname || '/';
    }
    window.location.href = href;
  }

  return (
    <>
      <Link to={to} onClick={handleClick} {...props}>
        {children}
      </Link>

      <ConfirmDialog
        isOpen={showDialog}
        title="Task is still running"
        message="A task is currently running. If you leave this page, the task will continue in the background, but you may lose track of its progress."
        confirmLabel="Leave anyway"
        cancelLabel="Stay here"
        variant="warning"
        onConfirm={handleConfirm}
        onCancel={closeDialog}
      />
    </>
  );
}


================================================
FILE: new_ui/frontend/src/components/common/TaskRecoveryBanner.tsx
================================================
/**
 * Task Recovery Banner
 *
 * Shows a notification when a running task is recovered after page refresh.
 */

import { motion, AnimatePresence } from 'framer-motion';
import { RefreshCw, X, ExternalLink } from 'lucide-react';
import { useWorkflowStore } from '../../stores/workflowStore';
import { useNavigate } from 'react-router-dom';

/** Props for TaskRecoveryBanner. */
interface TaskRecoveryBannerProps {
  /** True while recovery is in progress; the banner then shows a spinner and "Recovering task...". */
  isRecovering: boolean;
  /** Id of the recovered task, or null; the banner is hidden when this is null and isRecovering is false. */
  recoveredTaskId: string | null;
  /** Called when the banner is dismissed and after the "View" button is used. */
  onDismiss: () => void;
}

/**
 * Banner fixed to the top of the page that reports task recovery.
 *
 * Shows a spinner while `isRecovering` is true; afterwards it offers a "View"
 * button that opens the page for the recovered workflow and a dismiss button.
 * Nothing is rendered when there is no recovery to report or when the
 * workflow status is 'completed', 'error' or 'idle'.
 */
export function TaskRecoveryBanner({
  isRecovering,
  recoveredTaskId,
  onDismiss,
}: TaskRecoveryBannerProps) {
  const navigate = useNavigate();
  const { workflowType, status } = useWorkflowStore();

  const handleGoToTask = () => {
    if (workflowType === 'chat-planning') {
      // The chat planning page is registered at '/chat' in App.tsx;
      // '/chat-planning' is the workflow type name, not a route.
      navigate('/chat');
    } else if (workflowType === 'paper-to-code') {
      navigate('/paper-to-code');
    }
    onDismiss();
  };

  // Don't show if not recovering and no recovered task
  if (!isRecovering && !recoveredTaskId) {
    return null;
  }

  // Don't show if task is completed, has an error, or no workflow is active
  if (status === 'completed' || status === 'error' || status === 'idle') {
    return null;
  }

  return (
    <AnimatePresence>
      <motion.div
        initial={{ opacity: 0, y: -50 }}
        animate={{ opacity: 1, y: 0 }}
        exit={{ opacity: 0, y: -50 }}
        className="fixed top-4 left-1/2 transform -translate-x-1/2 z-50"
      >
        <div className="bg-blue-50 border border-blue-200 rounded-lg shadow-lg px-4 py-3 flex items-center space-x-3">
          {isRecovering ? (
            <>
              <RefreshCw className="h-5 w-5 text-blue-500 animate-spin" />
              <span className="text-sm text-blue-700">
                Recovering task...
              </span>
            </>
          ) : (
            <>
              <RefreshCw className="h-5 w-5 text-blue-500" />
              <span className="text-sm text-blue-700">
                Task recovered! Your workflow is still running.
              </span>
              <button
                type="button"
                onClick={handleGoToTask}
                className="flex items-center text-sm font-medium text-blue-600 hover:text-blue-800"
              >
                View
                <ExternalLink className="h-3 w-3 ml-1" />
              </button>
              {/* Icon-only button, so it needs an explicit accessible name */}
              <button
                type="button"
                aria-label="Dismiss"
                onClick={onDismiss}
                className="text-blue-400 hover:text-blue-600"
              >
                <X className="h-4 w-4" />
              </button>
            </>
          )}
        </div>
      </motion.div>
    </AnimatePresence>
  );
}


================================================
FILE: new_ui/frontend/src/components/common/Toaster.tsx
================================================
import { useEffect, useState } from 'react';
import { X, CheckCircle, AlertCircle, Info, AlertTriangle } from 'lucide-react';
import { motion, AnimatePresence } from 'framer-motion';

/** A single notification held in the toast store. */
interface Toast {
  /** Unique id, used as the React key and to dismiss the toast. */
  id: string;
  /** Severity; selects the icon and colour scheme. */
  type: 'success' | 'error' | 'warning' | 'info';
  /** Main line of text. */
  title: string;
  /** Optional secondary line shown under the title. */
  description?: string;
}

// Module-level toast store: the current toasts and the callbacks to inform
// whenever that list changes.
let toasts: Toast[] = [];
let listeners: Array<(toasts: Toast[]) => void> = [];

/** Hand every subscribed listener its own copy of the current toast list. */
function notify(): void {
  listeners.forEach((emit) => {
    emit([...toasts]);
  });
}

/** Delay before a toast of each type dismisses itself, in milliseconds. */
const TOAST_DURATION_MS: Record<Toast['type'], number> = {
  success: 5000,
  error: 8000,
  warning: 6000,
  info: 5000,
};

let toastSequence = 0;

/**
 * Create a unique toast id.
 *
 * `crypto.randomUUID` exists only in secure contexts (HTTPS or localhost), so
 * fall back to a timestamp plus counter when the page is served over plain
 * HTTP from another host.
 */
const createToastId = (): string => {
  if (typeof crypto !== 'undefined' && typeof crypto.randomUUID === 'function') {
    return crypto.randomUUID();
  }
  toastSequence += 1;
  return `toast-${Date.now()}-${toastSequence}`;
};

/** Add a toast to the store, notify listeners and schedule its auto-dismissal. */
const pushToast = (
  type: Toast['type'],
  title: string,
  description?: string
): void => {
  const id = createToastId();
  toasts = [...toasts, { id, type, title, description }];
  notify();
  setTimeout(() => toast.dismiss(id), TOAST_DURATION_MS[type]);
};

/**
 * Imperative toast API usable from anywhere in the app.
 * `success`, `error`, `warning` and `info` show a toast that dismisses itself
 * after a type-specific delay; `dismiss` removes a toast by id.
 */
export const toast = {
  success: (title: string, description?: string) => {
    pushToast('success', title, description);
  },
  error: (title: string, description?: string) => {
    pushToast('error', title, description);
  },
  warning: (title: string, description?: string) => {
    pushToast('warning', title, description);
  },
  info: (title: string, description?: string) => {
    pushToast('info', title, description);
  },
  dismiss: (id: string) => {
    const remaining = toasts.filter((t) => t.id !== id);
    // The auto-dismiss timer also fires for toasts the user already closed;
    // skip the notification when nothing was removed.
    if (remaining.length === toasts.length) {
      return;
    }
    toasts = remaining;
    notify();
  },
};

// Icon component rendered for each toast type.
const icons = {
  success: CheckCircle,
  error: AlertCircle,
  warning: AlertTriangle,
  info: Info,
};

// Background, border and text colour classes of the toast container per type.
const colors = {
  success: 'bg-green-50 border-green-200 text-green-800',
  error: 'bg-red-50 border-red-200 text-red-800',
  warning: 'bg-yellow-50 border-yellow-200 text-yellow-800',
  info: 'bg-blue-50 border-blue-200 text-blue-800',
};

// Colour class applied to the icon per type.
const iconColors = {
  success: 'text-green-500',
  error: 'text-red-500',
  warning: 'text-yellow-500',
  info: 'text-blue-500',
};

/**
 * Renders the toasts held in the module-level store as a stack in the
 * bottom-right corner. Subscribes to the store on mount and unsubscribes on
 * unmount.
 */
export function Toaster() {
  const [currentToasts, setCurrentToasts] = useState<Toast[]>([]);

  useEffect(() => {
    listeners.push(setCurrentToasts);
    // Toasts raised before this effect ran (for example from another
    // component's mount effect) were announced to nobody; show them now.
    if (toasts.length > 0) {
      setCurrentToasts([...toasts]);
    }
    return () => {
      listeners = listeners.filter((l) => l !== setCurrentToasts);
    };
  }, []);

  return (
    <div className="fixed bottom-4 right-4 z-50 flex flex-col gap-2">
      <AnimatePresence>
        {currentToasts.map((t) => {
          const Icon = icons[t.type];
          return (
            <motion.div
              key={t.id}
              initial={{ opacity: 0, y: 20, scale: 0.95 }}
              animate={{ opacity: 1, y: 0, scale: 1 }}
              exit={{ opacity: 0, y: -10, scale: 0.95 }}
              className={`flex items-start gap-3 p-4 rounded-lg border shadow-lg max-w-sm ${colors[t.type]}`}
            >
              <Icon className={`h-5 w-5 mt-0.5 ${iconColors[t.type]}`} />
              <div className="flex-1 min-w-0">
                <p className="font-medium text-sm">{t.title}</p>
                {t.description && (
                  <p className="text-sm opacity-80 mt-0.5">{t.description}</p>
                )}
              </div>
              {/* Icon-only button, so it needs an explicit accessible name */}
              <button
                type="button"
                aria-label="Dismiss notification"
                onClick={() => toast.dismiss(t.id)}
                className="p-1 rounded hover:bg-black/5 transition-colors"
              >
                <X className="h-4 w-4" />
              </button>
            </motion.div>
          );
        })}
      </AnimatePresence>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/common/index.ts
================================================
export { default as Button } from './Button';
export { default as Card } from './Card';
export { Toaster, toast } from './Toaster';


================================================
FILE: new_ui/frontend/src/components/input/ChatInput.tsx
================================================
import { useState, useRef, KeyboardEvent } from 'react';
import { Send, Loader2 } from 'lucide-react';
import { motion } from 'framer-motion';

/** Props for ChatInput. */
interface ChatInputProps {
  /** Called with the trimmed message when the user sends it. */
  onSubmit: (message: string) => void;
  /** Placeholder text of the textarea. */
  placeholder?: string;
  /** When true the textarea and send button are disabled and the button shows a spinner. */
  isLoading?: boolean;
  /** When true the textarea and send button are disabled. */
  disabled?: boolean;
}

/**
 * Auto-growing chat textarea with a send button.
 *
 * Enter sends the trimmed message and clears the field; Shift+Enter inserts a
 * new line. Empty messages are not sent, and nothing is sent while
 * `isLoading` or `disabled` is set.
 */
export default function ChatInput({
  onSubmit,
  placeholder = 'Describe your project requirements...',
  isLoading = false,
  disabled = false,
}: ChatInputProps) {
  const [message, setMessage] = useState('');
  const textareaRef = useRef<HTMLTextAreaElement>(null);

  const handleSubmit = () => {
    const trimmedMessage = message.trim();
    if (trimmedMessage && !isLoading && !disabled) {
      onSubmit(trimmedMessage);
      setMessage('');
      // Collapse the textarea back to its single-row height.
      if (textareaRef.current) {
        textareaRef.current.style.height = 'auto';
      }
    }
  };

  const handleKeyDown = (e: KeyboardEvent<HTMLTextAreaElement>) => {
    // While an IME composition is active (e.g. Chinese or Japanese input),
    // Enter confirms the candidate text and must not send the message.
    if (e.nativeEvent.isComposing) {
      return;
    }
    if (e.key === 'Enter' && !e.shiftKey) {
      e.preventDefault();
      handleSubmit();
    }
  };

  const handleInput = () => {
    const textarea = textareaRef.current;
    if (textarea) {
      // Reset first so the element can shrink, then grow to fit up to 200px.
      textarea.style.height = 'auto';
      textarea.style.height = Math.min(textarea.scrollHeight, 200) + 'px';
    }
  };

  return (
    <motion.div
      initial={{ opacity: 0, y: 10 }}
      animate={{ opacity: 1, y: 0 }}
      className="relative"
    >
      <div className="flex items-end gap-2 p-3 bg-white border border-gray-200 rounded-xl shadow-sm focus-within:ring-2 focus-within:ring-primary-500 focus-within:border-primary-500 transition-shadow">
        <textarea
          ref={textareaRef}
          value={message}
          onChange={(e) => setMessage(e.target.value)}
          onKeyDown={handleKeyDown}
          onInput={handleInput}
          placeholder={placeholder}
          disabled={disabled || isLoading}
          rows={1}
          className="flex-1 resize-none border-0 bg-transparent text-sm text-gray-900 placeholder-gray-400 focus:outline-none disabled:opacity-50"
          style={{ maxHeight: '200px' }}
        />
        {/* Icon-only button, so it needs an explicit accessible name */}
        <button
          type="button"
          aria-label="Send message"
          onClick={handleSubmit}
          disabled={!message.trim() || isLoading || disabled}
          className="flex-shrink-0 p-2 rounded-lg bg-primary-600 text-white hover:bg-primary-700 disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
        >
          {isLoading ? (
            <Loader2 className="h-5 w-5 animate-spin" />
          ) : (
            <Send className="h-5 w-5" />
          )}
        </button>
      </div>
      <p className="mt-2 text-xs text-gray-400 text-center">
        Press Enter to send, Shift+Enter for new line
      </p>
    </motion.div>
  );
}


================================================
FILE: new_ui/frontend/src/components/input/FileUploader.tsx
================================================
import { useCallback, useState } from 'react';
import { Upload, File, X, Loader2 } from 'lucide-react';
import { motion, AnimatePresence } from 'framer-motion';
import { filesApi } from '../../services/api';
import { toast } from '../common/Toaster';

/** Props for FileUploader. */
interface FileUploaderProps {
  /** Called after a successful upload with the `file_id` and `path` from the upload response. */
  onFileUploaded: (fileId: string, path: string) => void;
  /** Accepted file extensions including the leading dot; the component defaults to .pdf, .md and .txt. */
  acceptedTypes?: string[];
  maxSize?: number; // in bytes
  /** When true, drag-and-drop handlers are detached and the file input is disabled. */
  disabled?: boolean;
}

/**
 * Drag-and-drop / click-to-browse uploader for a single file.
 *
 * The file's extension and size are validated on the client before it is
 * sent through `filesApi.upload`. After a successful upload the drop zone is
 * replaced by a summary of the file with a remove button, and
 * `onFileUploaded` is called with the uploaded file's id and path.
 */
export default function FileUploader({
  onFileUploaded,
  acceptedTypes = ['.pdf', '.md', '.txt'],
  maxSize = 100 * 1024 * 1024, // 100MB
  disabled = false,
}: FileUploaderProps) {
  const [isDragging, setIsDragging] = useState(false);
  const [uploadedFile, setUploadedFile] = useState<{
    id: string;
    name: string;
    size: number;
  } | null>(null);
  const [isUploading, setIsUploading] = useState(false);

  const handleDragOver = useCallback((e: React.DragEvent) => {
    e.preventDefault();
    setIsDragging(true);
  }, []);

  const handleDragLeave = useCallback((e: React.DragEvent) => {
    e.preventDefault();
    setIsDragging(false);
  }, []);

  const uploadFile = async (file: File) => {
    // Validate file type
    const ext = '.' + file.name.split('.').pop()?.toLowerCase();
    if (!acceptedTypes.includes(ext)) {
      toast.error(
        'Invalid file type',
        `Accepted types: ${acceptedTypes.join(', ')}`
      );
      return;
    }

    // Validate file size
    if (file.size > maxSize) {
      toast.error(
        'File too large',
        `Maximum size: ${Math.round(maxSize / (1024 * 1024))}MB`
      );
      return;
    }

    setIsUploading(true);
    try {
      const result = await filesApi.upload(file);
      setUploadedFile({
        id: result.file_id,
        name: result.filename,
        size: result.size,
      });
      onFileUploaded(result.file_id, result.path);
      toast.success('File uploaded', result.filename);
    } catch (error) {
      toast.error('Upload failed', 'Please try again');
      console.error('Upload error:', error);
    } finally {
      setIsUploading(false);
    }
  };

  // Plain functions rather than useCallback: `uploadFile` is recreated on
  // every render, so memoizing handlers that depend on it would have no effect.
  const handleDrop = (e: React.DragEvent) => {
    e.preventDefault();
    setIsDragging(false);

    // The file input is disabled while uploading; apply the same rule to
    // drops so a second upload cannot start in parallel.
    if (isUploading) {
      return;
    }

    const file = e.dataTransfer.files[0];
    if (file) {
      uploadFile(file);
    }
  };

  const handleFileSelect = (e: React.ChangeEvent<HTMLInputElement>) => {
    const file = e.target.files?.[0];
    // Clear the input so choosing the same file again (for example after a
    // failed upload) still fires a change event.
    e.target.value = '';
    if (file) {
      uploadFile(file);
    }
  };

  const removeFile = async () => {
    if (uploadedFile) {
      try {
        await filesApi.delete(uploadedFile.id);
      } catch {
        // Ignore delete errors
      }
      setUploadedFile(null);
    }
  };

  const formatFileSize = (bytes: number) => {
    if (bytes < 1024) return bytes + ' B';
    if (bytes < 1024 * 1024) return (bytes / 1024).toFixed(1) + ' KB';
    return (bytes / (1024 * 1024)).toFixed(1) + ' MB';
  };

  return (
    <div className="w-full">
      <AnimatePresence mode="wait">
        {uploadedFile ? (
          <motion.div
            initial={{ opacity: 0, scale: 0.95 }}
            animate={{ opacity: 1, scale: 1 }}
            exit={{ opacity: 0, scale: 0.95 }}
            className="flex items-center justify-between p-4 bg-gray-50 border border-gray-200 rounded-lg"
          >
            <div className="flex items-center space-x-3">
              <div className="p-2 bg-primary-100 rounded-lg">
                <File className="h-5 w-5 text-primary-600" />
              </div>
              <div>
                <p className="font-medium text-sm text-gray-900">
                  {uploadedFile.name}
                </p>
                <p className="text-xs text-gray-500">
                  {formatFileSize(uploadedFile.size)}
                </p>
              </div>
            </div>
            {/* Icon-only button, so it needs an explicit accessible name */}
            <button
              type="button"
              aria-label="Remove file"
              onClick={removeFile}
              className="p-1.5 text-gray-400 hover:text-gray-600 hover:bg-gray-200 rounded-lg transition-colors"
            >
              <X className="h-4 w-4" />
            </button>
          </motion.div>
        ) : (
          <motion.div
            initial={{ opacity: 0 }}
            animate={{ opacity: 1 }}
            exit={{ opacity: 0 }}
            onDragOver={disabled ? undefined : handleDragOver}
            onDragLeave={disabled ? undefined : handleDragLeave}
            onDrop={disabled ? undefined : handleDrop}
            className={`relative border-2 border-dashed rounded-lg p-8 text-center transition-colors ${
              disabled
                ? 'border-gray-200 bg-gray-50 opacity-60 cursor-not-allowed'
                : isDragging
                ? 'border-primary-500 bg-primary-50'
                : 'border-gray-300 hover:border-gray-400'
            }`}
          >
            {/* Invisible file input stretched over the whole drop zone */}
            <input
              type="file"
              accept={acceptedTypes.join(',')}
              onChange={handleFileSelect}
              className="absolute inset-0 w-full h-full opacity-0 cursor-pointer disabled:cursor-not-allowed"
              disabled={isUploading || disabled}
            />

            {isUploading ? (
              <div className="flex flex-col items-center">
                <Loader2 className="h-10 w-10 text-primary-500 animate-spin mb-3" />
                <p className="text-sm text-gray-600">Uploading...</p>
              </div>
            ) : (
              <div className="flex flex-col items-center">
                <Upload
                  className={`h-10 w-10 mb-3 ${
                    isDragging ? 'text-primary-500' : 'text-gray-400'
                  }`}
                />
                <p className="text-sm font-medium text-gray-700 mb-1">
                  Drop your file here or click to browse
                </p>
                <p className="text-xs text-gray-500">
                  Supports {acceptedTypes.join(', ')} up to{' '}
                  {Math.round(maxSize / (1024 * 1024))}MB
                </p>
              </div>
            )}
          </motion.div>
        )}
      </AnimatePresence>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/input/UrlInput.tsx
================================================
import { useState } from 'react';
import { Link2, Check, X, Loader2 } from 'lucide-react';
import { motion, AnimatePresence } from 'framer-motion';

/** Props for UrlInput. */
interface UrlInputProps {
  /** Called with the trimmed URL when a valid URL is submitted. */
  onSubmit: (url: string) => void;
  /** Placeholder text of the input. */
  placeholder?: string;
  /** When true the input and button are disabled and the button shows a spinner. */
  isLoading?: boolean;
  /** When true the input and button are disabled. */
  disabled?: boolean;
}

/**
 * URL field with live validation and a "Load" button.
 *
 * The value is validated on every change; only absolute http(s) URLs are
 * accepted. Pressing Enter or clicking "Load" calls `onSubmit` with the
 * trimmed URL when it is valid and the field is neither loading nor disabled.
 */
export default function UrlInput({
  onSubmit,
  placeholder = 'https://arxiv.org/abs/...',
  isLoading = false,
  disabled = false,
}: UrlInputProps) {
  const [url, setUrl] = useState('');
  // null = nothing entered yet, so neither the valid nor the invalid state is shown.
  const [isValid, setIsValid] = useState<boolean | null>(null);

  const validateUrl = (value: string) => {
    try {
      const parsed = new URL(value.trim());
      // `new URL` alone also accepts schemes such as javascript: or mailto:,
      // which cannot point at a paper, repository or PDF.
      return parsed.protocol === 'http:' || parsed.protocol === 'https:';
    } catch {
      return false;
    }
  };

  const handleChange = (value: string) => {
    setUrl(value);
    if (value.trim()) {
      setIsValid(validateUrl(value));
    } else {
      setIsValid(null);
    }
  };

  const handleSubmit = () => {
    // Mirror the button's disabled condition so no other trigger can submit
    // while loading or disabled.
    if (isLoading || disabled) {
      return;
    }
    if (url.trim() && isValid) {
      onSubmit(url.trim());
    }
  };

  return (
    <motion.div
      initial={{ opacity: 0, y: 10 }}
      animate={{ opacity: 1, y: 0 }}
      className="w-full"
    >
      <div className="relative">
        <div className="absolute inset-y-0 left-0 pl-3 flex items-center pointer-events-none">
          <Link2 className="h-5 w-5 text-gray-400" />
        </div>
        <input
          type="url"
          value={url}
          onChange={(e) => handleChange(e.target.value)}
          onKeyDown={(e) => e.key === 'Enter' && handleSubmit()}
          placeholder={placeholder}
          disabled={isLoading || disabled}
          className={`w-full pl-10 pr-24 py-3 border rounded-lg text-sm focus:outline-none focus:ring-2 focus:ring-primary-500 transition-colors disabled:opacity-60 disabled:cursor-not-allowed ${
            isValid === false
              ? 'border-red-300 bg-red-50'
              : isValid === true
              ? 'border-green-300 bg-green-50'
              : 'border-gray-200 bg-white'
          }`}
        />
        <div className="absolute inset-y-0 right-0 flex items-center pr-2">
          <AnimatePresence mode="wait">
            {isValid !== null && (
              <motion.span
                initial={{ opacity: 0, scale: 0.8 }}
                animate={{ opacity: 1, scale: 1 }}
                exit={{ opacity: 0, scale: 0.8 }}
                className="mr-2"
              >
                {isValid ? (
                  <Check className="h-4 w-4 text-green-500" />
                ) : (
                  <X className="h-4 w-4 text-red-500" />
                )}
              </motion.span>
            )}
          </AnimatePresence>
          <button
            type="button"
            onClick={handleSubmit}
            disabled={!isValid || isLoading || disabled}
            className="px-3 py-1.5 text-sm font-medium text-white bg-primary-600 rounded-md hover:bg-primary-700 disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
          >
            {isLoading ? (
              <Loader2 className="h-4 w-4 animate-spin" />
            ) : (
              'Load'
            )}
          </button>
        </div>
      </div>
      {isValid === false && url.trim() && (
        <p className="mt-1.5 text-xs text-red-500">Please enter a valid URL</p>
      )}
      <p className="mt-2 text-xs text-gray-400">
        Supported: ArXiv, GitHub, and direct PDF links
      </p>
    </motion.div>
  );
}


================================================
FILE: new_ui/frontend/src/components/input/index.ts
================================================
// Barrel file: re-exports each input component's default export under a
// named export so consumers can import them from this directory.
export { default as FileUploader } from './FileUploader';
export { default as ChatInput } from './ChatInput';
export { default as UrlInput } from './UrlInput';


================================================
FILE: new_ui/frontend/src/components/interaction/InlineChatInteraction.tsx
================================================
/**
 * InlineChatInteraction Component
 *
 * Displays User-in-Loop interactions inline within the chat flow.
 * Designed to look like an AI assistant message with interactive elements.
 */

import { useState, useCallback } from 'react';
import { motion, AnimatePresence } from 'framer-motion';
import {
  Send,
  SkipForward,
  CheckCircle,
  XCircle,
  Edit,
  HelpCircle,
  Loader2,
  Bot
} from 'lucide-react';
import { Button } from '../common';
import { useWorkflowStore, type PendingInteraction } from '../../stores/workflowStore';
import { workflowsApi } from '../../services/api';
import { toast } from '../common/Toaster';

/** Props accepted by the InlineChatInteraction component. */
interface InlineChatInteractionProps {
  /** Task identifier forwarded to `workflowsApi.respondToInteraction`. */
  taskId: string;
  /** The pending interaction to render; its `type` selects the layout. */
  interaction: PendingInteraction;
  /** Optional callback invoked after a submit or skip request succeeds. */
  onComplete?: () => void;
}

/**
 * Renders a pending User-in-Loop interaction as an assistant-style chat bubble.
 *
 * The body depends on `interaction.type`:
 * - `requirement_questions`: one textarea per question plus Skip / Submit
 * - `plan_review`: the plan text with Cancel / Modify / Approve actions
 * - anything else: one button per entry in `interaction.options`
 *
 * After a response (or skip) is accepted by the API, the interaction is
 * cleared from the workflow store and `onComplete` is invoked if provided.
 * On failure an error toast is shown and the interaction stays on screen.
 */
export default function InlineChatInteraction({
  taskId,
  interaction,
  onComplete
}: InlineChatInteractionProps) {
  const [isSubmitting, setIsSubmitting] = useState(false);
  const [answers, setAnswers] = useState<Record<string, string>>({});
  const [feedback, setFeedback] = useState('');
  const [showModify, setShowModify] = useState(false);
  const { clearInteraction, addActivityLog } = useWorkflowStore();

  // Sends the chosen action (with optional payload) for this task.
  const handleSubmit = useCallback(async (action: string, data: Record<string, unknown> = {}) => {
    setIsSubmitting(true);
    try {
      await workflowsApi.respondToInteraction(taskId, action, data, false);
      addActivityLog(`✓ Submitted: ${action}`, 0, 'success');
      clearInteraction();
      onComplete?.();
    } catch (error) {
      console.error('Failed to submit response:', error);
      toast.error('Failed to submit', 'Please try again');
    } finally {
      setIsSubmitting(false);
    }
  }, [taskId, clearInteraction, addActivityLog, onComplete]);

  // Skips the interaction; the API is called with the "skip" action and the
  // final flag set to true (as opposed to false for regular submissions).
  const handleSkip = useCallback(async () => {
    setIsSubmitting(true);
    try {
      await workflowsApi.respondToInteraction(taskId, 'skip', {}, true);
      addActivityLog('⏭️ Skipped interaction', 0, 'info');
      clearInteraction();
      onComplete?.();
    } catch (error) {
      console.error('Failed to skip:', error);
      toast.error('Failed to skip', 'Please try again');
    } finally {
      setIsSubmitting(false);
    }
  }, [taskId, clearInteraction, addActivityLog, onComplete]);

  // Render questions type
  const renderQuestions = () => {
    const questions = interaction.data?.questions || [];

    return (
      <div className="space-y-3">
        {questions.map((q: { id?: string; question: string; hint?: string; category?: string }, index: number) => {
          // Answers are keyed by the question id, falling back to a
          // positional key when the question carries no id.
          const answerKey = q.id || `q${index}`;

          return (
            <motion.div
              key={q.id || index}
              initial={{ opacity: 0, y: 10 }}
              animate={{ opacity: 1, y: 0 }}
              transition={{ delay: index * 0.1 }}
              className="bg-white rounded-lg p-3 border border-gray-200 shadow-sm"
            >
              <div className="flex items-start space-x-2">
                <div className="flex-shrink-0 w-5 h-5 rounded-full bg-primary-100 flex items-center justify-center mt-0.5">
                  <span className="text-xs font-semibold text-primary-600">{index + 1}</span>
                </div>
                <div className="flex-1 min-w-0">
                  {q.category && (
                    <span className="inline-block px-2 py-0.5 text-xs font-medium text-primary-700 bg-primary-50 rounded mb-1">
                      {q.category}
                    </span>
                  )}
                  <p className="text-sm font-medium text-gray-900">{q.question}</p>
                  {q.hint && (
                    <p className="text-xs text-gray-500 mt-1 flex items-center">
                      <HelpCircle className="h-3 w-3 mr-1 flex-shrink-0" />
                      <span>{q.hint}</span>
                    </p>
                  )}
                  <textarea
                    className="mt-2 w-full px-3 py-2 text-sm border border-gray-200 rounded-lg focus:ring-2 focus:ring-primary-500 focus:border-transparent resize-none bg-gray-50"
                    rows={2}
                    placeholder="Type your answer here..."
                    value={answers[answerKey] || ''}
                    onChange={(e) => setAnswers(prev => ({
                      ...prev,
                      [answerKey]: e.target.value
                    }))}
                    disabled={isSubmitting}
                  />
                </div>
              </div>
            </motion.div>
          );
        })}

        <div className="flex justify-end space-x-2 pt-3">
          {!interaction.required && (
            <Button
              variant="secondary"
              size="sm"
              onClick={handleSkip}
              disabled={isSubmitting}
            >
              <SkipForward className="h-3.5 w-3.5 mr-1.5" />
              Skip
            </Button>
          )}
          <Button
            variant="primary"
            size="sm"
            onClick={() => handleSubmit('submit', { answers })}
            disabled={isSubmitting}
          >
            {isSubmitting ? (
              <Loader2 className="h-3.5 w-3.5 mr-1.5 animate-spin" />
            ) : (
              <Send className="h-3.5 w-3.5 mr-1.5" />
            )}
            Submit Answers
          </Button>
        </div>
      </div>
    );
  };

  // Render plan review type
  const renderPlanReview = () => {
    const plan = interaction.data?.plan || interaction.data?.plan_preview || '';

    return (
      <div className="space-y-3">
        <div className="bg-gray-900 rounded-lg p-3 max-h-60 overflow-y-auto">
          <pre className="text-xs text-gray-300 font-mono whitespace-pre-wrap">
            {plan}
          </pre>
        </div>

        <AnimatePresence>
          {showModify && (
            <motion.div
              initial={{ opacity: 0, height: 0 }}
              animate={{ opacity: 1, height: 'auto' }}
              exit={{ opacity: 0, height: 0 }}
            >
              <textarea
                className="w-full px-3 py-2 text-sm border border-gray-200 rounded-lg focus:ring-2 focus:ring-primary-500 focus:border-transparent resize-none bg-gray-50"
                rows={3}
                placeholder="Describe the changes you'd like to make..."
                value={feedback}
                onChange={(e) => setFeedback(e.target.value)}
                disabled={isSubmitting}
              />
            </motion.div>
          )}
        </AnimatePresence>

        <div className="flex flex-wrap justify-end gap-2 pt-3">
          <Button
            variant="danger"
            size="sm"
            onClick={() => handleSubmit('cancel', { reason: 'User cancelled' })}
            disabled={isSubmitting}
          >
            <XCircle className="h-3.5 w-3.5 mr-1.5" />
            Cancel
          </Button>

          {!showModify ? (
            <Button
              variant="secondary"
              size="sm"
              onClick={() => setShowModify(true)}
              disabled={isSubmitting}
            >
              <Edit className="h-3.5 w-3.5 mr-1.5" />
              Modify
            </Button>
          ) : (
            <Button
              variant="secondary"
              size="sm"
              onClick={() => {
                // The button is disabled while the feedback is blank; the
                // warning is kept as a defensive fallback.
                if (feedback.trim()) {
                  handleSubmit('modify', { feedback });
                } else {
                  toast.warning('Please provide feedback', 'Describe what you want to change');
                }
              }}
              disabled={isSubmitting || !feedback.trim()}
            >
              <Send className="h-3.5 w-3.5 mr-1.5" />
              Submit Changes
            </Button>
          )}

          <Button
            variant="primary"
            size="sm"
            onClick={() => handleSubmit('confirm')}
            disabled={isSubmitting}
          >
            {isSubmitting ? (
              <Loader2 className="h-3.5 w-3.5 mr-1.5 animate-spin" />
            ) : (
              <CheckCircle className="h-3.5 w-3.5 mr-1.5" />
            )}
            Approve
          </Button>
        </div>
      </div>
    );
  };

  // Render generic interaction type.
  // The description is intentionally not repeated here: for every type other
  // than `requirement_questions` it is already rendered in the bubble header
  // below, so rendering it again would show the same text twice.
  const renderGenericInteraction = () => {
    return (
      <div className="space-y-3">
        <div className="flex flex-wrap justify-end gap-2 pt-3">
          {interaction.options && Object.entries(interaction.options).map(([action, label]) => (
            <Button
              key={action}
              variant={action === 'confirm' || action === 'submit' ? 'primary' : 'secondary'}
              size="sm"
              onClick={() => handleSubmit(action)}
              disabled={isSubmitting}
            >
              {isSubmitting ? (
                <Loader2 className="h-3.5 w-3.5 mr-1.5 animate-spin" />
              ) : null}
              {label as string}
            </Button>
          ))}
        </div>
      </div>
    );
  };

  // Render based on interaction type
  const renderContent = () => {
    switch (interaction.type) {
      case 'requirement_questions':
        return renderQuestions();
      case 'plan_review':
        return renderPlanReview();
      default:
        return renderGenericInteraction();
    }
  };

  return (
    <motion.div
      initial={{ opacity: 0, y: 10 }}
      animate={{ opacity: 1, y: 0 }}
      className="flex items-start space-x-3"
    >
      {/* Bot Avatar */}
      <div className="flex-shrink-0 w-8 h-8 rounded-full bg-primary-100 flex items-center justify-center">
        <Bot className="h-4 w-4 text-primary-600" />
      </div>

      {/* Interaction Content */}
      <div className="flex-1 max-w-[90%]">
        <div className="bg-gradient-to-br from-primary-50 to-blue-50 border border-primary-200 rounded-2xl px-4 py-3 shadow-sm">
          {/* Title */}
          <div className="mb-3">
            <h4 className="font-semibold text-gray-900 text-sm">{interaction.title}</h4>
            {interaction.description && interaction.type !== 'requirement_questions' && (
              <p className="text-xs text-gray-600 mt-0.5">{interaction.description}</p>
            )}
          </div>

          {/* Content */}
          {renderContent()}
        </div>
      </div>
    </motion.div>
  );
}


================================================
FILE: new_ui/frontend/src/components/interaction/InteractionPanel.tsx
================================================
/**
 * InteractionPanel Component
 *
 * Displays User-in-Loop interactions from the workflow.
 * Supports different interaction types:
 * - requirement_questions: Show questions and collect answers
 * - plan_review: Show plan and allow confirm/modify/cancel
 */

import { useState, useCallback } from 'react';
import { motion, AnimatePresence } from 'framer-motion';
import {
  MessageCircle,
  Send,
  SkipForward,
  CheckCircle,
  XCircle,
  Edit,
  HelpCircle,
  Loader2
} from 'lucide-react';
import { Button, Card } from '../common';
import { useWorkflowStore, type PendingInteraction } from '../../stores/workflowStore';
import { workflowsApi } from '../../services/api';
import { toast } from '../common/Toaster';

/** Props accepted by the InteractionPanel component. */
interface InteractionPanelProps {
  /** Task identifier forwarded to `workflowsApi.respondToInteraction`. */
  taskId: string;
  /** The pending interaction to render; its `type` selects the layout. */
  interaction: PendingInteraction;
  /** Optional callback invoked after a submit or skip request succeeds. */
  onComplete?: () => void;
}

/**
 * Card-style panel for a pending User-in-Loop interaction.
 *
 * The body depends on `interaction.type`:
 * - `requirement_questions`: one textarea per question plus Skip / Submit
 * - `plan_review`: the plan text with Cancel / Modify / Approve actions
 * - anything else: one button per entry in `interaction.options`
 *
 * After a response (or skip) is accepted by the API, the interaction is
 * cleared from the workflow store and `onComplete` is invoked if provided.
 * On failure an error toast is shown and the panel stays on screen.
 */
export default function InteractionPanel({
  taskId,
  interaction,
  onComplete
}: InteractionPanelProps) {
  const [isSubmitting, setIsSubmitting] = useState(false);
  const [answers, setAnswers] = useState<Record<string, string>>({});
  const [feedback, setFeedback] = useState('');
  const [showModify, setShowModify] = useState(false);
  const { clearInteraction, addActivityLog } = useWorkflowStore();

  // Sends the chosen action (with optional payload) for this task.
  const handleSubmit = useCallback(async (action: string, data: Record<string, unknown> = {}) => {
    setIsSubmitting(true);
    try {
      await workflowsApi.respondToInteraction(taskId, action, data, false);
      addActivityLog(`✓ Submitted: ${action}`, 0, 'success');
      clearInteraction();
      onComplete?.();
    } catch (error) {
      console.error('Failed to submit response:', error);
      toast.error('Failed to submit', 'Please try again');
    } finally {
      setIsSubmitting(false);
    }
  }, [taskId, clearInteraction, addActivityLog, onComplete]);

  // Skips the interaction; the API is called with the "skip" action and the
  // final flag set to true (as opposed to false for regular submissions).
  const handleSkip = useCallback(async () => {
    setIsSubmitting(true);
    try {
      await workflowsApi.respondToInteraction(taskId, 'skip', {}, true);
      addActivityLog('⏭️ Skipped interaction', 0, 'info');
      clearInteraction();
      onComplete?.();
    } catch (error) {
      console.error('Failed to skip:', error);
      toast.error('Failed to skip', 'Please try again');
    } finally {
      setIsSubmitting(false);
    }
  }, [taskId, clearInteraction, addActivityLog, onComplete]);

  const renderQuestions = () => {
    // Optional chaining mirrors InlineChatInteraction: an interaction that
    // arrives without a data payload renders no questions instead of throwing.
    const questions = interaction.data?.questions || [];

    return (
      <div className="space-y-4">
        {questions.map((q, index) => {
          // Answers are keyed by the question id, falling back to a
          // positional key when the question carries no id.
          const answerKey = q.id || `q${index}`;

          return (
            <motion.div
              key={q.id || index}
              initial={{ opacity: 0, y: 10 }}
              animate={{ opacity: 1, y: 0 }}
              transition={{ delay: index * 0.1 }}
              className="bg-gray-50 rounded-lg p-4"
            >
              <div className="flex items-start space-x-3">
                <div className="flex-shrink-0 w-6 h-6 rounded-full bg-primary-100 flex items-center justify-center">
                  <span className="text-xs font-semibold text-primary-600">{index + 1}</span>
                </div>
                <div className="flex-1">
                  <p className="text-sm font-medium text-gray-900">{q.question}</p>
                  {q.hint && (
                    <p className="text-xs text-gray-500 mt-1 flex items-center">
                      <HelpCircle className="h-3 w-3 mr-1" />
                      {q.hint}
                    </p>
                  )}
                  <textarea
                    className="mt-2 w-full px-3 py-2 text-sm border border-gray-200 rounded-lg focus:ring-2 focus:ring-primary-500 focus:border-transparent resize-none"
                    rows={2}
                    placeholder="Your answer..."
                    value={answers[answerKey] || ''}
                    onChange={(e) => setAnswers(prev => ({
                      ...prev,
                      [answerKey]: e.target.value
                    }))}
                    disabled={isSubmitting}
                  />
                </div>
              </div>
            </motion.div>
          );
        })}

        <div className="flex justify-end space-x-3 pt-4 border-t border-gray-100">
          {!interaction.required && (
            <Button
              variant="secondary"
              onClick={handleSkip}
              disabled={isSubmitting}
            >
              <SkipForward className="h-4 w-4 mr-2" />
              Skip
            </Button>
          )}
          <Button
            variant="primary"
            onClick={() => handleSubmit('submit', { answers })}
            disabled={isSubmitting}
          >
            {isSubmitting ? (
              <Loader2 className="h-4 w-4 mr-2 animate-spin" />
            ) : (
              <Send className="h-4 w-4 mr-2" />
            )}
            Submit Answers
          </Button>
        </div>
      </div>
    );
  };

  const renderPlanReview = () => {
    // Guarded like renderQuestions so a missing data payload shows an empty plan.
    const plan = interaction.data?.plan || interaction.data?.plan_preview || '';

    return (
      <div className="space-y-4">
        <div className="bg-gray-900 rounded-lg p-4 max-h-80 overflow-y-auto">
          <pre className="text-xs text-gray-300 font-mono whitespace-pre-wrap">
            {plan}
          </pre>
        </div>

        <AnimatePresence>
          {showModify && (
            <motion.div
              initial={{ opacity: 0, height: 0 }}
              animate={{ opacity: 1, height: 'auto' }}
              exit={{ opacity: 0, height: 0 }}
            >
              <textarea
                className="w-full px-3 py-2 text-sm border border-gray-200 rounded-lg focus:ring-2 focus:ring-primary-500 focus:border-transparent resize-none"
                rows={3}
                placeholder="Describe the changes you'd like to make..."
                value={feedback}
                onChange={(e) => setFeedback(e.target.value)}
                disabled={isSubmitting}
              />
            </motion.div>
          )}
        </AnimatePresence>

        <div className="flex justify-end space-x-3 pt-4 border-t border-gray-100">
          <Button
            variant="danger"
            onClick={() => handleSubmit('cancel', { reason: 'User cancelled' })}
            disabled={isSubmitting}
          >
            <XCircle className="h-4 w-4 mr-2" />
            Cancel
          </Button>

          {!showModify ? (
            <Button
              variant="secondary"
              onClick={() => setShowModify(true)}
              disabled={isSubmitting}
            >
              <Edit className="h-4 w-4 mr-2" />
              Modify
            </Button>
          ) : (
            <Button
              variant="secondary"
              onClick={() => {
                // The button is disabled while the feedback is blank; the
                // warning is kept as a defensive fallback.
                if (feedback.trim()) {
                  handleSubmit('modify', { feedback });
                } else {
                  toast.warning('Please provide feedback', 'Describe what you want to change');
                }
              }}
              disabled={isSubmitting || !feedback.trim()}
            >
              <Send className="h-4 w-4 mr-2" />
              Submit Changes
            </Button>
          )}

          <Button
            variant="primary"
            onClick={() => handleSubmit('confirm')}
            disabled={isSubmitting}
          >
            {isSubmitting ? (
              <Loader2 className="h-4 w-4 mr-2 animate-spin" />
            ) : (
              <CheckCircle className="h-4 w-4 mr-2" />
            )}
            Approve & Continue
          </Button>
        </div>
      </div>
    );
  };

  // Generic fallback: one button per option.
  // The description is not repeated here because the card header below
  // already renders it for every interaction type.
  const renderGenericInteraction = () => {
    return (
      <div className="space-y-4">
        <div className="flex justify-end space-x-3 pt-4 border-t border-gray-100">
          {/* Guard against a missing options map: Object.entries(undefined) throws. */}
          {interaction.options && Object.entries(interaction.options).map(([action, label]) => (
            <Button
              key={action}
              variant={action === 'confirm' || action === 'submit' ? 'primary' : 'secondary'}
              onClick={() => handleSubmit(action)}
              disabled={isSubmitting}
            >
              {isSubmitting ? (
                <Loader2 className="h-4 w-4 mr-2 animate-spin" />
              ) : null}
              {label}
            </Button>
          ))}
        </div>
      </div>
    );
  };

  // Render based on interaction type
  const renderContent = () => {
    switch (interaction.type) {
      case 'requirement_questions':
        return renderQuestions();
      case 'plan_review':
        return renderPlanReview();
      default:
        return renderGenericInteraction();
    }
  };

  return (
    <motion.div
      initial={{ opacity: 0, scale: 0.95 }}
      animate={{ opacity: 1, scale: 1 }}
      exit={{ opacity: 0, scale: 0.95 }}
    >
      <Card className="border-2 border-primary-200 bg-primary-50/30">
        <div className="flex items-center space-x-3 mb-4">
          <div className="p-2 bg-primary-100 rounded-lg">
            <MessageCircle className="h-5 w-5 text-primary-600" />
          </div>
          <div>
            <h3 className="font-semibold text-gray-900">{interaction.title}</h3>
            <p className="text-sm text-gray-500">{interaction.description}</p>
          </div>
        </div>

        {renderContent()}
      </Card>
    </motion.div>
  );
}


================================================
FILE: new_ui/frontend/src/components/interaction/index.ts
================================================
// Barrel file: re-exports each interaction component's default export under a
// named export so consumers can import them from this directory.
export { default as InteractionPanel } from './InteractionPanel';
export { default as InlineChatInteraction } from './InlineChatInteraction';


================================================
FILE: new_ui/frontend/src/components/layout/Header.tsx
================================================
import { Link, useLocation, useNavigate } from 'react-router-dom';
import { Settings, Menu, Loader2 } from 'lucide-react';
import { useState } from 'react';
import { useWorkflowStore } from '../../stores/workflowStore';

/**
 * Sticky top bar with the logo, primary navigation, a running-task
 * indicator, a settings link, and a collapsible mobile navigation menu.
 *
 * The running-task indicator is shown while the workflow store reports the
 * `running` status; clicking it navigates to the page matching the current
 * workflow type (`chat-planning` or `paper-to-code`).
 */
export default function Header() {
  const location = useLocation();
  const navigate = useNavigate();
  const [isMobileMenuOpen, setIsMobileMenuOpen] = useState(false);

  const { status, workflowType, progress } = useWorkflowStore();
  const isRunning = status === 'running';

  const navItems = [
    { path: '/', label: 'Home' },
    { path: '/paper-to-code', label: 'Paper to Code' },
    { path: '/chat', label: 'Chat Planning' },
    { path: '/workflow', label: 'Workflow' },
  ];

  // Jump to the page that owns the running workflow. Unknown workflow types
  // are left as a no-op, matching the existing behaviour.
  const goToRunningTask = () => {
    if (workflowType === 'chat-planning') {
      navigate('/chat');
    } else if (workflowType === 'paper-to-code') {
      navigate('/paper-to-code');
    }
  };

  return (
    <header className="sticky top-0 z-50 border-b border-gray-200 bg-white/80 backdrop-blur-sm">
      <div className="mx-auto max-w-7xl px-4 sm:px-6 lg:px-8">
        <div className="flex h-16 items-center justify-between">
          {/* Logo */}
          <Link to="/" className="flex items-center space-x-2">
            <img
              src="https://github.com/Zongwei9888/Experiment_Images/raw/43c585dca3d21b8e4b6390d835cdd34dc4b4b23d/DeepCode_images/title_logo.svg"
              alt="DeepCode Logo"
              className="h-8 w-8"
            />
            <span className="text-xl font-semibold text-gray-900">
              DeepCode
            </span>
          </Link>

          {/* Desktop Navigation */}
          <nav className="hidden md:flex items-center space-x-1">
            {navItems.map((item) => {
              const isActive = location.pathname === item.path;

              return (
                <Link
                  key={item.path}
                  to={item.path}
                  // Expose the active route to assistive technology.
                  aria-current={isActive ? 'page' : undefined}
                  className={`px-4 py-2 rounded-lg text-sm font-medium transition-colors ${
                    isActive
                      ? 'bg-primary-50 text-primary-600'
                      : 'text-gray-600 hover:bg-gray-100 hover:text-gray-900'
                  }`}
                >
                  {item.label}
                </Link>
              );
            })}
          </nav>

          {/* Right Side */}
          <div className="flex items-center space-x-3">
            {/* Running Task Indicator */}
            {isRunning && (
              <button
                type="button"
                onClick={goToRunningTask}
                className="flex items-center space-x-2 px-3 py-1.5 bg-blue-50 border border-blue-200 rounded-full text-sm font-medium text-blue-700 hover:bg-blue-100 transition-colors"
              >
                <Loader2 className="h-4 w-4 animate-spin" />
                <span className="hidden sm:inline">Task Running</span>
                <span className="text-blue-500">{progress}%</span>
              </button>
            )}

            {/* Icon-only link: needs an explicit accessible name. */}
            <Link
              to="/settings"
              aria-label="Settings"
              className="p-2 rounded-lg text-gray-500 hover:bg-gray-100 hover:text-gray-700 transition-colors"
            >
              <Settings className="h-5 w-5" />
            </Link>

            {/* Mobile menu button */}
            <button
              type="button"
              aria-label={isMobileMenuOpen ? 'Close navigation menu' : 'Open navigation menu'}
              aria-expanded={isMobileMenuOpen}
              className="md:hidden p-2 rounded-lg text-gray-500 hover:bg-gray-100"
              // Functional update avoids toggling from a stale value.
              onClick={() => setIsMobileMenuOpen((open) => !open)}
            >
              <Menu className="h-5 w-5" />
            </button>
          </div>
        </div>

        {/* Mobile Navigation */}
        {isMobileMenuOpen && (
          <nav className="md:hidden py-4 border-t border-gray-100">
            {navItems.map((item) => {
              const isActive = location.pathname === item.path;

              return (
                <Link
                  key={item.path}
                  to={item.path}
                  aria-current={isActive ? 'page' : undefined}
                  className={`block px-4 py-2 rounded-lg text-sm font-medium ${
                    isActive
                      ? 'bg-primary-50 text-primary-600'
                      : 'text-gray-600 hover:bg-gray-100'
                  }`}
                  // Collapse the menu once a destination has been chosen.
                  onClick={() => setIsMobileMenuOpen(false)}
                >
                  {item.label}
                </Link>
              );
            })}
          </nav>
        )}
      </div>
    </header>
  );
}


================================================
FILE: new_ui/frontend/src/components/layout/Layout.tsx
================================================
import { ReactNode, useState } from 'react';
import Header from './Header';
import Sidebar from './Sidebar';
import { TaskRecoveryBanner } from '../common/TaskRecoveryBanner';
import { ConfirmDialog } from '../common/ConfirmDialog';
import { useTaskRecovery } from '../../hooks/useTaskRecovery';
import { useNavigationGuard } from '../../hooks/useNavigationGuard';

/** Props accepted by the Layout component. */
interface LayoutProps {
  /** Page content rendered inside the layout's `<main>` region. */
  children: ReactNode;
}

/**
 * Application shell: task-recovery banner (dismissible), the navigation
 * confirmation dialog, the header, the sidebar, and the page content.
 */
export default function Layout({ children }: LayoutProps) {
  const recovery = useTaskRecovery();
  const [bannerVisible, setBannerVisible] = useState(true);
  const navigationGuard = useNavigationGuard();

  // Hides the recovery banner for the lifetime of this Layout instance.
  const dismissBanner = () => setBannerVisible(false);

  return (
    <div className="min-h-screen bg-gray-50">
      {/* Task Recovery Banner */}
      {bannerVisible ? (
        <TaskRecoveryBanner
          isRecovering={recovery.isRecovering}
          recoveredTaskId={recovery.recoveredTaskId}
          onDismiss={dismissBanner}
        />
      ) : null}

      {/* Navigation Confirmation Dialog */}
      <ConfirmDialog
        isOpen={navigationGuard.showConfirmDialog}
        title="Task is still running"
        message="A task is currently running. If you leave this page, the task will continue in the background, but you may lose track of its progress. Are you sure you want to leave?"
        confirmLabel="Leave"
        cancelLabel="Stay"
        variant="warning"
        onConfirm={navigationGuard.confirmNavigation}
        onCancel={navigationGuard.cancelNavigation}
      />

      <Header />
      <div className="flex">
        <Sidebar />
        <main className="flex-1 p-6 lg:p-8">
          <div className="mx-auto max-w-7xl">{children}</div>
        </main>
      </div>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/layout/Sidebar.tsx
================================================
import { Link, useLocation } from 'react-router-dom';
import {
  FileText,
  MessageSquare,
  GitBranch,
  Clock,
  Folder,
} from 'lucide-react';
import { useSessionStore } from '../../stores/sessionStore';

/**
 * Desktop-only sidebar (hidden below the `lg` breakpoint) with quick-action
 * links, up to five recent projects from the session store, and a footer.
 */
export default function Sidebar() {
  const { pathname } = useLocation();
  const { recentProjects } = useSessionStore();

  const menuItems = [
    {
      path: '/paper-to-code',
      icon: FileText,
      label: 'Paper to Code',
      description: 'Convert research papers',
    },
    {
      path: '/chat',
      icon: MessageSquare,
      label: 'Chat Planning',
      description: 'Describe your project',
    },
    {
      path: '/workflow',
      icon: GitBranch,
      label: 'Workflow Editor',
      description: 'Visual workflow design',
    },
  ];

  // Only the five first entries of the recent-projects list are displayed.
  const visibleProjects = recentProjects.slice(0, 5);

  return (
    <aside className="hidden lg:flex flex-col w-64 min-h-[calc(100vh-4rem)] border-r border-gray-200 bg-white">
      <div className="flex-1 p-4">
        {/* Quick Actions */}
        <div className="mb-6">
          <h3 className="px-3 text-xs font-semibold text-gray-400 uppercase tracking-wider mb-2">
            Quick Actions
          </h3>
          <nav className="space-y-1">
            {menuItems.map(({ path, icon: Icon, label, description }) => {
              // A link is highlighted when its path matches the current route exactly.
              const isActive = pathname === path;
              const linkTone = isActive
                ? 'bg-primary-50 text-primary-700'
                : 'text-gray-600 hover:bg-gray-50 hover:text-gray-900';
              const iconTone = isActive ? 'text-primary-600' : 'text-gray-400';
              const descriptionTone = isActive ? 'text-primary-600/70' : 'text-gray-400';

              return (
                <Link
                  key={path}
                  to={path}
                  className={`flex items-start space-x-3 px-3 py-2.5 rounded-lg transition-colors ${linkTone}`}
                >
                  <Icon className={`h-5 w-5 mt-0.5 ${iconTone}`} />
                  <div>
                    <div className="font-medium text-sm">{label}</div>
                    <div className={`text-xs ${descriptionTone}`}>
                      {description}
                    </div>
                  </div>
                </Link>
              );
            })}
          </nav>
        </div>

        {/* Recent Projects */}
        {recentProjects.length > 0 ? (
          <div>
            <h3 className="px-3 text-xs font-semibold text-gray-400 uppercase tracking-wider mb-2 flex items-center">
              <Clock className="h-3 w-3 mr-1.5" />
              Recent
            </h3>
            <div className="space-y-1">
              {visibleProjects.map((project) => (
                <button
                  key={project.id}
                  className="w-full flex items-center space-x-3 px-3 py-2 rounded-lg text-left text-sm text-gray-600 hover:bg-gray-50 hover:text-gray-900 transition-colors"
                >
                  <Folder className="h-4 w-4 text-gray-400" />
                  <span className="truncate">{project.name}</span>
                </button>
              ))}
            </div>
          </div>
        ) : null}
      </div>

      {/* Footer */}
      <div className="p-4 border-t border-gray-100">
        <div className="flex items-center justify-center space-x-2 text-xs text-gray-400">
          <img
            src="https://github.com/Zongwei9888/Experiment_Images/raw/43c585dca3d21b8e4b6390d835cdd34dc4b4b23d/DeepCode_images/title_logo.svg"
            alt="DeepCode"
            className="h-4 w-4"
          />
          <span>DeepCode v1.0.0</span>
        </div>
      </div>
    </aside>
  );
}


================================================
FILE: new_ui/frontend/src/components/layout/index.ts
================================================
// Barrel file: re-exports each layout component's default export under a
// named export so consumers can import them from this directory.
export { default as Layout } from './Layout';
export { default as Header } from './Header';
export { default as Sidebar } from './Sidebar';


================================================
FILE: new_ui/frontend/src/components/results/CodePreview.tsx
================================================
import Editor from '@monaco-editor/react';
import { Code } from 'lucide-react';

/** Props accepted by the CodePreview component. */
interface CodePreviewProps {
  /** Source text shown in the editor; a falsy value shows a placeholder instead. */
  code: string;
  /** Shown in the header bar and used to pick the editor language by extension. */
  filename?: string;
  /** Fallback editor language when the extension is not recognised (defaults to 'python'). */
  language?: string;
}

/**
 * Editor language ids keyed by lower-case file extension.
 * Includes the shell entries so the preview highlights the same file types
 * as the streaming code viewer.
 */
const PREVIEW_LANGUAGE_BY_EXTENSION: Record<string, string> = {
  py: 'python',
  js: 'javascript',
  ts: 'typescript',
  tsx: 'typescript',
  jsx: 'javascript',
  md: 'markdown',
  json: 'json',
  yaml: 'yaml',
  yml: 'yaml',
  html: 'html',
  css: 'css',
  sh: 'shell',
  bash: 'shell',
};

/**
 * Read-only preview of a single file.
 *
 * Renders a header with the file name (or "Preview") and, when `code` is
 * non-empty, a read-only editor whose language is derived from the file
 * extension. With empty `code` a "Select a file to preview" placeholder is
 * shown instead.
 *
 * @param code     Text to display.
 * @param filename Optional file name used for the header and language detection.
 * @param language Fallback language when the extension is unknown (default 'python').
 */
export default function CodePreview({
  code,
  filename,
  language = 'python',
}: CodePreviewProps) {
  const detectLanguage = (fname?: string): string => {
    if (!fname) return language;
    const ext = fname.split('.').pop()?.toLowerCase() ?? '';
    // Own-property check: a plain index lookup would also resolve inherited
    // keys such as "constructor" and hand a non-string to the editor.
    return Object.prototype.hasOwnProperty.call(PREVIEW_LANGUAGE_BY_EXTENSION, ext)
      ? PREVIEW_LANGUAGE_BY_EXTENSION[ext]
      : language;
  };

  return (
    <div className="rounded-lg border border-gray-200 bg-white overflow-hidden">
      <div className="flex items-center space-x-2 px-4 py-2 bg-gray-50 border-b border-gray-200">
        <Code className="h-4 w-4 text-gray-500" />
        <span className="text-sm font-medium text-gray-700">
          {filename || 'Preview'}
        </span>
      </div>
      {code ? (
        <Editor
          height="300px"
          language={detectLanguage(filename)}
          value={code}
          theme="vs-light"
          options={{
            readOnly: true,
            minimap: { enabled: false },
            scrollBeyondLastLine: false,
            fontSize: 13,
            fontFamily: "'JetBrains Mono', monospace",
            padding: { top: 16, bottom: 16 },
          }}
        />
      ) : (
        <div className="h-[300px] flex items-center justify-center text-gray-400">
          Select a file to preview
        </div>
      )}
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/results/FileTree.tsx
================================================
import { useState } from 'react';
import { ChevronRight, ChevronDown, File, Folder, FolderOpen } from 'lucide-react';
import { motion, AnimatePresence } from 'framer-motion';

/** One entry of the rendered tree: either a file (leaf) or a folder with children. */
interface FileNode {
  /** Single path segment (no slashes). */
  name: string;
  /** Whether the entry is a leaf file or a folder. */
  type: 'file' | 'folder';
  /** Child entries; left undefined for files. */
  children?: FileNode[];
}

/** Props accepted by the FileTree component. */
interface FileTreeProps {
  /** Flat list of '/'-separated file paths to display. */
  files: string[];
  /** Called with the clicked file's path (segments joined with '/'). */
  onFileSelect?: (path: string) => void;
  /** Path of the currently selected file; the matching row is highlighted. */
  selectedFile?: string;
}

/**
 * Displays a flat list of '/'-separated file paths as a collapsible tree.
 *
 * The header shows the number of paths received; the body renders one
 * TreeNode per top-level entry, or a "No files generated yet" placeholder
 * when the tree is empty.
 *
 * @param files        Flat list of file paths.
 * @param onFileSelect Forwarded to every node; called with the clicked file path.
 * @param selectedFile Forwarded to every node so the selected row can be highlighted.
 */
export default function FileTree({ files, onFileSelect, selectedFile }: FileTreeProps) {
  // Intermediate shape used while building: children are kept in a Map so
  // that segment names can never collide with Object.prototype members
  // ("constructor", "__proto__", ...) the way plain-object keys can.
  type DraftNode = {
    name: string;
    isFolder: boolean;
    children: Map<string, DraftNode>;
  };

  // Convert flat file list to tree structure
  const buildTree = (paths: string[]): FileNode[] => {
    const root = new Map<string, DraftNode>();

    paths.forEach((path) => {
      // Empty segments (leading, trailing or doubled slashes) are ignored.
      const parts = path.split('/').filter(Boolean);
      let level = root;

      parts.forEach((part, index) => {
        const isLast = index === parts.length - 1;
        let draft = level.get(part);

        if (!draft) {
          draft = { name: part, isFolder: !isLast, children: new Map() };
          level.set(part, draft);
        } else if (!isLast) {
          // The same name was seen earlier as a file but is also a directory
          // prefix (e.g. "a" and "a/b"): treat it as a folder instead of
          // descending into missing children.
          draft.isFolder = true;
        }

        level = draft.children;
      });
    });

    // Entries keep first-seen order at every level.
    const toNodes = (level: Map<string, DraftNode>): FileNode[] =>
      Array.from(level.values(), (draft): FileNode => ({
        name: draft.name,
        type: draft.isFolder ? 'folder' : 'file',
        children: draft.isFolder ? toNodes(draft.children) : undefined,
      }));

    return toNodes(root);
  };

  const tree = buildTree(files);

  return (
    <div className="rounded-lg border border-gray-200 bg-white overflow-hidden">
      <div className="px-4 py-2 bg-gray-50 border-b border-gray-200">
        <span className="text-sm font-medium text-gray-700">Generated Files</span>
        <span className="text-xs text-gray-400 ml-2">({files.length})</span>
      </div>
      <div className="p-2 max-h-[400px] overflow-y-auto">
        {tree.length === 0 ? (
          <div className="py-8 text-center text-gray-400 text-sm">
            No files generated yet
          </div>
        ) : (
          tree.map((node) => (
            <TreeNode
              key={node.name}
              node={node}
              path=""
              onFileSelect={onFileSelect}
              selectedFile={selectedFile}
            />
          ))
        )}
      </div>
    </div>
  );
}

/** Props accepted by the recursive TreeNode component. */
interface TreeNodeProps {
  /** The file or folder to render. */
  node: FileNode;
  /** Path of the parent folder ('' at the top level); joined with the node name using '/'. */
  path: string;
  /** Nesting level, used for left padding and for the initial expanded state (defaults to 0). */
  depth?: number;
  /** Called with the full path when a file row is clicked. */
  onFileSelect?: (path: string) => void;
  /** Full path of the selected file; the row whose path equals it is highlighted. */
  selectedFile?: string;
}

/**
 * Renders one row of the file tree and, for an expanded folder, its children.
 *
 * Clicking a folder toggles its expansion; clicking a file calls
 * `onFileSelect` with the node's full path (parent path + '/' + name).
 * Folders at depth 0 and 1 start expanded, deeper ones start collapsed.
 */
function TreeNode({
  node,
  path,
  depth = 0,
  onFileSelect,
  selectedFile,
}: TreeNodeProps) {
  const [isOpen, setIsOpen] = useState(depth < 2);
  const fullPath = path ? `${path}/${node.name}` : node.name;
  const isSelected = selectedFile === fullPath;
  const isFolder = node.type === 'folder';

  const handleClick = () => {
    if (isFolder) {
      // Functional update so rapid clicks always toggle from the latest state.
      setIsOpen((open) => !open);
    } else {
      onFileSelect?.(fullPath);
    }
  };

  // Returns the text-colour class for a file icon based on its extension.
  const getFileIcon = (filename: string) => {
    const ext = filename.split('.').pop()?.toLowerCase() ?? '';
    const colors: Record<string, string> = {
      py: 'text-yellow-500',
      js: 'text-yellow-400',
      ts: 'text-blue-500',
      tsx: 'text-blue-400',
      json: 'text-green-500',
      md: 'text-gray-500',
      yaml: 'text-purple-500',
      yml: 'text-purple-500',
    };
    // Own-property check: a bare index lookup would resolve inherited keys
    // (e.g. a file literally named "constructor") to non-string values.
    return Object.prototype.hasOwnProperty.call(colors, ext)
      ? colors[ext]
      : 'text-gray-400';
  };

  return (
    <div>
      <button
        // Explicit type so the row never acts as a submit button inside a form.
        type="button"
        onClick={handleClick}
        aria-expanded={isFolder ? isOpen : undefined}
        className={`w-full flex items-center space-x-1.5 px-2 py-1.5 rounded text-sm hover:bg-gray-100 transition-colors ${
          isSelected ? 'bg-primary-50 text-primary-700' : 'text-gray-700'
        }`}
        style={{ paddingLeft: `${depth * 16 + 8}px` }}
      >
        {isFolder ? (
          <>
            {isOpen ? (
              <ChevronDown className="h-4 w-4 text-gray-400 flex-shrink-0" />
            ) : (
              <ChevronRight className="h-4 w-4 text-gray-400 flex-shrink-0" />
            )}
            {isOpen ? (
              <FolderOpen className="h-4 w-4 text-yellow-500 flex-shrink-0" />
            ) : (
              <Folder className="h-4 w-4 text-yellow-500 flex-shrink-0" />
            )}
          </>
        ) : (
          <>
            {/* Spacer that keeps file icons aligned with folder icons (which have a chevron). */}
            <span className="w-4" />
            <File className={`h-4 w-4 flex-shrink-0 ${getFileIcon(node.name)}`} />
          </>
        )}
        <span className="truncate">{node.name}</span>
      </button>

      <AnimatePresence>
        {isFolder && isOpen && node.children && (
          <motion.div
            initial={{ opacity: 0, height: 0 }}
            animate={{ opacity: 1, height: 'auto' }}
            exit={{ opacity: 0, height: 0 }}
          >
            {node.children.map((child) => (
              <TreeNode
                key={child.name}
                node={child}
                path={fullPath}
                depth={depth + 1}
                onFileSelect={onFileSelect}
                selectedFile={selectedFile}
              />
            ))}
          </motion.div>
        )}
      </AnimatePresence>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/results/index.ts
================================================
export { default as CodePreview } from './CodePreview';
export { default as FileTree } from './FileTree';


================================================
FILE: new_ui/frontend/src/components/streaming/ActivityLogViewer.tsx
================================================
/**
 * Activity Log Viewer
 *
 * Displays real-time activity logs from the backend workflow.
 * Shows progress messages, timestamps, and status icons.
 */

import { useEffect, useRef } from 'react';
import { motion, AnimatePresence } from 'framer-motion';
import {
  Terminal,
  CheckCircle,
  Clock,
  Loader2,
  AlertCircle,
  Rocket,
  Brain,
  Code,
  FolderOpen,
  FileText,
  Zap
} from 'lucide-react';

/** One row of the activity log. */
interface LogEntry {
  /** Unique identifier; used as the React key of the rendered row. */
  id: string;
  /** When the entry was recorded; rendered as a 24-hour HH:MM:SS time. */
  timestamp: Date;
  /** Text shown in the row; also scanned for keywords/emoji to choose the row icon. */
  message: string;
  /** Progress value rendered with a trailing '%'. */
  progress: number;
  /** Entry category. */
  type: 'info' | 'success' | 'warning' | 'error' | 'progress';
}

/** Props accepted by the ActivityLogViewer component. */
interface ActivityLogViewerProps {
  /** Entries to display, rendered in array order. */
  logs: LogEntry[];
  /** Whether a workflow is in progress; drives the "Live" badge, footer status and live indicator. */
  isRunning: boolean;
  /** Message for the live indicator row, shown only while `isRunning` is true. */
  currentMessage?: string;
}

// Map message content to appropriate icon
/**
 * Picks the status icon for a log message.
 *
 * The message is lower-cased and tested against keyword/emoji groups in a
 * fixed order; the first group with a match decides the icon. A message
 * matching no group gets the neutral clock icon.
 */
function getIconForMessage(message: string): React.ReactNode {
  const text = message.toLowerCase();
  // True when the lower-cased message contains at least one of the needles.
  const mentions = (...needles: string[]): boolean =>
    needles.some((needle) => text.includes(needle));

  // Order matters: earlier groups win when several keywords are present.
  if (mentions('complete', 'success', '✅')) {
    return <CheckCircle className="h-4 w-4 text-green-500" />;
  }
  if (mentions('error', 'failed', '❌')) {
    return <AlertCircle className="h-4 w-4 text-red-500" />;
  }
  if (mentions('initializ', '🚀', 'starting')) {
    return <Rocket className="h-4 w-4 text-blue-500" />;
  }
  if (mentions('analyz', '🧠', 'brain', 'intelligence')) {
    return <Brain className="h-4 w-4 text-purple-500" />;
  }
  if (mentions('code', 'implement', '🔬', 'synthesi')) {
    return <Code className="h-4 w-4 text-orange-500" />;
  }
  if (mentions('workspace', 'directory', '📁', '🏗️')) {
    return <FolderOpen className="h-4 w-4 text-yellow-600" />;
  }
  if (mentions('plan', '📝', 'document', '📄')) {
    return <FileText className="h-4 w-4 text-cyan-500" />;
  }
  if (mentions('process', '⚡', 'running')) {
    return <Zap className="h-4 w-4 text-amber-500" />;
  }

  return <Clock className="h-4 w-4 text-gray-400" />;
}

/**
 * Formats a date as a zero-padded 24-hour `HH:MM:SS` string in local time.
 *
 * @param date The instant to format.
 * @returns The formatted time, e.g. `00:05:09`.
 */
function formatTime(date: Date): string {
  return date.toLocaleTimeString('en-US', {
    hour: '2-digit',
    minute: '2-digit',
    second: '2-digit',
    // 'h23' pins the clock to 00-23. With `hour12: false` the en-US locale
    // can resolve to the 1-24 cycle and print midnight as "24:xx:xx".
    hourCycle: 'h23'
  });
}

/**
 * Terminal-styled panel listing workflow activity entries.
 *
 * Layout: a header (title, "Live" badge while running, entry count), a
 * scrollable list of entries with time, icon, message and progress, an
 * optional live indicator row for `currentMessage`, and a footer showing
 * Connected / Completed / Idle plus the time of the last entry.
 *
 * @param logs           Entries to render, in array order.
 * @param isRunning      Whether a workflow is currently in progress.
 * @param currentMessage Text for the live indicator row (only shown while running).
 */
export default function ActivityLogViewer({
  logs,
  isRunning,
  currentMessage,
}: ActivityLogViewerProps) {
  const scrollRef = useRef<HTMLDivElement>(null);

  // Keep the newest content in view: scroll to the bottom when entries
  // arrive and when the live indicator row appears or changes.
  useEffect(() => {
    if (scrollRef.current) {
      scrollRef.current.scrollTop = scrollRef.current.scrollHeight;
    }
  }, [logs, isRunning, currentMessage]);

  return (
    <div className="rounded-xl border border-gray-200 bg-gray-900 overflow-hidden">
      {/* Header */}
      <div className="flex items-center justify-between px-4 py-2 bg-gray-800 border-b border-gray-700">
        <div className="flex items-center space-x-2">
          <Terminal className="h-4 w-4 text-green-400" />
          <span className="text-sm font-medium text-gray-200">
            Activity Log
          </span>
          {isRunning && (
            <motion.span
              initial={{ opacity: 0 }}
              animate={{ opacity: 1 }}
              className="flex items-center text-xs text-green-400"
            >
              <Loader2 className="h-3 w-3 mr-1 animate-spin" />
              Live
            </motion.span>
          )}
        </div>

        <div className="text-xs text-gray-500">
          {logs.length} events
        </div>
      </div>

      {/* Log Content */}
      <div
        ref={scrollRef}
        className="h-[350px] overflow-y-auto p-4 font-mono text-sm"
      >
        {logs.length === 0 && !isRunning ? (
          <div className="h-full flex items-center justify-center text-gray-500">
            <div className="text-center">
              <Terminal className="h-12 w-12 mx-auto mb-3 opacity-50" />
              <p className="text-sm">Activity logs will appear here</p>
              <p className="text-xs text-gray-600 mt-1">Start a workflow to see real-time progress</p>
            </div>
          </div>
        ) : (
          <AnimatePresence mode="popLayout">
            {logs.map((log) => (
              <motion.div
                key={log.id}
                initial={{ opacity: 0, x: -20 }}
                animate={{ opacity: 1, x: 0 }}
                transition={{ duration: 0.2 }}
                className="flex items-start space-x-3 py-2 border-b border-gray-800 last:border-0"
              >
                {/* Timestamp */}
                <span className="text-gray-500 text-xs whitespace-nowrap pt-0.5">
                  {formatTime(log.timestamp)}
                </span>

                {/* Icon */}
                <span className="flex-shrink-0 pt-0.5">
                  {getIconForMessage(log.message)}
                </span>

                {/* Message */}
                <span className="text-gray-300 flex-1 break-words">
                  {log.message}
                </span>

                {/* Progress Badge */}
                <span className="text-xs text-gray-500 whitespace-nowrap pt-0.5">
                  {log.progress}%
                </span>
              </motion.div>
            ))}

            {/* Current Activity Indicator */}
            {isRunning && currentMessage && (
              <motion.div
                // AnimatePresence tracks its direct children by key, so the
                // indicator needs a stable one alongside the keyed log rows.
                key="current-activity"
                initial={{ opacity: 0 }}
                animate={{ opacity: 1 }}
                className="flex items-start space-x-3 py-2 bg-gray-800/50 rounded-lg mt-2 px-2"
              >
                {/* Shows the time of the current render, not of the message itself. */}
                <span className="text-green-400 text-xs whitespace-nowrap pt-0.5">
                  {formatTime(new Date())}
                </span>
                <Loader2 className="h-4 w-4 text-green-400 animate-spin flex-shrink-0" />
                <span className="text-green-400 flex-1">
                  {currentMessage}
                </span>
              </motion.div>
            )}
          </AnimatePresence>
        )}
      </div>

      {/* Footer Status Bar */}
      <div className="flex items-center justify-between px-4 py-2 bg-gray-800 border-t border-gray-700 text-xs text-gray-500">
        <span>
          {isRunning ? (
            <span className="text-green-400">● Connected</span>
          ) : logs.length > 0 ? (
            <span className="text-gray-400">● Completed</span>
          ) : (
            <span className="text-gray-500">○ Idle</span>
          )}
        </span>
        {logs.length > 0 && (
          <span>
            Last update: {formatTime(logs[logs.length - 1]?.timestamp || new Date())}
          </span>
        )}
      </div>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/streaming/CodeStreamViewer.tsx
================================================
import { useEffect, useRef } from 'react';
import Editor from '@monaco-editor/react';
import { motion } from 'framer-motion';
import { Code, Copy, Check, Loader2 } from 'lucide-react';
import { useState } from 'react';

/** Props accepted by the CodeStreamViewer component. */
interface CodeStreamViewerProps {
  /** Code text shown in the editor and copied by the Copy button. */
  code: string;
  /** Name of the file being shown, or null; used for the header and language detection. */
  currentFile: string | null;
  /** Whether code is still arriving; enables the live badges and auto-scroll to the last line. */
  isStreaming: boolean;
  /** Editor language used when there is no file name or its extension is not recognised. */
  language?: string;
}

/**
 * Read-only editor that follows code as it is streamed in.
 *
 * While `isStreaming` is true the editor reveals its last line on every
 * `code` change and "Generating..." / "Live" badges are shown. The header
 * offers a Copy button that writes `code` to the clipboard and shows
 * "Copied!" for two seconds. With no code and no stream, a placeholder is
 * rendered instead of the editor.
 *
 * @param code        Current code text.
 * @param currentFile File name for the header and language detection, or null.
 * @param isStreaming Whether code is still being received.
 * @param language    Fallback editor language (default 'python').
 */
export default function CodeStreamViewer({
  code,
  currentFile,
  isStreaming,
  language = 'python',
}: CodeStreamViewerProps) {
  const [copied, setCopied] = useState(false);
  const editorRef = useRef<any>(null);
  // Handle of the pending "Copied!" reset, so it can be cancelled.
  const copiedTimerRef = useRef<ReturnType<typeof setTimeout> | null>(null);

  // Auto-scroll to bottom when code updates
  useEffect(() => {
    if (editorRef.current && isStreaming) {
      const editor = editorRef.current;
      const model = editor.getModel();
      if (model) {
        const lineCount = model.getLineCount();
        editor.revealLine(lineCount);
      }
    }
  }, [code, isStreaming]);

  // Cancel a pending reset when the component unmounts.
  useEffect(() => {
    return () => {
      if (copiedTimerRef.current !== null) {
        clearTimeout(copiedTimerRef.current);
      }
    };
  }, []);

  const handleCopy = async () => {
    try {
      await navigator.clipboard.writeText(code);
    } catch (error) {
      // The clipboard can be unavailable or denied; report the failure
      // instead of leaving an unhandled rejection.
      console.error('Failed to copy code to clipboard:', error);
      return;
    }
    setCopied(true);
    // Restart the two-second window if the button is clicked again.
    if (copiedTimerRef.current !== null) {
      clearTimeout(copiedTimerRef.current);
    }
    copiedTimerRef.current = setTimeout(() => setCopied(false), 2000);
  };

  const detectLanguage = (filename: string | null): string => {
    if (!filename) return language;
    const ext = filename.split('.').pop()?.toLowerCase() ?? '';
    const langMap: Record<string, string> = {
      py: 'python',
      js: 'javascript',
      ts: 'typescript',
      tsx: 'typescript',
      jsx: 'javascript',
      md: 'markdown',
      json: 'json',
      yaml: 'yaml',
      yml: 'yaml',
      html: 'html',
      css: 'css',
      sh: 'shell',
      bash: 'shell',
    };
    // Own-property check so inherited keys (e.g. "constructor") fall back
    // to the default language instead of yielding a non-string value.
    return Object.prototype.hasOwnProperty.call(langMap, ext)
      ? langMap[ext]
      : language;
  };

  return (
    <div className="rounded-xl border border-gray-200 bg-white overflow-hidden">
      {/* Header */}
      <div className="flex items-center justify-between px-4 py-2 bg-gray-50 border-b border-gray-200">
        <div className="flex items-center space-x-2">
          <Code className="h-4 w-4 text-gray-500" />
          <span className="text-sm font-medium text-gray-700">
            {currentFile || 'Generated Code'}
          </span>
          {isStreaming && (
            <motion.span
              initial={{ opacity: 0 }}
              animate={{ opacity: 1 }}
              className="flex items-center text-xs text-primary-600"
            >
              <Loader2 className="h-3 w-3 mr-1 animate-spin" />
              Generating...
            </motion.span>
          )}
        </div>

        <button
          onClick={handleCopy}
          disabled={!code}
          className="flex items-center space-x-1 px-2 py-1 text-xs text-gray-500 hover:text-gray-700 hover:bg-gray-100 rounded transition-colors disabled:opacity-50"
        >
          {copied ? (
            <>
              <Check className="h-3 w-3 text-green-500" />
              <span>Copied!</span>
            </>
          ) : (
            <>
              <Copy className="h-3 w-3" />
              <span>Copy</span>
            </>
          )}
        </button>
      </div>

      {/* Editor */}
      <div className="relative">
        {!code && !isStreaming ? (
          <div className="h-[400px] flex items-center justify-center text-gray-400">
            <div className="text-center">
              <Code className="h-12 w-12 mx-auto mb-3 opacity-50" />
              <p className="text-sm">Code will appear here</p>
            </div>
          </div>
        ) : (
          <Editor
            height="400px"
            language={detectLanguage(currentFile)}
            value={code}
            theme="vs-light"
            onMount={(editor) => {
              editorRef.current = editor;
            }}
            options={{
              readOnly: true,
              minimap: { enabled: false },
              scrollBeyondLastLine: false,
              fontSize: 13,
              fontFamily: "'JetBrains Mono', Menlo, Monaco, monospace",
              lineNumbers: 'on',
              renderLineHighlight: 'none',
              scrollbar: {
                vertical: 'auto',
                horizontal: 'auto',
              },
              padding: { top: 16, bottom: 16 },
            }}
          />
        )}

        {/* Streaming indicator overlay */}
        {isStreaming && (
          <div className="absolute bottom-4 right-4">
            <motion.div
              initial={{ opacity: 0, scale: 0.9 }}
              animate={{ opacity: 1, scale: 1 }}
              className="flex items-center space-x-2 px-3 py-1.5 bg-primary-50 border border-primary-200 rounded-full"
            >
              <span className="relative flex h-2 w-2">
                <span className="animate-ping absolute inline-flex h-full w-full rounded-full bg-primary-400 opacity-75"></span>
                <span className="relative inline-flex rounded-full h-2 w-2 bg-primary-500"></span>
              </span>
              <span className="text-xs font-medium text-primary-700">
                Live
              </span>
            </motion.div>
          </div>
        )}
      </div>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/streaming/LogViewer.tsx
================================================
import { useEffect, useRef, useState } from 'react';
import { motion, AnimatePresence } from 'framer-motion';
import { Terminal, Trash2, Filter } from 'lucide-react';

/** One log record shown by LogViewer. */
interface LogEntry {
  /** Unique identifier; used as the React key of the rendered row. */
  id: string;
  /** Severity; selects the badge colours and is the value the level filter compares against. */
  level: 'INFO' | 'WARNING' | 'ERROR' | 'DEBUG';
  /** Log text. */
  message: string;
  /** Origin of the record; rendered in square brackets when non-empty. */
  namespace: string;
  /** Timestamp string; parsed with `new Date(...)` for display. */
  timestamp: string;
}

/** Props accepted by the LogViewer component. */
interface LogViewerProps {
  /** Records to display, in array order. */
  logs: LogEntry[];
  /** Maximum height of the scrollable list, applied as an inline style (defaults to 400). */
  maxHeight?: number;
  /** When provided, a "Clear logs" button is shown that calls it. */
  onClear?: () => void;
}

// CSS utility classes (text + background colour) for the level badge, keyed by log level.
const levelColors = {
  INFO: 'text-blue-600 bg-blue-50',
  WARNING: 'text-yellow-600 bg-yellow-50',
  ERROR: 'text-red-600 bg-red-50',
  DEBUG: 'text-gray-600 bg-gray-50',
};

/**
 * Scrollable, filterable list of log records.
 *
 * The header shows the number of visible records, a level filter and an
 * optional clear button. The list sticks to the bottom as new records
 * arrive until the user scrolls away from the bottom; scrolling back to the
 * bottom re-enables following.
 *
 * @param logs      Records to display.
 * @param maxHeight Maximum height of the list (default 400).
 * @param onClear   Optional handler for the clear button.
 */
export default function LogViewer({
  logs,
  maxHeight = 400,
  onClear,
}: LogViewerProps) {
  const containerRef = useRef<HTMLDivElement>(null);
  const [filter, setFilter] = useState<string | null>(null);
  const [autoScroll, setAutoScroll] = useState(true);

  // Auto-scroll to bottom when new logs arrive
  useEffect(() => {
    if (autoScroll && containerRef.current) {
      containerRef.current.scrollTop = containerRef.current.scrollHeight;
    }
  }, [logs, autoScroll]);

  const filteredLogs = filter
    ? logs.filter((log) => log.level === filter)
    : logs;

  // Formats a timestamp string as 24-hour HH:MM:SS; falls back to the last
  // eight characters of the raw string when it cannot be parsed.
  const formatTime = (timestamp: string) => {
    const date = new Date(timestamp);
    // Parsing never throws: an unparseable string produces an invalid Date
    // (NaN time value), which has to be detected explicitly.
    if (Number.isNaN(date.getTime())) {
      return timestamp.slice(-8);
    }
    return date.toLocaleTimeString('en-US', {
      // 'h23' keeps midnight at "00"; `hour12: false` can render it as "24".
      hourCycle: 'h23',
      hour: '2-digit',
      minute: '2-digit',
      second: '2-digit',
    });
  };

  return (
    <div className="rounded-lg border border-gray-200 bg-white overflow-hidden">
      {/* Header */}
      <div className="flex items-center justify-between px-4 py-2 bg-gray-50 border-b border-gray-200">
        <div className="flex items-center space-x-2">
          <Terminal className="h-4 w-4 text-gray-500" />
          <span className="text-sm font-medium text-gray-700">Logs</span>
          <span className="text-xs text-gray-400">({filteredLogs.length})</span>
        </div>

        <div className="flex items-center space-x-2">
          {/* Filter dropdown */}
          <div className="relative">
            <select
              value={filter || ''}
              onChange={(e) => setFilter(e.target.value || null)}
              className="text-xs pl-6 pr-2 py-1 border border-gray-200 rounded bg-white focus:outline-none focus:ring-1 focus:ring-primary-500"
            >
              <option value="">All levels</option>
              <option value="INFO">INFO</option>
              <option value="WARNING">WARNING</option>
              <option value="ERROR">ERROR</option>
              <option value="DEBUG">DEBUG</option>
            </select>
            <Filter className="absolute left-2 top-1/2 -translate-y-1/2 h-3 w-3 text-gray-400" />
          </div>

          {/* Clear button */}
          {onClear && (
            <button
              onClick={onClear}
              className="p-1 text-gray-400 hover:text-gray-600 transition-colors"
              title="Clear logs"
            >
              <Trash2 className="h-4 w-4" />
            </button>
          )}
        </div>
      </div>

      {/* Log content */}
      <div
        ref={containerRef}
        className="overflow-y-auto font-mono text-xs"
        style={{ maxHeight }}
        onScroll={(e) => {
          const el = e.currentTarget;
          // scrollTop may be fractional (zoom, high-DPI), so compare with a
          // one-pixel tolerance instead of strict equality.
          const isAtBottom =
            Math.abs(el.scrollHeight - el.scrollTop - el.clientHeight) <= 1;
          setAutoScroll(isAtBottom);
        }}
      >
        {filteredLogs.length === 0 ? (
          <div className="p-8 text-center text-gray-400">
            No logs to display
          </div>
        ) : (
          <div className="p-2 space-y-1">
            <AnimatePresence initial={false}>
              {filteredLogs.map((log) => (
                <motion.div
                  key={log.id}
                  initial={{ opacity: 0, height: 0 }}
                  animate={{ opacity: 1, height: 'auto' }}
                  exit={{ opacity: 0, height: 0 }}
                  className="flex items-start space-x-2 py-1 px-2 rounded hover:bg-gray-50"
                >
                  <span className="text-gray-400 flex-shrink-0">
                    {formatTime(log.timestamp)}
                  </span>
                  <span
                    className={`px-1.5 py-0.5 rounded text-xs font-medium flex-shrink-0 ${
                      levelColors[log.level]
                    }`}
                  >
                    {log.level}
                  </span>
                  {log.namespace && (
                    <span className="text-primary-600 flex-shrink-0">
                      [{log.namespace}]
                    </span>
                  )}
                  <span className="text-gray-700 break-all">{log.message}</span>
                </motion.div>
              ))}
            </AnimatePresence>
          </div>
        )}
      </div>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/streaming/ProgressTracker.tsx
================================================
import { motion } from 'framer-motion';
import { CheckCircle, Circle, Loader2, XCircle } from 'lucide-react';
import type { WorkflowStep } from '../../types/workflow';

/** Props accepted by the ProgressTracker component. */
interface ProgressTrackerProps {
  /** Workflow steps to list, in display order. */
  steps: WorkflowStep[];
  /** Overall progress; shown as text with a trailing '%' and used as the bar width percentage. */
  currentProgress: number;
}

/**
 * Shows overall workflow progress as an animated bar followed by one card
 * per step. Each card's icon, background and title colour reflect the
 * step's status ('completed', 'active', 'error', or anything else as
 * pending); completed steps additionally show a "Done" label.
 */
export default function ProgressTracker({
  steps,
  currentProgress,
}: ProgressTrackerProps) {
  // Icon shown at the left of a step card.
  const getStepIcon = (status: WorkflowStep['status']) => {
    if (status === 'completed') {
      return <CheckCircle className="h-5 w-5 text-green-500" />;
    }
    if (status === 'active') {
      return <Loader2 className="h-5 w-5 text-primary-500 animate-spin" />;
    }
    if (status === 'error') {
      return <XCircle className="h-5 w-5 text-red-500" />;
    }
    return <Circle className="h-5 w-5 text-gray-300" />;
  };

  // Background/border classes of a step card.
  const cardTone = (status: WorkflowStep['status']): string => {
    if (status === 'active') return 'bg-primary-50 border border-primary-200';
    if (status === 'completed') return 'bg-green-50 border border-green-100';
    if (status === 'error') return 'bg-red-50 border border-red-100';
    return 'bg-gray-50';
  };

  // Text colour of a step title.
  const titleTone = (status: WorkflowStep['status']): string => {
    if (status === 'active') return 'text-primary-700';
    if (status === 'completed') return 'text-green-700';
    if (status === 'error') return 'text-red-700';
    return 'text-gray-500';
  };

  const barWidth = `${currentProgress}%`;

  return (
    <div className="w-full">
      {/* Progress bar */}
      <div className="mb-6">
        <div className="flex justify-between text-sm mb-2">
          <span className="font-medium text-gray-700">Progress</span>
          <span className="text-gray-500">{currentProgress}%</span>
        </div>
        <div className="h-2 bg-gray-100 rounded-full overflow-hidden">
          <motion.div
            className="h-full bg-primary-500 rounded-full"
            initial={{ width: 0 }}
            animate={{ width: barWidth }}
            transition={{ duration: 0.5, ease: 'easeOut' }}
          />
        </div>
      </div>

      {/* Steps */}
      <div className="space-y-3">
        {steps.map((step, position) => {
          const cardClasses = [
            'flex items-center space-x-3 p-3 rounded-lg transition-colors',
            cardTone(step.status),
          ].join(' ');
          const titleClasses = ['text-sm font-medium', titleTone(step.status)].join(' ');

          return (
            <motion.div
              key={step.id}
              initial={{ opacity: 0, x: -10 }}
              animate={{ opacity: 1, x: 0 }}
              // Stagger the entrance so cards appear one after another.
              transition={{ delay: position * 0.1 }}
              className={cardClasses}
            >
              {getStepIcon(step.status)}
              <div className="flex-1 min-w-0">
                <p className={titleClasses}>
                  {step.title}
                </p>
                <p className="text-xs text-gray-400">{step.subtitle}</p>
              </div>
              {step.status === 'completed' && (
                <span className="text-xs text-green-600 font-medium">Done</span>
              )}
            </motion.div>
          );
        })}
      </div>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/streaming/index.ts
================================================
export { default as CodeStreamViewer } from './CodeStreamViewer';
export { default as ProgressTracker } from './ProgressTracker';
export { default as LogViewer } from './LogViewer';
export { default as ActivityLogViewer } from './ActivityLogViewer';


================================================
FILE: new_ui/frontend/src/components/workflow/WorkflowCanvas.tsx
================================================
import { useCallback, useEffect } from 'react';
import ReactFlow, {
  Node,
  Edge,
  Controls,
  MiniMap,
  Background,
  useNodesState,
  useEdgesState,
  addEdge,
  Connection,
  BackgroundVariant,
} from 'reactflow';
import 'reactflow/dist/style.css';
import WorkflowNode from './WorkflowNode';
import type { WorkflowStep } from '../../types/workflow';

/** Props accepted by the WorkflowCanvas component. */
interface WorkflowCanvasProps {
  /** Workflow steps; each becomes one node, laid out left to right in array order. */
  steps: WorkflowStep[];
  /** Index of the active step; steps with a lower index are marked completed. */
  currentStepIndex: number;
  /** Called with a step's id through the `onClick` callback placed in that node's data. */
  onStepClick?: (stepId: string) => void;
}

// Custom node renderers passed to ReactFlow: nodes of type 'workflow' are drawn by WorkflowNode.
const nodeTypes = {
  workflow: WorkflowNode,
};

// Builds one React Flow node per step, spaced 200px apart on a single row.
function buildWorkflowNodes(
  steps: WorkflowStep[],
  currentStepIndex: number,
  onStepClick?: (stepId: string) => void
): Node[] {
  return steps.map((step, index) => ({
    id: step.id,
    type: 'workflow',
    position: { x: index * 200, y: 100 },
    data: {
      ...step,
      isActive: index === currentStepIndex,
      isCompleted: index < currentStepIndex,
      onClick: () => onStepClick?.(step.id),
    },
  }));
}

// Builds the edges linking each step to the next one.
function buildWorkflowEdges(steps: WorkflowStep[], currentStepIndex: number): Edge[] {
  return steps.slice(0, -1).map((step, index) => {
    // The edge entering the active step is animated and blue. It must be
    // tested before the "completed" case, which would otherwise always win
    // because this index is also lower than currentStepIndex.
    const leadsToActive = index === currentStepIndex - 1;
    const stroke = leadsToActive
      ? '#3b82f6'
      : index < currentStepIndex
      ? '#10b981'
      : '#d1d5db';

    return {
      id: `${step.id}-${steps[index + 1].id}`,
      source: step.id,
      target: steps[index + 1].id,
      animated: leadsToActive,
      style: { stroke, strokeWidth: 2 },
    };
  });
}

/**
 * Renders the workflow steps as a left-to-right node graph with zoom
 * controls, a minimap and a dotted background.
 *
 * Nodes and edges live in React Flow state so they can be moved and
 * connected, and are re-derived whenever `steps`, `currentStepIndex` or
 * `onStepClick` change so the canvas follows the workflow's progress.
 *
 * @param steps            Steps to draw, in order.
 * @param currentStepIndex Index of the active step.
 * @param onStepClick      Optional handler called with the clicked step's id.
 */
export default function WorkflowCanvas({
  steps,
  currentStepIndex,
  onStepClick,
}: WorkflowCanvasProps) {
  const [nodes, setNodes, onNodesChange] = useNodesState(
    buildWorkflowNodes(steps, currentStepIndex, onStepClick)
  );
  const [edges, setEdges, onEdgesChange] = useEdgesState(
    buildWorkflowEdges(steps, currentStepIndex)
  );

  // The state hooks only read their argument on the first render, so the
  // graph has to be refreshed explicitly when the props change.
  useEffect(() => {
    const derivedNodes = buildWorkflowNodes(steps, currentStepIndex, onStepClick);
    setNodes((previous) => {
      // Keep the position of nodes the user has already dragged.
      const positions = new Map(previous.map((node) => [node.id, node.position] as const));
      return derivedNodes.map((node) => ({
        ...node,
        position: positions.get(node.id) ?? node.position,
      }));
    });

    const derivedEdges = buildWorkflowEdges(steps, currentStepIndex);
    const derivedIds = new Set(derivedEdges.map((edge) => edge.id));
    // Keep edges added through onConnect; only the step-to-step edges are rebuilt.
    setEdges((previous) => [
      ...derivedEdges,
      ...previous.filter((edge) => !derivedIds.has(edge.id)),
    ]);
  }, [steps, currentStepIndex, onStepClick, setNodes, setEdges]);

  const onConnect = useCallback(
    (params: Connection) => setEdges((eds) => addEdge(params, eds)),
    [setEdges]
  );

  return (
    <div className="h-[500px] rounded-xl border border-gray-200 bg-white overflow-hidden">
      <ReactFlow
        nodes={nodes}
        edges={edges}
        onNodesChange={onNodesChange}
        onEdgesChange={onEdgesChange}
        onConnect={onConnect}
        nodeTypes={nodeTypes}
        fitView
        attributionPosition="bottom-left"
        className="bg-gray-50"
      >
        <Controls
          className="bg-white border border-gray-200 rounded-lg"
          showInteractive={false}
        />
        <MiniMap
          className="bg-white border border-gray-200 rounded-lg"
          nodeColor={(node) => {
            if (node.data.isCompleted) return '#10b981';
            if (node.data.isActive) return '#3b82f6';
            return '#d1d5db';
          }}
        />
        <Background variant={BackgroundVariant.Dots} gap={20} size={1} />
      </ReactFlow>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/components/workflow/WorkflowNode.tsx
================================================
import { memo } from 'react';
import { Handle, Position, NodeProps } from 'reactflow';
import { CheckCircle, Circle, Loader2 } from 'lucide-react';
import { motion } from 'framer-motion';

/** Data payload carried by each 'workflow' node. */
interface WorkflowNodeData {
  /** Identifier of the step the node represents. */
  id: string;
  /** Main label of the node. */
  title: string;
  /** Secondary line shown under the title. */
  subtitle: string;
  /** True for the step currently in progress (spinner and highlighted styling). */
  isActive: boolean;
  /** True for finished steps (check icon and green styling); takes precedence over `isActive`. */
  isCompleted: boolean;
  /** Optional click handler attached to the node body. */
  onClick?: () => void;
}

/** The three mutually exclusive looks a node can take. */
type NodeVisualState = 'completed' | 'active' | 'pending';

/** Tailwind classes for each visual state, grouped by the element they style. */
const NODE_STATE_CLASSES: Record<
  NodeVisualState,
  { card: string; title: string; subtitle: string }
> = {
  completed: {
    card: 'bg-green-50 border-green-300 shadow-green-100',
    title: 'text-green-700',
    subtitle: 'text-green-600',
  },
  active: {
    card: 'bg-primary-50 border-primary-400 shadow-primary-100 shadow-lg',
    title: 'text-primary-700',
    subtitle: 'text-primary-600',
  },
  pending: {
    card: 'bg-white border-gray-200 hover:border-gray-300',
    title: 'text-gray-700',
    subtitle: 'text-gray-400',
  },
};

/** Shared styling for the left (target) and right (source) connection handles. */
const NODE_HANDLE_CLASSES = '!bg-gray-300 !border-2 !border-white !w-3 !h-3';

/**
 * Custom React Flow node for a single workflow step.
 *
 * Renders a target handle on the left, a clickable card with a status icon,
 * title and subtitle, and a source handle on the right. The card's colours
 * and icon depend on `data.isCompleted` / `data.isActive`, with "completed"
 * winning when both are set.
 */
function WorkflowNode({ data }: NodeProps<WorkflowNodeData>) {
  const { title, subtitle, isActive, isCompleted, onClick } = data;

  // Resolve the precedence once instead of repeating the ternary per element.
  const visualState: NodeVisualState = isCompleted
    ? 'completed'
    : isActive
    ? 'active'
    : 'pending';
  const classes = NODE_STATE_CLASSES[visualState];

  const renderStatusIcon = () => {
    switch (visualState) {
      case 'completed':
        return <CheckCircle className="h-4 w-4 text-green-500" />;
      case 'active':
        return <Loader2 className="h-4 w-4 text-primary-500 animate-spin" />;
      default:
        return <Circle className="h-4 w-4 text-gray-300" />;
    }
  };

  return (
    <>
      <Handle
        type="target"
        position={Position.Left}
        className={NODE_HANDLE_CLASSES}
      />

      <motion.div
        initial={{ scale: 0.9, opacity: 0 }}
        animate={{ scale: 1, opacity: 1 }}
        onClick={onClick}
        className={`px-4 py-3 rounded-xl border-2 cursor-pointer transition-all min-w-[140px] ${classes.card}`}
      >
        <div className="flex items-center space-x-2 mb-1">
          {renderStatusIcon()}
          <span className={`text-sm font-semibold ${classes.title}`}>
            {title}
          </span>
        </div>
        <p className={`text-xs ${classes.subtitle}`}>{subtitle}</p>

        {/* The pulsing dot follows `isActive` alone, independent of completion. */}
        {isActive && (
          <motion.div
            layoutId="activeIndicator"
            className="absolute -bottom-1 left-1/2 transform -translate-x-1/2 w-2 h-2 bg-primary-500 rounded-full"
            animate={{ scale: [1, 1.2, 1] }}
            transition={{ repeat: Infinity, duration: 1.5 }}
          />
        )}
      </motion.div>

      <Handle
        type="source"
        position={Position.Right}
        className={NODE_HANDLE_CLASSES}
      />
    </>
  );
}

export default memo(WorkflowNode);


================================================
FILE: new_ui/frontend/src/components/workflow/index.ts
================================================
export { default as WorkflowCanvas } from './WorkflowCanvas';
export { default as WorkflowNode } from './WorkflowNode';


================================================
FILE: new_ui/frontend/src/hooks/index.ts
================================================
export { useWebSocket } from './useWebSocket';
export { useStreaming } from './useStreaming';
export { useAdaptiveLayout } from './useAdaptiveLayout';


================================================
FILE: new_ui/frontend/src/hooks/useAdaptiveLayout.ts
================================================
import { useMemo } from 'react';
import type { TaskType, LayoutConfig } from '../types/common';

// Static layout presets, one per TaskType. Typing this as
// Record<TaskType, LayoutConfig> makes the compiler require an entry for
// every TaskType member.
// NOTE(review): sidebarWidth is presumably in pixels and splitRatio a 0–1
// fraction of the available space — confirm against the LayoutConfig consumer.
const layoutConfigs: Record<TaskType, LayoutConfig> = {
  // Code preview and workflow canvas both visible.
  'paper-to-code': {
    sidebarWidth: 320,
    showCodePreview: true,
    showWorkflowCanvas: true,
    splitRatio: 0.6,
  },
  // Code preview only; the workflow canvas is hidden.
  'chat-planning': {
    sidebarWidth: 280,
    showCodePreview: true,
    showWorkflowCanvas: false,
    splitRatio: 0.5,
  },
  // Workflow canvas only; the code preview is hidden.
  'workflow-editor': {
    sidebarWidth: 240,
    showCodePreview: false,
    showWorkflowCanvas: true,
    splitRatio: 0.7,
  },
  // Neither the code preview nor the workflow canvas is shown.
  settings: {
    sidebarWidth: 280,
    showCodePreview: false,
    showWorkflowCanvas: false,
    splitRatio: 1,
  },
};

/**
 * Returns the layout preset registered for the given task type.
 *
 * @param taskType - Key into the static `layoutConfigs` table.
 * @returns The `LayoutConfig` object stored for `taskType`.
 */
export function useAdaptiveLayout(taskType: TaskType): LayoutConfig {
  const layout = useMemo<LayoutConfig>(() => {
    return layoutConfigs[taskType];
  }, [taskType]);

  return layout;
}


================================================
FILE: new_ui/frontend/src/hooks/useNavigationGuard.ts
================================================
/**
 * Navigation Guard Hook
 *
 * Prevents accidental navigation away from a page when a task is running.
 * - Shows browser warning on refresh/close (beforeunload)
 * - Shows confirmation dialog on in-app navigation
 */

import { useEffect, useCallback, useState } from 'react';
import { useNavigate, useLocation } from 'react-router-dom';
import { useWorkflowStore } from '../stores/workflowStore';

/** Guard-related values tracked by `useNavigationGuard`. */
interface NavigationGuardState {
  /** Whether navigation away from the current page is currently being guarded. */
  isBlocking: boolean;
  /** Path of an in-app navigation that was intercepted and awaits the user's decision, if any. */
  pendingPath: string | null;
  /** Whether the "leave this page?" confirmation dialog should be displayed. */
  showConfirmDialog: boolean;
}

/**
 * Guards against leaving the page while a workflow task is running.
 *
 * - While the workflow store's `status` is `'running'`, a `beforeunload`
 *   listener asks the browser to confirm refresh / tab close.
 * - In-app navigation is cooperative: callers pass the target path to
 *   `attemptNavigation`, which returns `false` (and opens the confirmation
 *   dialog) when the navigation should be held back.
 *
 * @returns
 *   - `isBlocking`: true whenever a task is running. Derived directly from
 *     the store so it can never drift from the real blocking condition.
 *   - `showConfirmDialog` / `pendingPath`: state of the confirmation dialog.
 *   - `attemptNavigation(path)`: returns whether the navigation may proceed.
 *   - `confirmNavigation()`: closes the dialog and navigates to the pending path.
 *   - `cancelNavigation()`: closes the dialog and discards the pending path.
 */
export function useNavigationGuard() {
  const { status } = useWorkflowStore();
  const navigate = useNavigate();
  const location = useLocation();

  // Only the dialog bookkeeping needs to be state. `isBlocking` used to be
  // mirrored into state via an effect, which let `confirmNavigation` leave
  // it stuck at `false` while the task was still running.
  const [dialogState, setDialogState] = useState<
    Pick<NavigationGuardState, 'pendingPath' | 'showConfirmDialog'>
  >({
    pendingPath: null,
    showConfirmDialog: false,
  });

  // Determine if we should block navigation
  const shouldBlock = status === 'running';

  // Handle browser beforeunload event (refresh, close tab, close browser).
  // The listener is only installed while a task is running so that idle
  // pages carry no unload handler at all.
  useEffect(() => {
    if (!shouldBlock) {
      return undefined;
    }

    const handleBeforeUnload = (e: BeforeUnloadEvent) => {
      e.preventDefault();
      // Chrome requires returnValue to be set
      e.returnValue = 'A task is still running. Are you sure you want to leave?';
      return e.returnValue;
    };

    window.addEventListener('beforeunload', handleBeforeUnload);
    return () => window.removeEventListener('beforeunload', handleBeforeUnload);
  }, [shouldBlock]);

  // Function to attempt navigation (called by NavLink wrapper)
  const attemptNavigation = useCallback((path: string) => {
    if (shouldBlock && path !== location.pathname) {
      setDialogState({
        pendingPath: path,
        showConfirmDialog: true,
      });
      return false; // Block navigation
    }
    return true; // Allow navigation
  }, [shouldBlock, location.pathname]);

  // Confirm navigation (user clicked "Leave" in dialog)
  const { pendingPath } = dialogState;
  const confirmNavigation = useCallback(() => {
    setDialogState({
      pendingPath: null,
      showConfirmDialog: false,
    });
    if (pendingPath) {
      navigate(pendingPath);
    }
  }, [pendingPath, navigate]);

  // Cancel navigation (user clicked "Stay" in dialog)
  const cancelNavigation = useCallback(() => {
    setDialogState({
      pendingPath: null,
      showConfirmDialog: false,
    });
  }, []);

  return {
    isBlocking: shouldBlock,
    showConfirmDialog: dialogState.showConfirmDialog,
    pendingPath: dialogState.pendingPath,
    attemptNavigation,
    confirmNavigation,
    cancelNavigation,
  };
}


================================================
FILE: new_ui/frontend/src/hooks/useStreaming.ts
================================================
import { useEffect, useCallback, useRef } from 'react';
import { useWebSocket } from './useWebSocket';
import { useWorkflowStore } from '../stores/workflowStore';
import type {
  WSProgressMessage,
  WSCompleteMessage,
  WSErrorMessage,
  WSCodeChunkMessage,
  WSInteractionMessage,
} from '../types/api';

type WSMessage = WSProgressMessage | WSCompleteMessage | WSErrorMessage | WSCodeChunkMessage | WSInteractionMessage;

/**
 * Subscribes to the two per-task WebSocket channels (`/ws/workflow/{taskId}`
 * and `/ws/code-stream/{taskId}`) and forwards every incoming message into
 * the workflow store.
 *
 * Both sockets share one message handler. The sockets are given a `null`
 * URL (i.e. not connected) when there is no `taskId` or when the store
 * status is `'completed'` or `'error'`.
 *
 * @param taskId - Task to stream, or `null` to stay disconnected.
 * @returns `isConnected` (true if either socket is connected), `isFinished`
 *   (store status is `'completed'` or `'error'`) and a `disconnect` function
 *   that closes both sockets.
 */
export function useStreaming(taskId: string | null) {
  const {
    status,
    updateProgress,
    setStatus,
    setResult,
    setError,
    appendStreamedCode,
    setCurrentFile,
    addGeneratedFile,
    addActivityLog,
    setPendingInteraction,
    clearInteraction,
  } = useWorkflowStore();

  // Track previous taskId to detect changes
  const prevTaskIdRef = useRef<string | null>(null);

  // Determine if finished based on store status (persisted state)
  const isFinished = status === 'completed' || status === 'error';

  // Dispatches one parsed WebSocket message to the matching store action(s).
  const handleMessage = useCallback(
    (message: WSMessage) => {
      console.log('[useStreaming] Received message:', message.type, message);

      switch (message.type) {
        case 'progress':
          if ('progress' in message && message.progress !== undefined) {
            updateProgress(message.progress, message.message || '');
            // Add to activity log if there's a meaningful message
            if (message.message && message.message.trim()) {
              addActivityLog(message.message, message.progress, 'progress');
            }
          }
          break;

        case 'status':
          // Handle status messages - check if task is already completed
          if ('progress' in message && message.progress !== undefined) {
            updateProgress(message.progress, message.message || '');
            // Add initial status to activity log
            if (message.message && message.message.trim()) {
              addActivityLog(message.message, message.progress, 'info');
            }
          }
          // Check if the status indicates completion (for reconnection after task finished).
          // Every branch below only logs; no store state is changed here.
          if ('status' in message) {
            const taskStatus = (message as unknown as { status: string }).status;
            if (taskStatus === 'completed') {
              console.log('[useStreaming] Task already completed (from status message)');
              // Don't set finished here - wait for the complete message with result
            } else if (taskStatus === 'error') {
              console.log('[useStreaming] Task already errored (from status message)');
            } else if (taskStatus === 'waiting_for_input') {
              console.log('[useStreaming] Task waiting for input');
              // The interaction details will come in a separate interaction_required message
            }
          }
          break;

        case 'interaction_required':
          // User-in-Loop: workflow is requesting user input
          console.log('[useStreaming] Interaction required:', message.interaction_type);
          addActivityLog(`⏸️ Waiting for input: ${message.title}`, 0, 'info');
          setPendingInteraction({
            type: message.interaction_type,
            title: message.title,
            description: message.description,
            data: message.data,
            options: message.options,
            required: message.required,
          });
          break;

        case 'complete':
          console.log('[useStreaming] Workflow complete!');
          console.log('[useStreaming] Result:', JSON.stringify(message.result, null, 2));
          setStatus('completed');  // This will make isFinished = true
          setResult(message.result);
          clearInteraction(); // Clear any pending interaction
          // Update progress to 100% to mark all steps as complete
          updateProgress(100, 'Workflow completed successfully');
          addActivityLog('✅ Workflow completed successfully!', 100, 'success');
          break;

        case 'error':
          // Handle "Task not found" - clear state and stop reconnecting
          if (message.error === 'Task not found') {
            console.log('[useStreaming] Task not found, clearing persisted state...');
            // Reset the entire workflow state (this also clears localStorage)
            useWorkflowStore.getState().reset();
          } else {
            // Real error - mark as error state
            setStatus('error');  // This will make isFinished = true
            setError(message.error);
            clearInteraction(); // Clear any pending interaction
            addActivityLog(`❌ Error: ${message.error}`, 0, 'error');
          }
          break;

        case 'code_chunk':
          // Append streamed code; empty chunks are skipped.
          if (message.content) {
            appendStreamedCode(message.content);
          }
          break;

        case 'file_start':
          // Mark the named file as the one currently being streamed.
          if (message.filename) {
            setCurrentFile(message.filename);
          }
          break;

        case 'file_end':
          // Record the finished file and clear the "current file" marker.
          if (message.filename) {
            addGeneratedFile(message.filename);
            setCurrentFile(null);
          }
          break;

        case 'heartbeat':
          // Ignore heartbeat messages
          break;
      }
    },
    [updateProgress, setStatus, setResult, setError, appendStreamedCode, setCurrentFile, addGeneratedFile, addActivityLog, setPendingInteraction, clearInteraction]
  );

  // Compute effective URL - null if finished to stop WebSocket
  const workflowUrl = taskId && !isFinished ? `/ws/workflow/${taskId}` : null;
  const codeStreamUrl = taskId && !isFinished ? `/ws/code-stream/${taskId}` : null;

  // Both channels feed the same handler; the cast bridges this file's local
  // WSMessage union and the handler type expected by useWebSocket.
  const workflowWs = useWebSocket(workflowUrl, {
    onMessage: handleMessage as (message: unknown) => void,
    reconnect: true,
  });

  const codeStreamWs = useWebSocket(codeStreamUrl, {
    onMessage: handleMessage as (message: unknown) => void,
    reconnect: true,
  });

  // Reset status to running only when taskId actually changes to a new value.
  // NOTE(review): prevTaskIdRef starts as null, so the first render with a
  // non-null taskId always counts as a change. If the hook mounts with a
  // taskId whose store status is already 'completed' or 'error', this flips
  // the status back to 'running' and the sockets reconnect — confirm that is
  // the intended behaviour.
  useEffect(() => {
    if (taskId && taskId !== prevTaskIdRef.current) {
      console.log('[useStreaming] taskId changed from', prevTaskIdRef.current, 'to', taskId, '- resetting to running');
      prevTaskIdRef.current = taskId;
      setStatus('running');
    } else if (!taskId) {
      prevTaskIdRef.current = null;
    }
  }, [taskId, setStatus]);

  return {
    isConnected: workflowWs.isConnected || codeStreamWs.isConnected,
    isFinished,
    // Closes both sockets; a new function object is created on every render.
    disconnect: () => {
      workflowWs.disconnect();
      codeStreamWs.disconnect();
    },
  };
}


================================================
FILE: new_ui/frontend/src/hooks/useTaskRecovery.ts
================================================
/**
 * Task Recovery Hook
 *
 * Handles automatic recovery of running tasks after page refresh.
 *
 * Flow:
 * 1. On mount, check if there's a persisted activeTaskId
 * 2. If yes, query the backend to verify task status
 * 3. If task is still running, reconnect WebSocket
 * 4. If task is completed/error, sync the final state
 * 5. If task not found, clear the persisted state
 */

import { useEffect, useCallback, useState } from 'react';
import { useWorkflowStore } from '../stores/workflowStore';
import { workflowsApi } from '../services/api';
import { PAPER_TO_CODE_STEPS, CHAT_PLANNING_STEPS } from '../types/workflow';

/** Local progress/result state of a task-recovery attempt made by `useTaskRecovery`. */
interface RecoveryState {
  /** True while the backend status request for the persisted task is in flight. */
  isRecovering: boolean;
  /** Id of the task whose state was successfully synced from the backend, otherwise null. */
  recoveredTaskId: string | null;
  /** Error message reported by the backend for a task that ended in error, otherwise null. */
  error: string | null;
}

/**
 * Re-synchronises a persisted, in-flight task with the backend after a page
 * reload.
 *
 * On mount, if the store holds an `activeTaskId` whose status is `'running'`
 * (or `'pending'`), the backend is asked for the task's current status and
 * the store is updated to match:
 * - `running`: steps and progress are restored and the status stays running.
 * - `completed`: steps are restored and the final result is stored.
 * - `error`: the error is stored.
 * - anything else, or a failed request: the workflow store is reset.
 *
 * @returns The current `RecoveryState` fields plus `recoverTask`, which can
 *   be called to run the recovery again.
 */
export function useTaskRecovery() {
  const {
    activeTaskId,
    workflowType,
    status,
    setActiveTask,
    setStatus,
    setSteps,
    updateProgress,
    setResult,
    setError,
    setNeedsRecovery,
    reset,
  } = useWorkflowStore();

  const [recoveryState, setRecoveryState] = useState<RecoveryState>({
    isRecovering: false,
    recoveredTaskId: null,
    error: null,
  });

  const recoverTask = useCallback(async () => {
    // Nothing to recover unless a task is persisted and was still in flight.
    const wasInFlight = status !== 'idle' && status !== 'completed' && status !== 'error';
    if (!activeTaskId || !wasInFlight) {
      return;
    }

    // Re-install the step list that belongs to the persisted workflow type.
    const restoreSteps = () => {
      if (workflowType === 'paper-to-code') {
        setSteps(PAPER_TO_CODE_STEPS);
      } else if (workflowType === 'chat-planning') {
        setSteps(CHAT_PLANNING_STEPS);
      }
    };

    // Mark the recovery attempt as finished with the given outcome.
    const settle = (recoveredTaskId: string | null, error: string | null) => {
      setRecoveryState({ isRecovering: false, recoveredTaskId, error });
    };

    console.log('[TaskRecovery] Attempting to recover task:', activeTaskId);
    setRecoveryState({ isRecovering: true, recoveredTaskId: null, error: null });

    try {
      // Ask the backend what actually happened to the task.
      const taskStatus = await workflowsApi.getStatus(activeTaskId);
      console.log('[TaskRecovery] Task status from backend:', taskStatus);

      switch (taskStatus.status) {
        case 'running':
          // Still in progress: restore the UI and let the WebSocket reconnect.
          console.log('[TaskRecovery] Task still running, reconnecting...');
          restoreSteps();
          updateProgress(taskStatus.progress, taskStatus.message);
          setStatus('running');
          setNeedsRecovery(false);
          settle(activeTaskId, null);
          break;

        case 'completed':
          // Finished while the page was away: sync the final state.
          console.log('[TaskRecovery] Task completed, syncing final state...');
          restoreSteps();
          updateProgress(100, 'Completed');
          setStatus('completed');
          setResult(taskStatus.result || null);
          setNeedsRecovery(false);
          settle(activeTaskId, null);
          break;

        case 'error':
          // Failed while the page was away: surface the error.
          console.log('[TaskRecovery] Task errored, syncing error state...');
          setStatus('error');
          setError(taskStatus.error || 'Unknown error');
          setNeedsRecovery(false);
          settle(activeTaskId, taskStatus.error || null);
          break;

        default:
          // Any other status is treated as unrecoverable.
          console.log('[TaskRecovery] Unknown task status, resetting...');
          reset();
          settle(null, null);
          break;
      }
    } catch (err) {
      // Task not found or API error
      console.error('[TaskRecovery] Failed to recover task:', err);

      // Every failure (404 or otherwise) is treated the same way: the
      // persisted task is considered invalid and the store is cleared.
      console.log('[TaskRecovery] Task not recoverable, clearing state...');
      reset();

      // Deliberately no error message: the state is simply cleared.
      settle(null, null);
    }
  }, [activeTaskId, workflowType, status, setActiveTask, setStatus, setSteps, updateProgress, setResult, setError, setNeedsRecovery, reset]);

  // Kick off recovery exactly once, on mount, when a running task was persisted.
  useEffect(() => {
    const hasPersistedRunningTask =
      status === 'running' || (status as string) === 'pending';
    if (activeTaskId && hasPersistedRunningTask) {
      setNeedsRecovery(true);
      recoverTask();
    }
  }, []); // Empty deps - only run on mount

  return {
    ...recoveryState,
    recoverTask,
  };
}


================================================
FILE: new_ui/frontend/src/hooks/useWebSocket.ts
================================================
import { useEffect, useRef, useCallback, useState } from 'react';
import type { WSMessage } from '../types/api';

/** Optional callbacks and reconnection settings accepted by `useWebSocket`. */
interface UseWebSocketOptions {
  /** Called with each incoming message after it has been parsed from JSON. */
  onMessage?: (message: WSMessage) => void;
  /** Called when the socket's `open` event fires. */
  onOpen?: () => void;
  /** Called when the socket's `close` event fires. */
  onClose?: () => void;
  /** Called with the event object when the socket's `error` event fires. */
  onError?: (error: Event) => void;
  /** Whether to reconnect after the socket closes. `useWebSocket` defaults this to `true`. */
  reconnect?: boolean;
  /** Delay in milliseconds before a reconnection attempt. `useWebSocket` defaults this to 3000. */
  reconnectInterval?: number;
  /** Upper bound on consecutive reconnection attempts. `useWebSocket` defaults this to 50. */
  maxReconnectAttempts?: number;
}

/**
 * Manages a single WebSocket connection tied to `url`.
 *
 * The socket is opened whenever `url` is non-null and closed when `url`
 * becomes `null`, changes, or the component unmounts. Incoming messages are
 * parsed as JSON and passed to `options.onMessage`. When the connection
 * drops unexpectedly it is re-opened after `reconnectInterval` ms, up to
 * `maxReconnectAttempts` consecutive times.
 *
 * Sockets that were deliberately retired (by `disconnect()` or by a newer
 * `connect()`) never trigger a reconnect and never touch `isConnected`.
 * Their `close` event arrives asynchronously, possibly after a replacement
 * socket already exists, so the handler checks that it still belongs to the
 * current socket before acting.
 *
 * @param url - Absolute `ws(s)://` URL, or a path that is resolved against
 *   the current page's host (using `wss:` on https pages). `null` keeps the
 *   hook disconnected.
 * @param options - Callbacks and reconnection settings.
 * @returns `isConnected`, the `lastMessage` received, `sendMessage` (a no-op
 *   unless the socket is open), and manual `connect` / `disconnect` controls.
 */
export function useWebSocket(
  url: string | null,
  options: UseWebSocketOptions = {}
) {
  const {
    onMessage,
    onOpen,
    onClose,
    onError,
    reconnect = true,
    reconnectInterval = 3000,
    maxReconnectAttempts = 50,  // Increased for long-running workflows
  } = options;

  const wsRef = useRef<WebSocket | null>(null);
  const reconnectAttemptsRef = useRef(0);
  // `ReturnType<typeof setTimeout>` is correct in both browser and Node typings.
  const reconnectTimeoutRef = useRef<ReturnType<typeof setTimeout> | undefined>(undefined);
  const shouldReconnectRef = useRef(true);

  // Use refs for callbacks to avoid triggering reconnection on callback changes
  const onMessageRef = useRef(onMessage);
  const onOpenRef = useRef(onOpen);
  const onCloseRef = useRef(onClose);
  const onErrorRef = useRef(onError);

  // Update refs when callbacks change
  useEffect(() => {
    onMessageRef.current = onMessage;
    onOpenRef.current = onOpen;
    onCloseRef.current = onClose;
    onErrorRef.current = onError;
  }, [onMessage, onOpen, onClose, onError]);

  const [isConnected, setIsConnected] = useState(false);
  const [lastMessage, setLastMessage] = useState<WSMessage | null>(null);

  const connect = useCallback(() => {
    if (!url) return;

    // A pending timer would otherwise open a second socket right after this one.
    if (reconnectTimeoutRef.current) {
      clearTimeout(reconnectTimeoutRef.current);
      reconnectTimeoutRef.current = undefined;
    }

    // Retire the existing connection. It is detached from wsRef *before*
    // being closed so that its (asynchronous) close handler sees it is stale.
    const previous = wsRef.current;
    if (previous) {
      wsRef.current = null;
      previous.close();
      setIsConnected(false);
    }

    shouldReconnectRef.current = true;

    const wsUrl = url.startsWith('ws')
      ? url
      : `${window.location.protocol === 'https:' ? 'wss:' : 'ws:'}//${window.location.host}${url}`;

    const ws = new WebSocket(wsUrl);
    wsRef.current = ws;

    ws.onopen = () => {
      if (wsRef.current !== ws) return; // superseded before it finished opening
      setIsConnected(true);
      reconnectAttemptsRef.current = 0;
      onOpenRef.current?.();
    };

    ws.onclose = () => {
      const isCurrent = wsRef.current === ws;
      if (isCurrent) {
        setIsConnected(false);
      }
      onCloseRef.current?.();

      // A retired socket must not reconnect: doing so would close the
      // healthy replacement and start an endless reconnect cycle.
      if (!isCurrent) return;

      // Attempt reconnection only if allowed
      if (
        shouldReconnectRef.current &&
        reconnect &&
        reconnectAttemptsRef.current < maxReconnectAttempts
      ) {
        reconnectTimeoutRef.current = setTimeout(() => {
          reconnectAttemptsRef.current += 1;
          connect();
        }, reconnectInterval);
      }
    };

    ws.onerror = (error) => {
      onErrorRef.current?.(error);
    };

    ws.onmessage = (event) => {
      try {
        const message = JSON.parse(event.data) as WSMessage;
        console.log('[useWebSocket] Received:', message.type, message);
        setLastMessage(message);
        if (onMessageRef.current) {
          console.log('[useWebSocket] Calling onMessage handler');
          onMessageRef.current(message);
        } else {
          console.error('[useWebSocket] No onMessage handler registered!');
        }
      } catch (e) {
        console.error('Failed to parse WebSocket message:', event.data, e);
      }
    };
  }, [url, reconnect, reconnectInterval, maxReconnectAttempts]);  // Callbacks are read through refs

  const disconnect = useCallback(() => {
    shouldReconnectRef.current = false;
    if (reconnectTimeoutRef.current) {
      clearTimeout(reconnectTimeoutRef.current);
      reconnectTimeoutRef.current = undefined;
    }
    const ws = wsRef.current;
    if (ws) {
      // Detach first so the socket's close handler treats it as retired.
      wsRef.current = null;
      ws.close();
    }
    // The retired socket's close handler no longer updates this flag.
    setIsConnected(false);
  }, []);

  const sendMessage = useCallback((data: unknown) => {
    if (wsRef.current && wsRef.current.readyState === WebSocket.OPEN) {
      wsRef.current.send(JSON.stringify(data));
    }
  }, []);

  useEffect(() => {
    if (url) {
      // A new URL (or new reconnect settings) gets a fresh retry budget.
      reconnectAttemptsRef.current = 0;
      connect();
    } else {
      disconnect();
    }

    return () => {
      disconnect();
    };
  }, [url, connect, disconnect]);

  return {
    isConnected,
    lastMessage,
    sendMessage,
    connect,
    disconnect,
  };
}


================================================
FILE: new_ui/frontend/src/index.css
================================================
@tailwind base;
@tailwind components;
@tailwind utilities;

/* Base layer: project-wide element defaults. */
@layer base {
  :root {
    /* Default border colour, consumed by the universal rule below. */
    --border-color: #e5e7eb;
  }

  /* Every element takes its border colour from the --border-color variable. */
  * {
    border-color: var(--border-color);
  }

  /* Page-wide background, text colour, font family and font smoothing. */
  body {
    @apply bg-gray-50 text-gray-900 font-sans antialiased;
  }
}

/* Component layer: reusable class names built from Tailwind utilities. */
@layer components {
  /* Shared button foundation: layout, padding, focus ring and disabled state. */
  .btn {
    @apply inline-flex items-center justify-center rounded-lg px-4 py-2 text-sm font-medium transition-colors focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-primary-500 disabled:pointer-events-none disabled:opacity-50;
  }

  /* Filled button in the primary colour; builds on .btn. */
  .btn-primary {
    @apply btn bg-primary-600 text-white hover:bg-primary-700;
  }

  /* Gray filled button; builds on .btn. */
  .btn-secondary {
    @apply btn bg-gray-100 text-gray-900 hover:bg-gray-200;
  }

  /* Button with no background of its own until hovered; builds on .btn. */
  .btn-ghost {
    @apply btn hover:bg-gray-100 hover:text-gray-900;
  }

  /* White, bordered container with rounded corners and a small shadow. */
  .card {
    @apply rounded-xl border border-gray-200 bg-white shadow-sm;
  }

  /* Fixed-height text field, including styling for the file-input button. */
  .input {
    @apply flex h-10 w-full rounded-lg border border-gray-200 bg-white px-3 py-2 text-sm ring-offset-white file:border-0 file:bg-transparent file:text-sm file:font-medium placeholder:text-gray-400 focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-primary-500 focus-visible:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50;
  }

  /* Text area with the same look as .input but a minimum height instead of a fixed one. */
  .textarea {
    @apply flex min-h-[80px] w-full rounded-lg border border-gray-200 bg-white px-3 py-2 text-sm ring-offset-white placeholder:text-gray-400 focus-visible:outline-none focus-visible:ring-2 focus-visible:ring-primary-500 focus-visible:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50;
  }
}

/*
 * Custom scrollbar.
 * These rules use the ::-webkit-scrollbar pseudo-elements, so they only take
 * effect in browsers that implement them.
 */

/* Thickness of vertical (width) and horizontal (height) scrollbars. */
::-webkit-scrollbar {
  width: 8px;
  height: 8px;
}

/* The groove the thumb moves along. */
::-webkit-scrollbar-track {
  background: #f1f5f9;
  border-radius: 4px;
}

/* The draggable thumb. */
::-webkit-scrollbar-thumb {
  background: #cbd5e1;
  border-radius: 4px;
}

/* Darker thumb while hovered. */
::-webkit-scrollbar-thumb:hover {
  background: #94a3b8;
}

/* Monaco editor customization: round the corners of elements carrying the .monaco-editor class. */
.monaco-editor {
  border-radius: 8px;
}


================================================
FILE: new_ui/frontend/src/main.tsx
================================================
import React from 'react'
import ReactDOM from 'react-dom/client'
import { QueryClient, QueryClientProvider } from '@tanstack/react-query'
import App from './App'
import './index.css'

// How long fetched query data is considered fresh before it becomes stale.
const QUERY_STALE_TIME_MS = 5 * 60 * 1000 // 5 minutes

// Single React Query client shared by the whole app: queries stay fresh for
// five minutes and a failed query is retried once.
const queryClient = new QueryClient({
  defaultOptions: {
    queries: {
      staleTime: QUERY_STALE_TIME_MS,
      retry: 1,
    },
  },
})

// Mount the application into the #root element.
const rootElement = document.getElementById('root')!
const appRoot = ReactDOM.createRoot(rootElement)

appRoot.render(
  <React.StrictMode>
    <QueryClientProvider client={queryClient}>
      <App />
    </QueryClientProvider>
  </React.StrictMode>,
)


================================================
FILE: new_ui/frontend/src/pages/ChatPlanningPage.tsx
================================================
import { useState, useEffect, useRef } from 'react';
import { motion, AnimatePresence } from 'framer-motion';
import { Card } from '../components/common';
import { ChatInput } from '../components/input';
import { ProgressTracker, ActivityLogViewer } from '../components/streaming';
import { FileTree } from '../components/results';
import { InlineChatInteraction } from '../components/interaction';
import { useWorkflowStore } from '../stores/workflowStore';
import { useSessionStore } from '../stores/sessionStore';
import { useStreaming } from '../hooks/useStreaming';
import { workflowsApi } from '../services/api';
import { toast } from '../components/common/Toaster';
import { CHAT_PLANNING_STEPS } from '../types/workflow';
import { MessageSquare, User, Bot, CheckCircle, XCircle, FolderOpen, StopCircle } from 'lucide-react';
import { ConfirmDialog } from '../components/common/ConfirmDialog';

/**
 * Chat Planning page.
 *
 * Left column: the conversation (history from the session store, plus any
 * pending inline interaction), the chat input, the "enable indexing" option
 * and a cancel button while a task is running.
 * Right column: progress tracker, activity log, generated file tree and the
 * final completion / error card, all driven by the workflow store.
 */
export default function ChatPlanningPage() {
  const [enableIndexing, setEnableIndexing] = useState(false);
  const [showCancelDialog, setShowCancelDialog] = useState(false);
  const [isCancelling, setIsCancelling] = useState(false);
  // True while the "start workflow" request is in flight. During that window
  // the store status has not become 'running' yet, so it is tracked locally.
  const [isSubmitting, setIsSubmitting] = useState(false);
  // Synchronous lock: state updates are asynchronous, so a ref is what
  // actually stops a second submit fired before the next render.
  const submitLockRef = useRef(false);
  const chatContainerRef = useRef<HTMLDivElement>(null);

  const {
    activeTaskId,
    status,
    progress,
    message,
    steps,
    generatedFiles,
    activityLogs,
    pendingInteraction,
    isWaitingForInput,
    result,
    error,
    setActiveTask,
    setSteps,
    setStatus,
    reset,
  } = useWorkflowStore();

  const { conversationHistory, addMessage } = useSessionStore();
  useStreaming(activeTaskId);

  // Identifies the terminal outcome currently held by the store (if any).
  const outcomeKey =
    status === 'completed' && result
      ? `${activeTaskId}:completed`
      : status === 'error' && error
        ? `${activeTaskId}:error`
        : null;
  // Last outcome that was already announced. It starts at the outcome present
  // on mount so that re-visiting the page does not append the same
  // completion / failure message to the chat history again.
  const announcedOutcomeRef = useRef<string | null>(outcomeKey);

  // Auto-scroll to bottom when new messages or interactions appear
  useEffect(() => {
    if (chatContainerRef.current) {
      chatContainerRef.current.scrollTop = chatContainerRef.current.scrollHeight;
    }
  }, [conversationHistory.length, pendingInteraction]);

  // Show toast and add message when workflow completes (once per outcome)
  useEffect(() => {
    if (outcomeKey === null) {
      // Left the terminal state (e.g. a new task was started): re-arm.
      announcedOutcomeRef.current = null;
      return;
    }
    if (announcedOutcomeRef.current === outcomeKey) return;
    announcedOutcomeRef.current = outcomeKey;

    if (status === 'completed' && result) {
      toast.success('Code generation complete!', 'Your project has been generated successfully.');
      // Add completion message to chat
      const codeDir = result.repo_result && typeof result.repo_result === 'object'
        ? (result.repo_result as Record<string, unknown>).code_directory as string
        : null;
      addMessage({
        role: 'assistant',
        content: codeDir
          ? `Code generation complete! Your project has been generated at:\n\n${codeDir}`
          : 'Code generation complete! Your project has been successfully generated.',
      });
    } else if (status === 'error' && error) {
      toast.error('Generation failed', error);
      addMessage({
        role: 'assistant',
        content: `Sorry, code generation failed: ${error}`,
      });
    }
  }, [outcomeKey, status, error, result, addMessage]);

  // Handle task cancellation: ask the backend to cancel, then clear local
  // workflow state. The confirmation dialog is closed whether or not the
  // request succeeded.
  const handleCancelTask = async () => {
    if (!activeTaskId) return;

    setIsCancelling(true);
    try {
      await workflowsApi.cancel(activeTaskId);
      setStatus('idle');
      reset();
      addMessage({
        role: 'assistant',
        content: 'Task cancelled. Feel free to start a new request.',
      });
      toast.info('Task cancelled', 'The workflow has been stopped.');
    } catch (err) {
      toast.error('Cancel failed', 'Could not cancel the task.');
      console.error('Cancel error:', err);
    } finally {
      setIsCancelling(false);
      setShowCancelDialog(false);
    }
  };

  // Start a chat-planning workflow from the user's requirement text.
  const handleSubmit = async (userMessage: string) => {
    // Ignore re-entrant submits while a start request is still pending.
    if (submitLockRef.current) return;
    submitLockRef.current = true;
    setIsSubmitting(true);

    try {
      // Add user message to history
      addMessage({ role: 'user', content: userMessage });

      reset();
      setSteps(CHAT_PLANNING_STEPS);

      const response = await workflowsApi.startChatPlanning(
        userMessage,
        enableIndexing
      );

      setActiveTask(response.task_id, 'chat-planning');
      addMessage({
        role: 'assistant',
        content: 'Starting code generation...',
        metadata: { taskId: response.task_id },
      });

      toast.info('Workflow started', 'Generating code from your requirements...');
    } catch (err) {
      toast.error('Failed to start workflow', 'Please try again');
      addMessage({
        role: 'assistant',
        content: 'Sorry, there was an error processing your request.',
      });
      console.error('Start error:', err);
    } finally {
      submitLockRef.current = false;
      setIsSubmitting(false);
    }
  };

  const isRunning = status === 'running';
  // Inputs are locked both while a task runs and while one is being started.
  const isBusy = isRunning || isSubmitting;

  return (
    <div className="space-y-6">
      {/* Header */}
      <motion.div
        initial={{ opacity: 0, y: -10 }}
        animate={{ opacity: 1, y: 0 }}
      >
        <h1 className="text-2xl font-bold text-gray-900">Chat Planning</h1>
        <p className="text-gray-500 mt-1">
          Describe your project and let AI generate the code for you
        </p>
      </motion.div>

      <div className="grid gap-6 lg:grid-cols-2">
        {/* Left Column - Chat */}
        <div className="space-y-6">
          <Card padding="none" className="flex flex-col h-[600px]">
            {/* Chat Header */}
            <div className="px-4 py-3 border-b border-gray-100">
              <div className="flex items-center space-x-2">
                <MessageSquare className="h-5 w-5 text-primary-500" />
                <span className="font-medium text-gray-900">
                  Project Requirements
                </span>
              </div>
            </div>

            {/* Chat Messages */}
            <div ref={chatContainerRef} className="flex-1 overflow-y-auto p-4 space-y-4">
              {conversationHistory.length === 0 && !pendingInteraction ? (
                <div className="h-full flex items-center justify-center text-center text-gray-400">
                  <div>
                    <MessageSquare className="h-12 w-12 mx-auto mb-3 opacity-50" />
                    <p className="text-sm">
                      Describe your project requirements to get started
                    </p>
                  </div>
                </div>
              ) : (
                <>
                  {conversationHistory.map((msg) => (
                    <motion.div
                      key={msg.id}
                      initial={{ opacity: 0, y: 10 }}
                      animate={{ opacity: 1, y: 0 }}
                      className={`flex items-start space-x-3 ${
                        msg.role === 'user' ? 'flex-row-reverse space-x-reverse' : ''
                      }`}
                    >
                      <div
                        className={`flex-shrink-0 w-8 h-8 rounded-full flex items-center justify-center ${
                          msg.role === 'user'
                            ? 'bg-primary-100'
                            : 'bg-gray-100'
                        }`}
                      >
                        {msg.role === 'user' ? (
                          <User className="h-4 w-4 text-primary-600" />
                        ) : (
                          <Bot className="h-4 w-4 text-gray-600" />
                        )}
                      </div>
                      <div
                        className={`max-w-[80%] px-4 py-2 rounded-2xl ${
                          msg.role === 'user'
                            ? 'bg-primary-500 text-white'
                            : 'bg-gray-100 text-gray-900'
                        }`}
                      >
                        <p className="text-sm whitespace-pre-wrap">{msg.content}</p>
                      </div>
                    </motion.div>
                  ))}

                  {/* Inline Interaction - displayed in chat flow */}
                  <AnimatePresence>
                    {pendingInteraction && activeTaskId && (
                      <InlineChatInteraction
                        taskId={activeTaskId}
                        interaction={pendingInteraction}
                      />
                    )}
                  </AnimatePresence>
                </>
              )}
            </div>

            {/* Chat Input */}
            <div className="p-4 border-t border-gray-100">
              <ChatInput
                onSubmit={handleSubmit}
                isLoading={isBusy}
                placeholder="Describe your project requirements..."
              />
            </div>
          </Card>

          {/* Options */}
          <Card>
            <label className="flex items-center space-x-3 cursor-pointer">
              <input
                type="checkbox"
                checked={enableIndexing}
                onChange={(e) => setEnableIndexing(e.target.checked)}
                disabled={isBusy}
                className="w-4 h-4 text-primary-600 rounded focus:ring-primary-500 disabled:opacity-50"
              />
              <span className={`text-sm ${isBusy ? 'text-gray-400' : 'text-gray-700'}`}>
                Enable code indexing for better results
              </span>
            </label>

            {/* Cancel Button */}
            {isRunning && (
              <button
                onClick={() => setShowCancelDialog(true)}
                disabled={isCancelling}
                className="mt-4 w-full flex items-center justify-center space-x-2 px-4 py-2 text-sm font-medium text-red-600 bg-red-50 border border-red-200 rounded-lg hover:bg-red-100 transition-colors disabled:opacity-50"
              >
                <StopCircle className="h-4 w-4" />
                <span>Cancel Task</span>
              </button>
            )}
          </Card>
        </div>

        {/* Right Column - Results */}
        <div className="space-y-6">
          {/* Progress */}
          {status !== 'idle' && (
            <Card>
              <ProgressTracker steps={steps} currentProgress={progress} />
            </Card>
          )}

          {/* Activity Log */}
          <ActivityLogViewer
            logs={activityLogs}
            isRunning={isRunning && !isWaitingForInput}
            currentMessage={isWaitingForInput ? 'Waiting for your input...' : message}
          />

          {/* Generated Files */}
          {generatedFiles.length > 0 && (
            <FileTree files={generatedFiles} />
          )}

          {/* Completion Status */}
          {status === 'completed' && result && (
            <motion.div
              initial={{ opacity: 0, scale: 0.95 }}
              animate={{ opacity: 1, scale: 1 }}
            >
              <Card className="border-green-200 bg-green-50">
                <div className="flex items-start space-x-3">
                  <CheckCircle className="h-6 w-6 text-green-500 flex-shrink-0" />
                  <div className="flex-1">
                    <h3 className="font-medium text-green-900">
                      Code Generation Complete!
                    </h3>
                    <p className="text-sm text-green-700 mt-1">
                      Your code has been successfully generated.
                    </p>
                    {result.repo_result && typeof result.repo_result === 'object' && 'code_directory' in (result.repo_result as Record<string, unknown>) ? (
                      <div className="mt-3 flex items-center text-sm text-green-600">
                        <FolderOpen className="h-4 w-4 mr-2" />
                        <span className="font-mono text-xs">
                          {String((result.repo_result as Record<string, unknown>).code_directory)}
                        </span>
                      </div>
                    ) : null}
                  </div>
                </div>
              </Card>
            </motion.div>
          )}

          {/* Error Status */}
          {status === 'error' && error && (
            <motion.div
              initial={{ opacity: 0, scale: 0.95 }}
              animate={{ opacity: 1, scale: 1 }}
            >
              <Card className="border-red-200 bg-red-50">
                <div className="flex items-start space-x-3">
                  <XCircle className="h-6 w-6 text-red-500 flex-shrink-0" />
                  <div className="flex-1">
                    <h3 className="font-medium text-red-900">
                      Generation Failed
                    </h3>
                    <p className="text-sm text-red-700 mt-1">
                      {error}
                    </p>
                  </div>
                </div>
              </Card>
            </motion.div>
          )}
        </div>
      </div>

      {/* Cancel Confirmation Dialog */}
      <ConfirmDialog
        isOpen={showCancelDialog}
        title="Cancel Task?"
        message="Are you sure you want to cancel this task? Any progress will be lost and you'll need to start over."
        confirmLabel="Yes, Cancel"
        cancelLabel="Keep Running"
        variant="danger"
        onConfirm={handleCancelTask}
        onCancel={() => setShowCancelDialog(false)}
      />
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/pages/HomePage.tsx
================================================
import { Link } from 'react-router-dom';
import { motion } from 'framer-motion';
import {
  FileText,
  MessageSquare,
  GitBranch,
  ArrowRight,
  Rocket,
  Palette,
  Server,
  Users,
} from 'lucide-react';
import { Card } from '../components/common';

// Cards rendered in the "Powerful Features" grid on the home page.
// - icon:        lucide-react icon component drawn inside the badge
// - title:       card heading; also used as the React list key
// - description: body text of the card
// - color:       text-color utility class applied to the icon
// - bgColor:     background utility class applied to the icon's badge
const features = [
  {
    icon: Rocket,
    title: 'Paper2Code',
    description:
      'Automated implementation of complex algorithms from research papers into high-quality, production-ready code.',
    color: 'text-red-500',
    bgColor: 'bg-red-50',
  },
  {
    icon: Palette,
    title: 'Text2Web',
    description:
      'Translates plain textual descriptions into fully functional, visually appealing front-end web code.',
    color: 'text-teal-500',
    bgColor: 'bg-teal-50',
  },
  {
    icon: Server,
    title: 'Text2Backend',
    description:
      'Generates efficient, scalable, and feature-rich back-end code from simple text inputs.',
    color: 'text-purple-500',
    bgColor: 'bg-purple-50',
  },
  {
    icon: Users,
    title: 'User-in-Loop',
    description:
      'Interactive collaboration with AI agents through real-time feedback and inline chat interaction.',
    color: 'text-blue-500',
    bgColor: 'bg-blue-50',
  },
];

// Quick-action cards shown under the hero section of the home page.
// - path:        route the card links to; also used as the React list key
// - icon:        lucide-react icon component shown in the gradient badge
// - title / description: card heading and body text
// - color:       gradient stop classes appended after `bg-gradient-to-r`
//                on the icon badge
const actions = [
  {
    path: '/paper-to-code',
    icon: FileText,
    title: 'Paper to Code',
    description: 'Convert research papers into working implementations',
    color: 'from-blue-500 to-indigo-600',
  },
  {
    path: '/chat',
    icon: MessageSquare,
    title: 'Chat Planning',
    description: 'Describe your project and let AI generate the code',
    color: 'from-purple-500 to-pink-600',
  },
  {
    path: '/workflow',
    icon: GitBranch,
    title: 'Workflow Editor',
    description: 'Visual workflow design for complex projects',
    color: 'from-green-500 to-teal-600',
  },
];

/**
 * Landing page: a hero banner, one linked card per entry in `actions`,
 * and a grid of cards built from `features`. Cards fade in with a small
 * per-item stagger.
 */
export default function HomePage() {
  // One linked card per quick action; each card starts 0.1s after the previous one.
  const actionCards = actions.map(
    ({ path, icon: ActionIcon, title, description, color }, position) => (
      <motion.div
        key={path}
        initial={{ opacity: 0, y: 20 }}
        animate={{ opacity: 1, y: 0 }}
        transition={{ delay: position * 0.1 }}
      >
        <Link to={path}>
          <Card className="group hover:shadow-md transition-shadow h-full">
            <div
              className={`inline-flex p-3 rounded-xl bg-gradient-to-r ${color} mb-4`}
            >
              <ActionIcon className="h-6 w-6 text-white" />
            </div>
            <h3 className="text-lg font-semibold text-gray-900 mb-2 group-hover:text-primary-600 transition-colors">
              {title}
            </h3>
            <p className="text-gray-500 text-sm mb-4">
              {description}
            </p>
            <span className="inline-flex items-center text-sm font-medium text-primary-600">
              Get started
              <ArrowRight className="ml-1 h-4 w-4 group-hover:translate-x-1 transition-transform" />
            </span>
          </Card>
        </Link>
      </motion.div>
    ),
  );

  // Feature cards use the same stagger, offset by an extra 0.2s.
  const featureCards = features.map(
    ({ icon: FeatureIcon, title, description, color, bgColor }, position) => (
      <motion.div
        key={title}
        initial={{ opacity: 0, scale: 0.95 }}
        animate={{ opacity: 1, scale: 1 }}
        transition={{ delay: 0.2 + position * 0.1 }}
      >
        <Card className="h-full">
          <div
            className={`inline-flex p-2.5 rounded-lg ${bgColor} mb-3`}
          >
            <FeatureIcon className={`h-5 w-5 ${color}`} />
          </div>
          <h3 className="font-semibold text-gray-900 mb-2">
            {title}
          </h3>
          <p className="text-sm text-gray-500">{description}</p>
        </Card>
      </motion.div>
    ),
  );

  return (
    <div className="space-y-12">
      {/* Hero */}
      <motion.div
        initial={{ opacity: 0, y: 20 }}
        animate={{ opacity: 1, y: 0 }}
        className="text-center"
      >
        <h1 className="text-4xl font-bold text-gray-900 mb-4">
          Welcome to{' '}
          <span className="bg-gradient-to-r from-primary-600 to-indigo-600 bg-clip-text text-transparent">
            DeepCode
          </span>
        </h1>
        <p className="text-lg text-gray-600 max-w-2xl mx-auto">
          Transform research papers and natural language specifications into
          production-ready code with AI-powered automation.
        </p>
      </motion.div>

      {/* Quick Actions */}
      <div className="grid gap-6 md:grid-cols-3">
        {actionCards}
      </div>

      {/* Features */}
      <div>
        <h2 className="text-2xl font-bold text-gray-900 mb-6 text-center">
          Powerful Features
        </h2>
        <div className="grid gap-6 md:grid-cols-2 lg:grid-cols-4">
          {featureCards}
        </div>
      </div>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/pages/PaperToCodePage.tsx
================================================
import { useState, useEffect, useRef } from 'react';
import { motion, AnimatePresence } from 'framer-motion';
import { Card, Button } from '../components/common';
import { FileUploader, UrlInput } from '../components/input';
import { ProgressTracker, ActivityLogViewer } from '../components/streaming';
import { FileTree } from '../components/results';
import { InteractionPanel } from '../components/interaction';
import { useWorkflowStore } from '../stores/workflowStore';
import { useStreaming } from '../hooks/useStreaming';
import { workflowsApi } from '../services/api';
import { toast } from '../components/common/Toaster';
import { PAPER_TO_CODE_STEPS } from '../types/workflow';
import { CheckCircle, XCircle, FolderOpen, StopCircle } from 'lucide-react';
import { ConfirmDialog } from '../components/common/ConfirmDialog';

// Which of the two input tabs is active.
type InputMethod = 'file' | 'url';

/**
 * Paper to Code page.
 *
 * Left column: choose the paper source (uploaded PDF or URL), start the
 * workflow, cancel it while it runs, and toggle code indexing.
 * Right column: progress tracker, user-in-loop interaction panel, activity
 * log, generated file tree and the final completion / error card, all driven
 * by the workflow store.
 */
export default function PaperToCodePage() {
  const [inputMethod, setInputMethod] = useState<InputMethod>('file');
  const [uploadedFilePath, setUploadedFilePath] = useState<string | null>(null);
  const [enableIndexing, setEnableIndexing] = useState(false);
  const [showCancelDialog, setShowCancelDialog] = useState(false);
  const [isCancelling, setIsCancelling] = useState(false);
  // True while the "start workflow" request is in flight. During that window
  // the store status has not become 'running' yet, so it is tracked locally.
  const [isStarting, setIsStarting] = useState(false);
  // Synchronous lock: state updates are asynchronous, so a ref is what
  // actually stops a second start fired before the next render.
  const startLockRef = useRef(false);

  const {
    activeTaskId,
    status,
    progress,
    message,
    steps,
    generatedFiles,
    activityLogs,
    pendingInteraction,
    isWaitingForInput,
    result,
    error,
    setActiveTask,
    setSteps,
    setStatus,
    reset,
  } = useWorkflowStore();

  useStreaming(activeTaskId);

  // Show toast when workflow completes
  useEffect(() => {
    if (status === 'completed' && result) {
      toast.success('Paper processing complete!', 'Code has been generated successfully.');
    } else if (status === 'error' && error) {
      toast.error('Processing failed', error);
    }
  }, [status, error, result]);

  // Handle task cancellation: ask the backend to cancel, then clear local
  // workflow state. The confirmation dialog is closed whether or not the
  // request succeeded.
  const handleCancelTask = async () => {
    if (!activeTaskId) return;

    setIsCancelling(true);
    try {
      await workflowsApi.cancel(activeTaskId);
      setStatus('idle');
      reset();
      toast.info('Task cancelled', 'The workflow has been stopped.');
    } catch (err) {
      toast.error('Cancel failed', 'Could not cancel the task.');
      console.error('Cancel error:', err);
    } finally {
      setIsCancelling(false);
      setShowCancelDialog(false);
    }
  };

  // Start the paper-to-code workflow for an uploaded file path or a URL.
  const handleStart = async (inputSource: string, inputType: 'file' | 'url') => {
    // Ignore re-entrant starts while a start request is still pending.
    if (startLockRef.current) return;
    startLockRef.current = true;
    setIsStarting(true);

    try {
      reset();
      setSteps(PAPER_TO_CODE_STEPS);

      const response = await workflowsApi.startPaperToCode(
        inputSource,
        inputType,
        enableIndexing
      );

      setActiveTask(response.task_id, 'paper-to-code');
      toast.info('Workflow started', 'Processing your paper...');
    } catch (err) {
      toast.error('Failed to start workflow', 'Please try again');
      console.error('Start error:', err);
    } finally {
      startLockRef.current = false;
      setIsStarting(false);
    }
  };

  // Remember where the uploaded file was stored; the file id is not needed here.
  const handleFileUploaded = (_fileId: string, path: string) => {
    setUploadedFilePath(path);
  };

  const handleUrlSubmit = (url: string) => {
    // handleStart reports its own failures, so the promise is intentionally not awaited.
    void handleStart(url, 'url');
  };

  const handleStartWithFile = () => {
    if (uploadedFilePath) {
      void handleStart(uploadedFilePath, 'file');
    }
  };

  const isRunning = status === 'running';
  // Inputs are locked both while a task runs and while one is being started.
  const isBusy = isRunning || isStarting;

  return (
    <div className="space-y-6">
      {/* Header */}
      <motion.div
        initial={{ opacity: 0, y: -10 }}
        animate={{ opacity: 1, y: 0 }}
      >
        <h1 className="text-2xl font-bold text-gray-900">Paper to Code</h1>
        <p className="text-gray-500 mt-1">
          Upload a research paper and convert it to a working implementation
        </p>
      </motion.div>

      <div className="grid gap-6 lg:grid-cols-2">
        {/* Left Column - Input */}
        <div className="space-y-6">
          <Card>
            <h3 className="font-semibold text-gray-900 mb-4">Input Source</h3>

            {/* Input Method Tabs */}
            <div className="flex space-x-2 mb-4">
              <button
                onClick={() => setInputMethod('file')}
                className={`flex-1 px-4 py-2 text-sm font-medium rounded-lg transition-colors ${
                  inputMethod === 'file'
                    ? 'bg-primary-50 text-primary-600'
                    : 'text-gray-600 hover:bg-gray-50'
                }`}
              >
                Upload PDF
              </button>
              <button
                onClick={() => setInputMethod('url')}
                className={`flex-1 px-4 py-2 text-sm font-medium rounded-lg transition-colors ${
                  inputMethod === 'url'
                    ? 'bg-primary-50 text-primary-600'
                    : 'text-gray-600 hover:bg-gray-50'
                }`}
              >
                URL Link
              </button>
            </div>

            {/* Input Components */}
            {inputMethod === 'file' ? (
              <div className="space-y-4">
                <FileUploader onFileUploaded={handleFileUploaded} disabled={isBusy} />
                {uploadedFilePath && !isRunning && (
                  <Button
                    onClick={handleStartWithFile}
                    isLoading={isStarting}
                    className="w-full"
                  >
                    Start Processing
                  </Button>
                )}
              </div>
            ) : (
              <UrlInput onSubmit={handleUrlSubmit} isLoading={isBusy} disabled={isBusy} />
            )}

            {/* Cancel Button */}
            {isRunning && (
              <div className="mt-4">
                <button
                  onClick={() => setShowCancelDialog(true)}
                  disabled={isCancelling}
                  className="w-full flex items-center justify-center space-x-2 px-4 py-2 text-sm font-medium text-red-600 bg-red-50 border border-red-200 rounded-lg hover:bg-red-100 transition-colors disabled:opacity-50"
                >
                  <StopCircle className="h-4 w-4" />
                  <span>Cancel Task</span>
                </button>
              </div>
            )}

            {/* Options */}
            <div className="mt-6 pt-4 border-t border-gray-100">
              <label className="flex items-center space-x-3 cursor-pointer">
                {/* The flag is only read when a workflow is started, so it is locked while one is active */}
                <input
                  type="checkbox"
                  checked={enableIndexing}
                  onChange={(e) => setEnableIndexing(e.target.checked)}
                  disabled={isBusy}
                  className="w-4 h-4 text-primary-600 rounded focus:ring-primary-500 disabled:opacity-50"
                />
                <span className={`text-sm ${isBusy ? 'text-gray-400' : 'text-gray-700'}`}>
                  Enable code indexing
                </span>
              </label>
              <p className="text-xs text-gray-400 mt-1 ml-7">
                Improves code quality but takes longer
              </p>
            </div>
          </Card>
        </div>

        {/* Right Column - Progress & Results */}
        <div className="space-y-6">
          {/* Progress */}
          {status !== 'idle' && (
            <Card>
              <ProgressTracker steps={steps} currentProgress={progress} />
            </Card>
          )}

          {/* User-in-Loop Interaction Panel */}
          <AnimatePresence>
            {pendingInteraction && activeTaskId && (
              <InteractionPanel
                taskId={activeTaskId}
                interaction={pendingInteraction}
              />
            )}
          </AnimatePresence>

          {/* Activity Log */}
          <ActivityLogViewer
            logs={activityLogs}
            isRunning={isRunning && !isWaitingForInput}
            currentMessage={isWaitingForInput ? 'Waiting for your input...' : message}
          />

          {/* Generated Files */}
          {generatedFiles.length > 0 && (
            <FileTree files={generatedFiles} />
          )}

          {/* Completion Status */}
          {status === 'completed' && result && (
            <motion.div
              initial={{ opacity: 0, scale: 0.95 }}
              animate={{ opacity: 1, scale: 1 }}
            >
              <Card className="border-green-200 bg-green-50">
                <div className="flex items-start space-x-3">
                  <CheckCircle className="h-6 w-6 text-green-500 flex-shrink-0" />
                  <div className="flex-1">
                    <h3 className="font-medium text-green-900">
                      Code Generation Complete!
                    </h3>
                    <p className="text-sm text-green-700 mt-1">
                      Your code has been successfully generated from the paper.
                    </p>
                    {result.repo_result && typeof result.repo_result === 'object' && 'code_directory' in (result.repo_result as Record<string, unknown>) ? (
                      <div className="mt-3 flex items-center text-sm text-green-600">
                        <FolderOpen className="h-4 w-4 mr-2" />
                        <span className="font-mono text-xs">
                          {String((result.repo_result as Record<string, unknown>).code_directory)}
                        </span>
                      </div>
                    ) : null}
                  </div>
                </div>
              </Card>
            </motion.div>
          )}

          {/* Error Status */}
          {status === 'error' && error && (
            <motion.div
              initial={{ opacity: 0, scale: 0.95 }}
              animate={{ opacity: 1, scale: 1 }}
            >
              <Card className="border-red-200 bg-red-50">
                <div className="flex items-start space-x-3">
                  <XCircle className="h-6 w-6 text-red-500 flex-shrink-0" />
                  <div className="flex-1">
                    <h3 className="font-medium text-red-900">
                      Processing Failed
                    </h3>
                    <p className="text-sm text-red-700 mt-1">
                      {error}
                    </p>
                  </div>
                </div>
              </Card>
            </motion.div>
          )}
        </div>
      </div>

      {/* Cancel Confirmation Dialog */}
      <ConfirmDialog
        isOpen={showCancelDialog}
        title="Cancel Task?"
        message="Are you sure you want to cancel this task? Any progress will be lost and you'll need to start over."
        confirmLabel="Yes, Cancel"
        cancelLabel="Keep Running"
        variant="danger"
        onConfirm={handleCancelTask}
        onCancel={() => setShowCancelDialog(false)}
      />
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/pages/SettingsPage.tsx
================================================
import { useState, useEffect } from 'react';
import { motion } from 'framer-motion';
import { useQuery, useMutation, useQueryClient } from '@tanstack/react-query';
import { Card, Button } from '../components/common';
import { toast } from '../components/common/Toaster';
import { configApi } from '../services/api';
import { Settings, Server, Cpu, Check } from 'lucide-react';

/**
 * Settings page.
 *
 * Loads the current settings and the list of available LLM providers, lets
 * the user pick a provider and save it, and shows a read-only summary of the
 * active configuration (provider, planning / implementation models, indexing).
 */
export default function SettingsPage() {
  const queryClient = useQueryClient();

  const { data: settings, isLoading } = useQuery({
    queryKey: ['settings'],
    queryFn: configApi.getSettings,
  });

  const { data: providers } = useQuery({
    queryKey: ['llm-providers'],
    queryFn: configApi.getLLMProviders,
  });

  const updateProviderMutation = useMutation({
    mutationFn: configApi.setLLMProvider,
    onSuccess: () => {
      // Refetch both queries so the page reflects the newly saved provider.
      queryClient.invalidateQueries({ queryKey: ['settings'] });
      queryClient.invalidateQueries({ queryKey: ['llm-providers'] });
      toast.success('Settings saved', 'LLM provider updated');
    },
    onError: () => {
      toast.error('Failed to save', 'Please try again');
    },
  });

  // Provider currently highlighted in the list (not necessarily saved yet).
  const [selectedProvider, setSelectedProvider] = useState('');

  const savedProvider = settings?.llm_provider;

  // Adopt the saved provider as the selection whenever the saved value itself
  // changes, rather than on every new `settings` object.
  useEffect(() => {
    if (savedProvider) {
      setSelectedProvider(savedProvider);
    }
  }, [savedProvider]);

  // There is something to save only when a provider is actually selected and
  // it differs from the saved one. An empty selection is never "unsaved".
  const hasUnsavedChange = Boolean(selectedProvider) && selectedProvider !== savedProvider;

  const handleSaveProvider = () => {
    if (hasUnsavedChange) {
      updateProviderMutation.mutate(selectedProvider);
    }
  };

  // Display names and blurbs for known provider ids; unknown ids fall back to
  // the raw id with an empty description.
  const providerInfo: Record<string, { name: string; description: string }> = {
    google: {
      name: 'Google Gemini',
      description: 'Uses Gemini models for code generation',
    },
    anthropic: {
      name: 'Anthropic Claude',
      description: 'Uses Claude models for high-quality output',
    },
    openai: {
      name: 'OpenAI',
      description: 'Uses GPT models for code generation',
    },
  };

  if (isLoading) {
    return (
      <div className="flex items-center justify-center h-64">
        <div className="animate-spin rounded-full h-8 w-8 border-b-2 border-primary-600"></div>
      </div>
    );
  }

  return (
    <div className="space-y-6 max-w-2xl">
      {/* Header */}
      <motion.div
        initial={{ opacity: 0, y: -10 }}
        animate={{ opacity: 1, y: 0 }}
      >
        <h1 className="text-2xl font-bold text-gray-900">Settings</h1>
        <p className="text-gray-500 mt-1">
          Configure DeepCode to match your preferences
        </p>
      </motion.div>

      {/* LLM Provider */}
      <Card>
        <div className="flex items-center space-x-3 mb-6">
          <div className="p-2 bg-primary-50 rounded-lg">
            <Cpu className="h-5 w-5 text-primary-600" />
          </div>
          <div>
            <h3 className="font-semibold text-gray-900">LLM Provider</h3>
            <p className="text-sm text-gray-500">
              Choose the AI model provider for code generation
            </p>
          </div>
        </div>

        <div className="space-y-3">
          {providers?.available_providers.map((provider) => {
            const info = providerInfo[provider];
            const isSelected = selectedProvider === provider;

            return (
              <button
                key={provider}
                onClick={() => setSelectedProvider(provider)}
                className={`w-full flex items-center justify-between p-4 rounded-lg border-2 transition-colors ${
                  isSelected
                    ? 'border-primary-500 bg-primary-50'
                    : 'border-gray-200 hover:border-gray-300'
                }`}
              >
                <div className="flex items-center space-x-3">
                  <Server
                    className={`h-5 w-5 ${
                      isSelected ? 'text-primary-600' : 'text-gray-400'
                    }`}
                  />
                  <div className="text-left">
                    <div
                      className={`font-medium ${
                        isSelected ? 'text-primary-900' : 'text-gray-900'
                      }`}
                    >
                      {info?.name || provider}
                    </div>
                    <div
                      className={`text-sm ${
                        isSelected ? 'text-primary-600' : 'text-gray-500'
                      }`}
                    >
                      {info?.description || ''}
                    </div>
                  </div>
                </div>
                {isSelected && (
                  <Check className="h-5 w-5 text-primary-600" />
                )}
              </button>
            );
          })}
        </div>

        {hasUnsavedChange && (
          <div className="mt-4 pt-4 border-t border-gray-100">
            <Button
              onClick={handleSaveProvider}
              isLoading={updateProviderMutation.isPending}
            >
              Save Changes
            </Button>
          </div>
        )}
      </Card>

      {/* Current Models */}
      <Card>
        <div className="flex items-center space-x-3 mb-4">
          <div className="p-2 bg-gray-100 rounded-lg">
            <Settings className="h-5 w-5 text-gray-600" />
          </div>
          <h3 className="font-semibold text-gray-900">Current Configuration</h3>
        </div>

        <div className="space-y-3">
          <div className="flex justify-between py-2 border-b border-gray-100">
            <span className="text-sm text-gray-500">Active Provider</span>
            <span className="text-sm font-medium text-gray-900">
              {providerInfo[savedProvider || '']?.name || savedProvider || 'N/A'}
            </span>
          </div>
          <div className="flex justify-between py-2 border-b border-gray-100">
            <span className="text-sm text-gray-500">Planning Model</span>
            <span className="text-sm font-mono text-gray-900">
              {settings?.models?.planning || 'N/A'}
            </span>
          </div>
          <div className="flex justify-between py-2 border-b border-gray-100">
            <span className="text-sm text-gray-500">Implementation Model</span>
            <span className="text-sm font-mono text-gray-900">
              {settings?.models?.implementation || 'N/A'}
            </span>
          </div>
          <div className="flex justify-between py-2">
            <span className="text-sm text-gray-500">Code Indexing</span>
            <span className="text-sm text-gray-900">
              {settings?.indexing_enabled ? 'Enabled' : 'Disabled'}
            </span>
          </div>
        </div>
      </Card>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/pages/WorkflowEditorPage.tsx
================================================
import { motion } from 'framer-motion';
import { Card } from '../components/common';
import { WorkflowCanvas } from '../components/workflow';
import { PAPER_TO_CODE_STEPS, CHAT_PLANNING_STEPS } from '../types/workflow';
import { useState } from 'react';

/**
 * Demo page that visualizes one of the two predefined workflows
 * (paper-to-code or chat-planning) on a WorkflowCanvas.
 *
 * The active step is purely local UI state: it can be changed with the range
 * slider or by clicking a node on the canvas. Nothing here talks to the backend.
 */
export default function WorkflowEditorPage() {
  const [selectedWorkflow, setSelectedWorkflow] = useState<'paper' | 'chat'>('paper');
  const [currentStep, setCurrentStep] = useState(2); // Demo: step 2 is active

  const steps = selectedWorkflow === 'paper' ? PAPER_TO_CODE_STEPS : CHAT_PLANNING_STEPS;

  // The two workflows have different step counts. When switching, clamp the
  // active index into the new list so the slider value never exceeds its max
  // and the step label never falls back to "N/A".
  const handleSelectWorkflow = (workflow: 'paper' | 'chat') => {
    const nextSteps = workflow === 'paper' ? PAPER_TO_CODE_STEPS : CHAT_PLANNING_STEPS;
    setSelectedWorkflow(workflow);
    setCurrentStep((prev) => Math.max(0, Math.min(prev, nextSteps.length - 1)));
  };

  return (
    <div className="space-y-6">
      {/* Header */}
      <motion.div
        initial={{ opacity: 0, y: -10 }}
        animate={{ opacity: 1, y: 0 }}
      >
        <h1 className="text-2xl font-bold text-gray-900">Workflow Editor</h1>
        <p className="text-gray-500 mt-1">
          Visualize and customize your code generation workflows
        </p>
      </motion.div>

      {/* Workflow Selection */}
      <Card>
        <div className="flex items-center space-x-4 mb-6">
          <span className="text-sm font-medium text-gray-700">Workflow:</span>
          <div className="flex space-x-2">
            <button
              onClick={() => handleSelectWorkflow('paper')}
              className={`px-4 py-2 text-sm font-medium rounded-lg transition-colors ${
                selectedWorkflow === 'paper'
                  ? 'bg-primary-50 text-primary-600'
                  : 'text-gray-600 hover:bg-gray-50'
              }`}
            >
              Paper to Code
            </button>
            <button
              onClick={() => handleSelectWorkflow('chat')}
              className={`px-4 py-2 text-sm font-medium rounded-lg transition-colors ${
                selectedWorkflow === 'chat'
                  ? 'bg-primary-50 text-primary-600'
                  : 'text-gray-600 hover:bg-gray-50'
              }`}
            >
              Chat Planning
            </button>
          </div>
        </div>

        {/* Step Selector for Demo */}
        <div className="flex items-center space-x-4 mb-6">
          <span className="text-sm font-medium text-gray-700">Current Step:</span>
          <input
            type="range"
            min="0"
            max={steps.length - 1}
            value={currentStep}
            onChange={(e) => setCurrentStep(parseInt(e.target.value, 10))}
            className="w-48"
          />
          <span className="text-sm text-gray-500">
            {steps[currentStep]?.title || 'N/A'}
          </span>
        </div>

        <WorkflowCanvas
          steps={steps}
          currentStepIndex={currentStep}
          onStepClick={(stepId) => {
            // Map the clicked node back to its position; ignore unknown ids.
            const index = steps.findIndex((s) => s.id === stepId);
            if (index !== -1) setCurrentStep(index);
          }}
        />
      </Card>

      {/* Info */}
      <Card>
        <h3 className="font-semibold text-gray-900 mb-4">About This View</h3>
        <p className="text-sm text-gray-600">
          The workflow editor allows you to visualize the code generation pipeline.
          Each node represents a step in the process, and the connections show the
          data flow between steps. Use this view to understand how DeepCode processes
          your inputs and generates code.
        </p>
        <ul className="mt-4 space-y-2 text-sm text-gray-600">
          <li className="flex items-center space-x-2">
            <span className="w-3 h-3 rounded-full bg-gray-300"></span>
            <span>Pending steps</span>
          </li>
          <li className="flex items-center space-x-2">
            <span className="w-3 h-3 rounded-full bg-primary-500"></span>
            <span>Active step</span>
          </li>
          <li className="flex items-center space-x-2">
            <span className="w-3 h-3 rounded-full bg-green-500"></span>
            <span>Completed steps</span>
          </li>
        </ul>
      </Card>
    </div>
  );
}


================================================
FILE: new_ui/frontend/src/pages/index.ts
================================================
export { default as HomePage } from './HomePage';
export { default as PaperToCodePage } from './PaperToCodePage';
export { default as ChatPlanningPage } from './ChatPlanningPage';
export { default as WorkflowEditorPage } from './WorkflowEditorPage';
export { default as SettingsPage } from './SettingsPage';


================================================
FILE: new_ui/frontend/src/services/api.ts
================================================
import axios from 'axios';
import type {
  TaskResponse,
  WorkflowStatusResponse,
  QuestionsResponse,
  RequirementsSummaryResponse,
  ConfigResponse,
  SettingsResponse,
  FileUploadResponse,
} from '../types/api';

// Shared axios instance used by every API group in this module.
// The base URL is relative, so requests go to the page's own origin under
// `/api/v1`; JSON is the default request content type.
const api = axios.create({
  baseURL: '/api/v1',
  // axios timeouts are expressed in milliseconds, i.e. 30 seconds here.
  timeout: 30000,
  headers: {
    'Content-Type': 'application/json',
  },
});

/**
 * Workflows API: start, inspect and cancel workflow tasks, plus the
 * user-in-loop interaction endpoints. All paths are relative to the shared
 * axios instance's base URL.
 */
export const workflowsApi = {
  /** POST `/workflows/paper-to-code` with a file path or URL as the source. */
  startPaperToCode: async (
    inputSource: string,
    inputType: 'file' | 'url',
    enableIndexing: boolean = false
  ): Promise<TaskResponse> => {
    const payload = {
      input_source: inputSource,
      input_type: inputType,
      enable_indexing: enableIndexing,
    };
    const { data } = await api.post<TaskResponse>('/workflows/paper-to-code', payload);
    return data;
  },

  /** POST `/workflows/chat-planning` with free-text requirements. */
  startChatPlanning: async (
    requirements: string,
    enableIndexing: boolean = false
  ): Promise<TaskResponse> => {
    const payload = {
      requirements,
      enable_indexing: enableIndexing,
    };
    const { data } = await api.post<TaskResponse>('/workflows/chat-planning', payload);
    return data;
  },

  /** GET the current status of a single task. */
  getStatus: async (taskId: string): Promise<WorkflowStatusResponse> => {
    const url = `/workflows/status/${taskId}`;
    const { data } = await api.get<WorkflowStatusResponse>(url);
    return data;
  },

  /** POST a cancel request for a task; the response body is ignored. */
  cancel: async (taskId: string): Promise<void> => {
    const url = `/workflows/cancel/${taskId}`;
    await api.post(url);
  },

  /** GET the list of tasks reported by `/workflows/active`. */
  getActiveTasks: async (): Promise<{
    tasks: {
      task_id: string;
      status: string;
      progress: number;
      message: string;
      started_at: string | null;
    }[];
  }> => {
    const { data } = await api.get('/workflows/active');
    return data;
  },

  /** GET the list of tasks reported by `/workflows/recent`, passing `limit` as a query parameter. */
  getRecentTasks: async (limit: number = 10): Promise<{
    tasks: {
      task_id: string;
      status: string;
      progress: number;
      message: string;
      result: Record<string, unknown> | null;
      error: string | null;
      started_at: string | null;
      completed_at: string | null;
    }[];
  }> => {
    const { data } = await api.get(`/workflows/recent?limit=${limit}`);
    return data;
  },

  // User-in-Loop interaction APIs

  /** POST the user's answer (or skip) for a pending interaction on a task. */
  respondToInteraction: async (
    taskId: string,
    action: string,
    data: Record<string, unknown> = {},
    skipped: boolean = false
  ): Promise<{ status: string; task_id: string; action: string }> => {
    const payload = { action, data, skipped };
    const reply = await api.post(`/workflows/respond/${taskId}`, payload);
    return reply.data;
  },

  /** GET the pending interaction, if any, for a task. */
  getInteraction: async (taskId: string): Promise<{
    has_interaction: boolean;
    task_id: string;
    status: string;
    interaction?: {
      type: string;
      title: string;
      description: string;
      data: Record<string, unknown>;
      options: Record<string, string>;
      required: boolean;
    };
  }> => {
    const { data } = await api.get(`/workflows/interaction/${taskId}`);
    return data;
  },
};

/**
 * Requirements API: generate clarifying questions, summarize answers into a
 * requirements document, and revise an existing document from feedback.
 */
export const requirementsApi = {
  /** POST `/requirements/questions` for an initial requirement text. */
  generateQuestions: async (
    initialRequirement: string
  ): Promise<QuestionsResponse> => {
    const payload = { initial_requirement: initialRequirement };
    const { data } = await api.post<QuestionsResponse>('/requirements/questions', payload);
    return data;
  },

  /** POST `/requirements/summarize` with the requirement and the user's answers. */
  summarize: async (
    initialRequirement: string,
    userAnswers: Record<string, string>
  ): Promise<RequirementsSummaryResponse> => {
    const payload = {
      initial_requirement: initialRequirement,
      user_answers: userAnswers,
    };
    const { data } = await api.post<RequirementsSummaryResponse>(
      '/requirements/summarize',
      payload
    );
    return data;
  },

  /** PUT `/requirements/modify` with the current document and the requested change. */
  modify: async (
    currentRequirements: string,
    modificationFeedback: string
  ): Promise<RequirementsSummaryResponse> => {
    const payload = {
      current_requirements: currentRequirements,
      modification_feedback: modificationFeedback,
    };
    const { data } = await api.put<RequirementsSummaryResponse>(
      '/requirements/modify',
      payload
    );
    return data;
  },
};

/** Config API: read settings and provider information, switch the LLM provider. */
export const configApi = {
  /** GET `/config/settings`. */
  getSettings: async (): Promise<SettingsResponse> => {
    const { data } = await api.get<SettingsResponse>('/config/settings');
    return data;
  },

  /** GET `/config/llm-providers`. */
  getLLMProviders: async (): Promise<ConfigResponse> => {
    const { data } = await api.get<ConfigResponse>('/config/llm-providers');
    return data;
  },

  /** PUT `/config/llm-provider` with the chosen provider; the response body is ignored. */
  setLLMProvider: async (provider: string): Promise<void> => {
    const payload = { provider };
    await api.put('/config/llm-provider', payload);
  },
};

/** Files API: upload a file, delete it, or look up its stored metadata. */
export const filesApi = {
  /** POST the file as multipart form data under the `file` field. */
  upload: async (file: File): Promise<FileUploadResponse> => {
    const body = new FormData();
    body.append('file', file);

    // Override the instance-wide JSON content type for this request only.
    const requestConfig = {
      headers: {
        'Content-Type': 'multipart/form-data',
      },
    };
    const { data } = await api.post<FileUploadResponse>('/files/upload', body, requestConfig);
    return data;
  },

  /** DELETE a previously uploaded file by id; the response body is ignored. */
  delete: async (fileId: string): Promise<void> => {
    const url = `/files/delete/${fileId}`;
    await api.delete(url);
  },

  /** GET the stored metadata of a previously uploaded file. */
  getInfo: async (fileId: string): Promise<FileUploadResponse> => {
    const url = `/files/info/${fileId}`;
    const { data } = await api.get<FileUploadResponse>(url);
    return data;
  },
};

export default api;


================================================
FILE: new_ui/frontend/src/stores/index.ts
================================================
export { useWorkflowStore } from './workflowStore';
export { useSessionStore } from './sessionStore';


================================================
FILE: new_ui/frontend/src/stores/sessionStore.ts
================================================
import { create } from 'zustand';
import { persist } from 'zustand/middleware';
import type { Message } from '../types/common';

/**
 * State and actions of the session store.
 *
 * Only `preferences` and `recentProjects` are written to persistent storage
 * (see the store's `partialize` option); the session id and conversation
 * history live in memory only.
 */
interface SessionState {
  // Session
  sessionId: string | null;

  // Conversation history (in insertion order; new messages are appended)
  conversationHistory: Message[];

  // User preferences
  preferences: {
    llmProvider: string;
    enableIndexing: boolean;
    theme: 'light' | 'dark';
  };

  // Recent projects (newest first)
  recentProjects: {
    id: string;
    name: string;
    type: string;
    timestamp: string;
  }[];

  // Actions
  setSessionId: (id: string | null) => void;
  // The store fills in `id` and `timestamp`, so callers pass neither.
  addMessage: (message: Omit<Message, 'id' | 'timestamp'>) => void;
  clearHistory: () => void;
  // Shallow-merges the given fields into the current preferences.
  updatePreferences: (prefs: Partial<SessionState['preferences']>) => void;
  // The store stamps the project with the current time and keeps at most 10 entries.
  addRecentProject: (project: Omit<SessionState['recentProjects'][0], 'timestamp'>) => void;
}

/**
 * Create a unique id for a conversation message.
 *
 * `crypto.randomUUID` is only exposed in secure contexts (HTTPS or localhost),
 * so fall back to a timestamp + random suffix when the page is served over
 * plain HTTP instead of throwing.
 */
function createMessageId(): string {
  if (typeof crypto !== 'undefined' && typeof crypto.randomUUID === 'function') {
    return crypto.randomUUID();
  }
  return `msg-${Date.now()}-${Math.random().toString(36).slice(2, 11)}`;
}

/**
 * Session store: conversation history, user preferences and recent projects.
 *
 * Persisted under the `deepcode-session` key; only `preferences` and
 * `recentProjects` are saved, so the session id and conversation history are
 * lost on reload.
 */
export const useSessionStore = create<SessionState>()(
  persist(
    (set, _get) => ({
      sessionId: null,
      conversationHistory: [],
      preferences: {
        llmProvider: 'google',
        enableIndexing: false,
        theme: 'light',
      },
      recentProjects: [],

      setSessionId: (id) => set({ sessionId: id }),

      // Append a message, stamping it with a fresh id and the current time.
      addMessage: (message) => {
        const newMessage: Message = {
          ...message,
          id: createMessageId(),
          timestamp: new Date().toISOString(),
        };
        set((state) => ({
          conversationHistory: [...state.conversationHistory, newMessage],
        }));
      },

      clearHistory: () => set({ conversationHistory: [] }),

      // Shallow merge: fields not present in `prefs` keep their current value.
      updatePreferences: (prefs) =>
        set((state) => ({
          preferences: { ...state.preferences, ...prefs },
        })),

      // Prepend the project and keep the 9 most recent existing entries,
      // so the list never holds more than 10 items.
      addRecentProject: (project) => {
        const newProject = {
          ...project,
          timestamp: new Date().toISOString(),
        };
        set((state) => ({
          recentProjects: [newProject, ...state.recentProjects.slice(0, 9)],
        }));
      },
    }),
    {
      name: 'deepcode-session',
      partialize: (state) => ({
        preferences: state.preferences,
        recentProjects: state.recentProjects,
      }),
    }
  )
);


================================================
FILE: new_ui/frontend/src/stores/workflowStore.ts
================================================
import { create } from 'zustand';
import { persist } from 'zustand/middleware';
import type {
  WorkflowStatus,
  WorkflowStep,
} from '../types/workflow';

/**
 * One line of the workflow activity log.
 * Entries are created by the store's `addActivityLog` action, which generates
 * `id` and sets `timestamp` to the time of the call.
 */
interface ActivityLogEntry {
  id: string;
  timestamp: Date;
  message: string;
  // Progress value supplied by the caller alongside the message.
  progress: number;
  type: 'info' | 'success' | 'warning' | 'error' | 'progress';
}

/**
 * User-in-Loop interaction that is awaiting a response from the user.
 * While one is set in the store, `isWaitingForInput` is true.
 */
export interface PendingInteraction {
  type: string;  // 'requirement_questions' | 'plan_review' | etc.
  title: string;
  description: string;
  // Interaction payload. The named fields are all optional and any additional
  // keys are allowed through the index signature.
  data: {
    questions?: Array<{
      id: string;
      question: string;
      category?: string;
      importance?: string;
      hint?: string;
    }>;
    plan?: string;
    plan_preview?: string;
    original_input?: string;
    [key: string]: unknown;
  };
  // String-to-string map of choices — NOTE(review): presumably action id -> label; confirm against the backend.
  options: Record<string, string>;
  required: boolean;
}

/**
 * State and actions of the workflow store, which tracks a single active
 * workflow task from start to result/error.
 */
interface WorkflowState {
  // Current task
  activeTaskId: string | null;
  workflowType: 'paper-to-code' | 'chat-planning' | null;  // Track workflow type
  status: WorkflowStatus;
  progress: number;
  message: string;

  // Steps
  steps: WorkflowStep[];
  currentStepIndex: number;  // -1 when no step threshold has been reached

  // Streaming data
  streamedCode: string;
  currentFile: string | null;
  generatedFiles: string[];

  // Activity logs
  activityLogs: ActivityLogEntry[];

  // User-in-Loop interaction
  pendingInteraction: PendingInteraction | null;
  isWaitingForInput: boolean;

  // Results
  result: Record<string, unknown> | null;
  error: string | null;

  // Recovery
  needsRecovery: boolean;  // Flag to indicate if we need to recover a task

  // Actions
  // Omitting workflowType keeps the currently stored one.
  setActiveTask: (taskId: string | null, workflowType?: 'paper-to-code' | 'chat-planning') => void;
  setStatus: (status: WorkflowStatus) => void;
  // Also recomputes currentStepIndex and every step's status from `progress`.
  updateProgress: (progress: number, message: string) => void;
  setSteps: (steps: WorkflowStep[]) => void;
  updateStepStatus: (stepId: string, status: WorkflowStep['status']) => void;
  appendStreamedCode: (chunk: string) => void;
  setCurrentFile: (filename: string | null) => void;
  addGeneratedFile: (filename: string) => void;
  // `type` defaults to 'progress' when omitted.
  addActivityLog: (message: string, progress: number, type?: ActivityLogEntry['type']) => void;
  // Also sets isWaitingForInput to whether the interaction is non-null.
  setPendingInteraction: (interaction: PendingInteraction | null) => void;
  clearInteraction: () => void;
  setResult: (result: Record<string, unknown> | null) => void;
  // A non-null error also switches status to 'error'.
  setError: (error: string | null) => void;
  setNeedsRecovery: (needs: boolean) => void;
  // Restores the initial state and removes the persisted localStorage entry.
  reset: () => void;
}

// Starting values for every data field of the workflow store. Spread into the
// store on creation and re-applied by `reset`. The `as` casts widen literal
// types (null, 'idle', []) to the unions/arrays declared in WorkflowState.
const initialState = {
  activeTaskId: null,
  workflowType: null as 'paper-to-code' | 'chat-planning' | null,
  status: 'idle' as WorkflowStatus,
  progress: 0,
  message: '',
  steps: [],
  // -1 means no step is current yet.
  currentStepIndex: -1,
  streamedCode: '',
  currentFile: null,
  generatedFiles: [],
  activityLogs: [] as ActivityLogEntry[],
  pendingInteraction: null as PendingInteraction | null,
  isWaitingForInput: false,
  result: null,
  error: null,
  needsRecovery: false,
};

/**
 * Workflow store: tracks the active task, its progress and per-step status,
 * streamed code, activity logs, pending user interactions and the final
 * result or error.
 *
 * A subset of the state is persisted under the `deepcode-workflow` key so a
 * running (or input-waiting) task can be recovered after a page reload.
 */
export const useWorkflowStore = create<WorkflowState>()(
  persist(
    (set, get) => ({
      ...initialState,

      // Keep the previously stored workflow type when the caller omits it.
      setActiveTask: (taskId, workflowType) =>
        set({
          activeTaskId: taskId,
          workflowType: workflowType ?? get().workflowType,
        }),

      setStatus: (status) => {
        console.log('[workflowStore] setStatus:', status);
        set({ status });
      },

      // Store the new progress/message and derive step statuses from it.
      updateProgress: (progress, message) => {
        const { steps } = get();

        // The current step is the last one whose threshold has been reached;
        // it stays -1 when progress is below every threshold.
        let currentStepIndex = -1;
        for (let i = steps.length - 1; i >= 0; i--) {
          if (progress >= steps[i].progress) {
            currentStepIndex = i;
            break;
          }
        }

        // Check if workflow is complete (progress >= 100)
        const isComplete = progress >= 100;

        // Steps before the current one are completed, the current one is
        // active and later ones are pending; at completion all are completed.
        const updatedSteps: WorkflowStep[] = steps.map((step, index) => {
          let status: WorkflowStep['status'];
          if (isComplete || index < currentStepIndex) {
            status = 'completed';
          } else if (index === currentStepIndex) {
            status = 'active';
          } else {
            status = 'pending';
          }
          return { ...step, status };
        });

        set({
          progress,
          message,
          currentStepIndex: isComplete ? steps.length - 1 : currentStepIndex,
          steps: updatedSteps,
        });
      },

      setSteps: (steps) => set({ steps }),

      // Replace the status of the step with the given id; other steps are untouched.
      updateStepStatus: (stepId, status) => {
        const { steps } = get();
        const updatedSteps = steps.map((step) =>
          step.id === stepId ? { ...step, status } : step
        );
        set({ steps: updatedSteps });
      },

      appendStreamedCode: (chunk) =>
        set((state) => ({
          streamedCode: state.streamedCode + chunk,
        })),

      setCurrentFile: (filename) => set({ currentFile: filename }),

      addGeneratedFile: (filename) =>
        set((state) => ({
          generatedFiles: [...state.generatedFiles, filename],
        })),

      addActivityLog: (message, progress, type = 'progress') =>
        set((state) => ({
          activityLogs: [
            ...state.activityLogs,
            {
              // Timestamp plus a 9-character random suffix keeps ids unique
              // even for entries logged within the same millisecond.
              // `slice(2, 11)` replaces the deprecated `substr(2, 9)`.
              id: `log-${Date.now()}-${Math.random().toString(36).slice(2, 11)}`,
              timestamp: new Date(),
              message,
              progress,
              type,
            },
          ],
        })),

      setPendingInteraction: (interaction) => {
        console.log('[workflowStore] setPendingInteraction:', interaction?.type);
        set({
          pendingInteraction: interaction,
          isWaitingForInput: interaction !== null,
        });
      },

      clearInteraction: () => {
        console.log('[workflowStore] clearInteraction');
        set({
          pendingInteraction: null,
          isWaitingForInput: false,
        });
      },

      setResult: (result) => {
        console.log('[workflowStore] setResult:', result);
        set({ result });
      },

      // A non-null error forces status to 'error'; clearing it leaves status as is.
      setError: (error) => set({ error, status: error ? 'error' : get().status }),

      setNeedsRecovery: (needs) => set({ needsRecovery: needs }),

      reset: () => {
        console.log('[workflowStore] Resetting state and clearing localStorage');
        // Clear localStorage explicitly to ensure clean state
        try {
          localStorage.removeItem('deepcode-workflow');
        } catch (e) {
          console.error('[workflowStore] Failed to clear localStorage:', e);
        }
        // NOTE(review): this `set` goes through the persist middleware, which
        // presumably writes the (idle) partialized state back — confirm.
        set(initialState);
      },
    }),
    {
      name: 'deepcode-workflow',
      // Only persist task-related data for recovery when task is running or waiting
      partialize: (state) => {
        const isActive = state.status === 'running' || state.isWaitingForInput;
        return {
          // Only persist activeTaskId if task is still running or waiting for input
          // This prevents trying to recover completed/errored tasks
          activeTaskId: isActive ? state.activeTaskId : null,
          workflowType: isActive ? state.workflowType : null,
          status: isActive ? state.status : 'idle',
          progress: isActive ? state.progress : 0,
          steps: isActive ? state.steps : [],
          isWaitingForInput: state.isWaitingForInput,
        };
      },
    }
  )
);


================================================
FILE: new_ui/frontend/src/types/api.ts
================================================
// API types

/** Response to starting a workflow (paper-to-code or chat-planning). */
export interface TaskResponse {
  task_id: string;
  status: string;
  message: string;
  created_at?: string;
}

/** Response of the workflow status endpoint for a single task. */
export interface WorkflowStatusResponse {
  task_id: string;
  status: string;
  progress: number;
  message: string;
  // Optional fields: each may be absent from a given response.
  result?: Record<string, unknown>;
  error?: string;
  started_at?: string;
  completed_at?: string;
}

/** Response of the requirements question-generation endpoint. */
export interface QuestionsResponse {
  questions: Question[];
  status: string;
}

/**
 * A single clarifying question. Used in QuestionsResponse and in the data
 * payload of WSInteractionMessage.
 */
export interface Question {
  id: string;
  question: string;
  category?: string;
  importance?: string;
  hint?: string;
}

/** Response of the requirements summarize and modify endpoints. */
export interface RequirementsSummaryResponse {
  summary: string;
  status: string;
}

/** Response of the LLM providers endpoint: the active provider plus the available ones. */
export interface ConfigResponse {
  llm_provider: string;
  available_providers: string[];
  // String-to-string map; the settings UI reads keys such as `planning` and `implementation`.
  models: Record<string, string>;
  indexing_enabled: boolean;
}

/** Response of the settings endpoint. */
export interface SettingsResponse {
  llm_provider: string;
  // String-to-string map; the settings UI reads keys such as `planning` and `implementation`.
  models: Record<string, string>;
  indexing_enabled: boolean;
  // Untyped on the client — NOTE(review): schema is defined by the backend; confirm before relying on specific keys.
  document_segmentation: Record<string, unknown>;
}

/** Metadata of an uploaded file, returned by the file upload and file info endpoints. */
export interface FileUploadResponse {
  file_id: string;
  filename: string;
  path: string;
  // NOTE(review): presumably the size in bytes — confirm against the backend.
  size: number;
}

/** Shape of an error payload; only `error` is mandatory. */
export interface ErrorResponse {
  error: string;
  detail?: string;
  code?: string;
}

// WebSocket message types
/**
 * Progress, status or heartbeat message for a task. The payload fields are
 * optional; which ones are present for each `type` is not fixed by this type.
 */
export interface WSProgressMessage {
  type: 'progress' | 'status' | 'heartbeat';
  task_id: string;
  progress?: number;
  message?: string;
  status?: string;
  timestamp: string;
}

/** Completion message for a task, carrying its result object. */
export interface WSCompleteMessage {
  type: 'complete';
  task_id: string;
  status: string;
  result: Record<string, unknown>;
  timestamp: string;
}

/** Error message for a task, carrying the error text. */
export interface WSErrorMessage {
  type: 'error';
  task_id: string;
  error: string;
  timestamp: string;
}

/**
 * Code streaming message: a chunk of content or a file start/end marker.
 * `content` and `filename` are both optional at the type level.
 */
export interface WSCodeChunkMessage {
  type: 'code_chunk' | 'file_start' | 'file_end';
  task_id: string;
  content?: string;
  filename?: string;
  timestamp: string;
}

/**
 * Log line forwarded over the socket. Unlike the other message types it has
 * no `task_id` field.
 */
export interface WSLogMessage {
  type: 'log';
  level: 'INFO' | 'WARNING' | 'ERROR' | 'DEBUG';
  message: string;
  namespace: string;
  timestamp: string;
}

/**
 * User-in-Loop interaction message: the task needs input from the user
 * before it can continue.
 */
export interface WSInteractionMessage {
  type: 'interaction_required';
  task_id: string;
  // The union with `string` widens this to plain string for the type checker;
  // the literals only document the known values.
  interaction_type: 'requirement_questions' | 'plan_review' | 'code_review' | string;
  title: string;
  description: string;
  // Interaction payload; named fields are optional and extra keys are allowed.
  data: {
    questions?: Question[];
    plan?: string;
    plan_preview?: string;
    original_input?: string;
    [key: string]: unknown;
  };
  options: Record<string, string>;
  required: boolean;
  timestamp: string;
}

/** Union of every WebSocket message shape; narrow it by checking the `type` field. */
export type WSMessage =
  | WSProgressMessage
  | WSCompleteMessage
  | WSErrorMessage
  | WSCodeChunkMessage
  | WSLogMessage
  | WSInteractionMessage;


================================================
FILE: new_ui/frontend/src/types/common.ts
================================================
// Common types

/** One entry of the conversation history. */
export interface Message {
  id: string;
  role: 'user' | 'assistant' | 'system';
  content: string;
  // The session store writes this as an ISO 8601 string (Date#toISOString).
  timestamp: string;
  metadata?: Record<string, unknown>;
}

/** A user-facing notification with a severity, a title and optional details. */
export interface Notification {
  id: string;
  type: 'success' | 'error' | 'warning' | 'info';
  title: string;
  description?: string;
  // NOTE(review): unit is not stated here — presumably milliseconds; confirm at the usage site.
  duration?: number;
}

/** Layout options: sidebar size, which panels are shown, and the split between them. */
export interface LayoutConfig {
  // NOTE(review): unit (px vs. other) is not stated here — confirm at the usage site.
  sidebarWidth: number;
  showCodePreview: boolean;
  showWorkflowCanvas: boolean;
  // NOTE(review): range is not stated here — presumably a 0..1 fraction; confirm.
  splitRatio: number;
}

/** Identifier of a top-level task/view of the application. */
export type TaskType = 'paper-to-code' | 'chat-planning' | 'workflow-editor' | 'settings';


================================================
FILE: new_ui/frontend/src/types/index.ts
================================================
export * from './workflow';
export * from './api';
export * from './common';


================================================
FILE: new_ui/frontend/src/types/workflow.ts
================================================
// Workflow types

/** Lifecycle state of a workflow task; 'idle' is the store's initial value. */
export type WorkflowStatus = 'idle' | 'running' | 'completed' | 'error' | 'cancelled';

/** One node of a workflow pipeline as shown in the UI. */
export interface WorkflowStep {
  id: string;
  title: string;
  subtitle: string;
  // Progress threshold: the workflow store treats the last step whose
  // threshold is <= the reported progress as the current step.
  progress: number;
  status: 'pending' | 'active' | 'completed' | 'error';
}

/** Client-side (camelCase) view of a workflow task and its outcome. */
export interface WorkflowTask {
  taskId: string;
  status: WorkflowStatus;
  progress: number;
  message: string;
  result?: Record<string, unknown>;
  error?: string;
  startedAt?: string;
  completedAt?: string;
}

/** Parameters describing a workflow to start. */
export interface WorkflowInput {
  type: 'paper-to-code' | 'chat-planning';
  inputSource: string;
  inputType: 'file' | 'url' | 'chat';
  enableIndexing: boolean;
}

// Workflow step definitions
// Steps of the paper-to-code workflow in display order. `progress` values are
// ascending thresholds (5 .. 85); every step starts out 'pending'.
export const PAPER_TO_CODE_STEPS: WorkflowStep[] = [
  { id: 'init', title: 'Initialize', subtitle: 'Load systems', progress: 5, status: 'pending' },
  { id: 'analyze', title: 'Analyze', subtitle: 'Parse paper', progress: 10, status: 'pending' },
  { id: 'download', title: 'Download', subtitle: 'Collect refs', progress: 25, status: 'pending' },
  { id: 'plan', title: 'Plan', subtitle: 'Blueprint', progress: 40, status: 'pending' },
  { id: 'references', title: 'References', subtitle: 'Key refs', progress: 50, status: 'pending' },
  { id: 'repos', title: 'Repos', subtitle: 'GitHub sync', progress: 60, status: 'pending' },
  { id: 'index', title: 'Index', subtitle: 'Vectorize', progress: 70, status: 'pending' },
  { id: 'implement', title: 'Implement', subtitle: 'Code gen', progress: 85, status: 'pending' },
];

// Steps of the chat-planning workflow in display order. `progress` values are
// ascending thresholds (5 .. 85); every step starts out 'pending'.
export const CHAT_PLANNING_STEPS: WorkflowStep[] = [
  { id: 'init', title: 'Initialize', subtitle: 'Boot agents', progress: 5, status: 'pending' },
  { id: 'plan', title: 'Plan', subtitle: 'Analyze intent', progress: 30, status: 'pending' },
  { id: 'setup', title: 'Setup', subtitle: 'Workspace', progress: 50, status: 'pending' },
  { id: 'draft', title: 'Draft', subtitle: 'Generate plan', progress: 70, status: 'pending' },
  { id: 'implement', title: 'Implement', subtitle: 'Code gen', progress: 85, status: 'pending' },
];


================================================
FILE: new_ui/frontend/tailwind.config.js
================================================
/** @type {import('tailwindcss').Config} */
export default {
  // Files scanned for class names.
  content: [
    "./index.html",
    "./src/**/*.{js,ts,jsx,tsx}",
  ],
  theme: {
    // Everything below is added on top of the default theme rather than replacing it.
    extend: {
      colors: {
        // Brand palette, used as e.g. `bg-primary-50` / `text-primary-600`.
        primary: {
          50: '#eff6ff',
          100: '#dbeafe',
          200: '#bfdbfe',
          300: '#93c5fd',
          400: '#60a5fa',
          500: '#3b82f6',
          600: '#2563eb',
          700: '#1d4ed8',
          800: '#1e40af',
          900: '#1e3a8a',
        },
        // Explicit gray scale, used as e.g. `text-gray-500`.
        gray: {
          50: '#f9fafb',
          100: '#f3f4f6',
          200: '#e5e7eb',
          300: '#d1d5db',
          400: '#9ca3af',
          500: '#6b7280',
          600: '#4b5563',
          700: '#374151',
          800: '#1f2937',
          900: '#111827',
        },
      },
      fontFamily: {
        sans: ['Inter', 'system-ui', 'sans-serif'],
        mono: ['JetBrains Mono', 'Menlo', 'Monaco', 'monospace'],
      },
      animation: {
        // `pulse` is not defined in the keyframes below; it is expected to
        // come from the default theme.
        'pulse-slow': 'pulse 3s cubic-bezier(0.4, 0, 0.6, 1) infinite',
        // `slideIn` and `fadeIn` refer to the keyframes defined below.
        'slide-in': 'slideIn 0.3s ease-out',
        'fade-in': 'fadeIn 0.2s ease-out',
      },
      keyframes: {
        // Slide 10px in from the left while fading in.
        slideIn: {
          '0%': { transform: 'translateX(-10px)', opacity: '0' },
          '100%': { transform: 'translateX(0)', opacity: '1' },
        },
        fadeIn: {
          '0%': { opacity: '0' },
          '100%': { opacity: '1' },
        },
      },
    },
  },
  plugins: [],
}


================================================
FILE: new_ui/frontend/tsconfig.json
================================================
{
  "compilerOptions": {
    "target": "ES2020",
    "useDefineForClassFields": true,
    "lib": ["ES2020", "DOM", "DOM.Iterable"],
    "module": "ESNext",
    "skipLibCheck": true,
    "moduleResolution": "bundler",
    "allowImportingTsExtensions": true,
    "resolveJsonModule": true,
    "isolatedModules": true,
    "noEmit": true,
    "jsx": "react-jsx",
    "strict": true,
    "noUnusedLocals": true,
    "noUnusedParameters": true,
    "noFallthroughCasesInSwitch": true,
    "baseUrl": ".",
    "paths": {
      "@/*": ["src/*"]
    }
  },
  "include": ["src"],
  "references": [{ "path": "./tsconfig.node.json" }]
}


================================================
FILE: new_ui/frontend/tsconfig.node.json
================================================
{
  "compilerOptions": {
    "composite": true,
    "skipLibCheck": true,
    "module": "ESNext",
    "moduleResolution": "bundler",
    "allowSyntheticDefaultImports": true
  },
  "include": ["vite.config.ts"]
}


================================================
FILE: new_ui/frontend/vite.config.ts
================================================
import { defineConfig } from 'vite'
import react from '@vitejs/plugin-react'
import path from 'path'

// https://vitejs.dev/config/
export default defineConfig({
  plugins: [react()],
  resolve: {
    alias: {
      // `@/...` resolves to `./src/...`; tsconfig.json declares the matching `@/*` path mapping.
      '@': path.resolve(__dirname, './src'),
    },
  },
  server: {
    port: 5173,
    // Dev-server proxy: forward API and WebSocket traffic to the backend on port 8000.
    proxy: {
      '/api': {
        target: 'http://localhost:8000',
        changeOrigin: true,
      },
      '/ws': {
        target: 'ws://localhost:8000',
        // Enable WebSocket proxying for this prefix.
        ws: true,
      },
    },
  },
})


================================================
FILE: new_ui/scripts/build.sh
================================================
#!/bin/bash
# DeepCode New UI - Production Build Script
#
# Builds the React frontend with npm, then prints the commands needed to run
# the backend and serve the built frontend. Stops at the first failing command.

set -e

# Paths are derived from this script's own location, so the caller's working
# directory does not matter.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_ROOT="$(cd "$SCRIPT_DIR/.." && pwd)"

# Colors
GREEN='\033[0;32m'
BLUE='\033[0;34m'
NC='\033[0m' # No Color

# Print a progress line in blue.
step() { echo -e "${BLUE}$1${NC}"; }

# Print a success line in green.
ok() { echo -e "${GREEN}$1${NC}"; }

echo "🏗️  Building DeepCode New UI for Production..."
echo ""

# --- Frontend -------------------------------------------------------------
step "📦 Building React Frontend..."
cd "$PROJECT_ROOT/frontend"

# Dependencies are only installed when node_modules is absent.
if ! [ -d "node_modules" ]; then
    echo "Installing npm dependencies..."
    npm install
fi

npm run build

ok "✓ Frontend built successfully!"
echo "  Output: $PROJECT_ROOT/frontend/dist"
echo ""

# --- Backend --------------------------------------------------------------
# Nothing to compile for the Python backend; just report it.
step "📦 Backend is ready (Python - no build required)"
echo ""

# --- Summary --------------------------------------------------------------
echo "=========================================="
ok "🎉 Build complete!"
cat <<EOF

To run in production:

  Backend:
    cd $PROJECT_ROOT/backend
    uvicorn main:app --host 0.0.0.0 --port 8000

  Frontend (serve static files):
    npx serve $PROJECT_ROOT/frontend/dist

==========================================
EOF


================================================
FILE: new_ui/scripts/start_dev.sh
================================================
#!/bin/bash
# DeepCode New UI - Development Startup Script
#
# Starts the FastAPI backend (uvicorn, port 8000) and the React frontend
# (npm run dev, port 5173) as background jobs, then waits until they exit.
# Both are stopped when this script exits (e.g. on Ctrl+C).

set -e

# Paths are derived from this script's own location, so the caller's working
# directory does not matter.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
PROJECT_ROOT="$(cd "$SCRIPT_DIR/.." && pwd)"

echo "🚀 Starting DeepCode New UI Development Environment..."
echo ""

# Colors
GREEN='\033[0;32m'
BLUE='\033[0;34m'
NC='\033[0m' # No Color

# Sanity check: the backend entry point must exist next to this script's
# parent directory. The check does not depend on the current directory, so the
# message reports the path that was actually probed.
if [ ! -f "$PROJECT_ROOT/backend/main.py" ]; then
    echo "❌ Error: backend entry point not found: $PROJECT_ROOT/backend/main.py" >&2
    exit 1
fi

# PIDs of the background services; filled in once each one is launched.
BACKEND_PID=""
FRONTEND_PID=""

# Function to cleanup on exit
cleanup() {
    echo ""
    echo "🛑 Shutting down..."
    # Stop the services we launched by their recorded PIDs first, so cleanup
    # still works on systems where pkill is not installed.
    local pid
    for pid in "$BACKEND_PID" "$FRONTEND_PID"; do
        if [ -n "$pid" ]; then
            kill "$pid" 2>/dev/null || true
        fi
    done
    # Then sweep any remaining direct children of this shell.
    pkill -P $$ 2>/dev/null || true
}
trap cleanup EXIT

# Start Backend
echo -e "${BLUE}📦 Starting FastAPI Backend...${NC}"
cd "$PROJECT_ROOT/backend"

# Check if pydantic-settings is installed
if ! python -c "import pydantic_settings" 2>/dev/null; then
    echo "Installing pydantic-settings..."
    # Use "python -m pip" so the package is installed into the same interpreter
    # that was just probed; a bare "pip" may belong to a different Python.
    python -m pip install pydantic-settings
fi

# Start uvicorn in background
python -m uvicorn main:app --reload --host 0.0.0.0 --port 8000 &
BACKEND_PID=$!
echo -e "${GREEN}✓ Backend started on http://localhost:8000${NC}"
echo ""

# Start Frontend
echo -e "${BLUE}📦 Starting React Frontend...${NC}"
cd "$PROJECT_ROOT/frontend"

# Check if node_modules exists
if [ ! -d "node_modules" ]; then
    echo "Installing npm dependencies..."
    npm install
fi

# Start vite in background
npm run dev &
FRONTEND_PID=$!
echo -e "${GREEN}✓ Frontend started on http://localhost:5173${NC}"
echo ""

echo "=========================================="
echo -e "${GREEN}🎉 DeepCode New UI is running!${NC}"
echo ""
echo "  Frontend: http://localhost:5173"
echo "  Backend:  http://localhost:8000"
echo "  API Docs: http://localhost:8000/docs"
echo ""
echo "Press Ctrl+C to stop all services"
echo "=========================================="

# Wait for both processes
wait


================================================
FILE: prompts/code_prompts.py
================================================
"""
Prompt templates for the DeepCode agent system.

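RECENT UPDATES (optimized for paper-to-code reproduction):
1. Simplified and optimized the file-structure generation logic so the resulting structure is concise and logical
2. Explicitly identify the core files and components to reproduce, letting the LLM judge their priority
3. Improved the efficiency of information summarization across collaborating agents, reducing redundant information passing
4. Removed secondary information such as timelines to focus on high-quality code reproduction
5. Improved conciseness and readability while keeping the prompts complete
6. Adopted a clearer structured format that is easier for the LLM to understand and execute

Core improvements:
- PAPER_ALGORITHM_ANALYSIS_PROMPT: focuses on algorithm extraction and makes implementation priorities explicit
- PAPER_CONCEPT_ANALYSIS_PROMPT: focuses on system architecture and highlights the concept-to-code mapping
- CODE_PLANNING_PROMPT: integrates the outputs of the two prompts above to produce a high-quality reproduction plan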
"""

# Paper to Code Workflow Prompts

# Prompt for the input-analysis step. It tells the model to scan the input for
# a file path or URL (using the first valid one), classify the input as
# text / file / directory / url, copy requirements verbatim from
# additional_input, and reply with nothing but the raw JSON object shown at the
# end of the prompt.
PAPER_INPUT_ANALYZER_PROMPT = """You are a precise input analyzer for paper-to-code tasks. You MUST return only a JSON object with no additional text.

Task: Analyze input text and identify file paths/URLs to determine appropriate input type.

Input Analysis Rules:
1. Path Detection:
   - Scan input text for file paths or URLs
   - Use first valid path/URL if multiple found
   - Treat as text input if no valid path/URL found

2. Path Type Classification:
   - URL (starts with http:// or https://): input_type = "url", path = "detected URL"
   - PDF file path: input_type = "file", path = "detected file path"
   - Directory path: input_type = "directory", path = "detected directory path"
   - No path/URL detected: input_type = "text", path = null

3. Requirements Analysis:
   - Extract ONLY requirements from additional_input
   - DO NOT modify or interpret requirements

CRITICAL OUTPUT RESTRICTIONS:
- RETURN ONLY RAW JSON - NO TEXT BEFORE OR AFTER
- NO markdown code blocks (```json)
- NO explanatory text or descriptions
- NO tool call information
- NO analysis summaries
- JUST THE JSON OBJECT BELOW

{
    "input_type": "text|file|directory|url",
    "path": "detected path or URL or null",
    "paper_info": {
        "title": "N/A for text input",
        "authors": ["N/A for text input"],
        "year": "N/A for text input"
    },
    "requirements": [
        "exact requirement from additional_input"
    ]
}
"""

# Prompt for the paper-download step. Its "Input Format" mirrors the JSON shape
# requested by PAPER_INPUT_ANALYZER_PROMPT. Depending on input_type it directs
# the model to use the download_file_to tool (url) or the move_file_to tool
# (file), to report failure for directories, and to skip file operations for
# plain text; the final reply must be a raw JSON status object.
# The braces in {PAPER_ID} are literal text in this plain (non-f) string; the
# prompt itself says the ID arrives as a "PAPER_ID=<number>" message prefix.
# NOTE(review): the "CRITICAL OUTPUT RESTRICTIONS" section appears twice with
# slightly different wording — confirm whether the repetition is intentional.
PAPER_DOWNLOADER_PROMPT = """You are a precise paper downloader that processes input from PaperInputAnalyzerAgent.

Task: Handle paper according to input type and save to "./deepcode_lab/papers/id/id.md"
Note: The paper ID will be provided at the start of the message as "PAPER_ID=<number>". Use this EXACT number.

CRITICAL RULES:
- Use the EXACT paper ID provided in the message (PAPER_ID=X).
- Save path MUST be: ./deepcode_lab/papers/{PAPER_ID}/{PAPER_ID}.md

CRITICAL OUTPUT RESTRICTIONS:
- RETURN ONLY THE RAW JSON OBJECT DESCRIBED BELOW
- NO markdown code fences (```json)
- NO explanatory or conversational text before or after the JSON
- NO tool call commentary or step-by-step narration in the final reply
- IF YOU NEED TO EXPLAIN YOUR ACTIONS, DO SO THROUGH TOOL CALLS ONLY. THE FINAL ASSISTANT MESSAGE MUST BE JSON.

Processing Rules:
1. URL Input (input_type = "url"):
   - Use download_file_to tool with: url=<url>, destination="./deepcode_lab/papers/{PAPER_ID}/", filename="{PAPER_ID}.md"
   - Extract metadata (title, authors, year)
   - Return saved file path and metadata

2. File Input (input_type = "file"):
   - Use move_file_to tool with: source=<file_path>, destination="./deepcode_lab/papers/{PAPER_ID}/{PAPER_ID}.md"
   - The tool will automatically convert PDF/documents to .md format
   - NEVER manually extract content or use write_file - let the conversion tools handle this
   - Note: Original file is preserved, only a copy is placed in target directory
   - Return new saved file path and metadata

3. Directory Input (input_type = "directory"):
   - Verify directory exists
   - Return to PaperInputAnalyzerAgent for processing
   - Set status as "failure" with message

4. Text Input (input_type = "text"):
   - No file operations needed
   - Set paper_path as null
   - Use paper_info from input

Input Format:
{
    "input_type": "file|directory|url|text",
    "path": "detected path or null",
    "paper_info": {
        "title": "paper title or N/A",
        "authors": ["author names or N/A"],
        "year": "publication year or N/A"
    },
    "requirements": ["requirement1", "requirement2"]
}

CRITICAL OUTPUT RESTRICTIONS:
- RETURN ONLY RAW JSON - NO TEXT BEFORE OR AFTER
- NO markdown code blocks (```json)
- NO explanatory text or descriptions
- NO tool call information
- NO analysis summaries
- JUST THE JSON OBJECT BELOW

Output Format (MANDATORY - EXACT FORMAT):
{
    "status": "success|failure",
    "paper_path": "./deepcode_lab/papers/{PAPER_ID}/{PAPER_ID}.md (or null for text input)",
    "metadata": {
        "title": "extracted or provided title",
        "authors": ["extracted or provided authors"],
        "year": "extracted or provided year"
    }
}

Example: If PAPER_ID=14, then paper_path should be "./deepcode_lab/papers/14/14.md"
"""

# Prompt for the reference-analysis step. It asks the model to pick the five
# most relevant references that have GitHub repositories (excluding the target
# paper's own implementation), scored with the weights stated in the prompt:
# repository quality 40%, implementation relevance 30%, technical depth 20%,
# academic influence 10%. The reply is a JSON object with a ranked
# "selected_references" list plus summary fields.
PAPER_REFERENCE_ANALYZER_PROMPT = """You are an expert academic paper reference analyzer specializing in computer science and machine learning.

Task: Analyze paper and identify 5 most relevant references that have GitHub repositories.

Constraints:
- ONLY select references with GitHub repositories
- DO NOT use target paper's official implementation
- DO NOT use repositories directly associated with target paper
- CAN analyze code implementations from referenced papers
- Focus on references with good implementations solving similar problems

Analysis Criteria:
1. GitHub Repository Quality (40%):
   - Star count, activity, maintenance
   - Documentation quality
   - Community adoption
   - Last update date

2. Implementation Relevance (30%):
   - References from methodology/implementation sections
   - Algorithmic details
   - Core component descriptions
   - Code implementation quality

3. Technical Depth (20%):
   - Algorithm/method similarity
   - Technical foundation relationship
   - Implementation details
   - Code structure

4. Academic Influence (10%):
   - Publication venue quality
   - Author expertise
   - Research impact
   - Citation influence

Analysis Steps:
1. Extract all references from paper
2. Filter references with GitHub repositories
3. Analyze repositories based on criteria
4. Calculate relevance scores
5. Select and rank top 5 references

Output Format:
{
    "selected_references": [
        {
            "rank": 1,
            "title": "paper title",
            "authors": ["author1", "author2"],
            "year": "publication year",
            "relevance_score": 0.95,
            "citation_context": "how cited in main paper",
            "key_contributions": ["contribution1", "contribution2"],
            "implementation_value": "why valuable for implementation",
            "github_info": {
                "repository_url": "GitHub repository URL",
                "stars_count": "number of stars",
                "last_updated": "last update date",
                "repository_quality": "repository quality assessment",
                "key_features": ["feature1", "feature2"],
                "documentation_quality": "documentation assessment",
                "community_activity": "community engagement description"
            },
            "original_reference": "Complete reference text from paper"
        }
    ],
    "analysis_summary": "selection process and key findings",
    "github_repositories_found": "total number of references with GitHub repositories"
}
"""

# Prompt for the repository-download step. It directs the model to download
# each repository into {paper_dir}/code_base/ by running a download script
# through the interpreter tool, and to report per-repository status as JSON.
# NOTE(review): {paper_dir} is literal text in this plain (non-f) string and is
# not substituted in this module — confirm how the caller supplies the actual
# directory.
GITHUB_DOWNLOAD_PROMPT = """You are an expert GitHub repository downloader.

Task: Download GitHub repositories to specified directory structure.

Process:
1. For each repository:
   - Create directory: {paper_dir}/code_base/
   - Download repository to directory

Requirements:
- Use interpreter tool to execute download script
- Monitor interpreter output for errors/warnings
- Verify download status through interpreter response

Output Format:
{
    "downloaded_repos": [
        {
            "reference_number": "1",
            "paper_title": "paper title",
            "repo_url": "github repository URL",
            "save_path": "{paper_dir}/code_base/name_of_repo",
            "status": "success|failed",
            "notes": "relevant notes about download"
        }
    ],
    "summary": "Brief summary of download process"
}
"""

# Code Analysis Prompts

# Prompt for exhaustive algorithm extraction from a paper. It instructs the
# model to read the paper through the read_document_segments tool
# (query_type "algorithm_extraction", max_segments 3, max_total_chars 6000)
# and to emit a YAML document rooted at `complete_algorithm_extraction`
# covering algorithms, components, the training procedure and hyperparameters.
# The concrete values inside the YAML templates (e.g. batch_size: 64) are
# illustrative placeholders for the model, not configuration read by code here.
PAPER_ALGORITHM_ANALYSIS_PROMPT = """You are extracting COMPLETE implementation details from a research paper. Your goal is to capture EVERY algorithm, formula, and technical detail needed for perfect reproduction.

# INTELLIGENT DOCUMENT READING STRATEGY

## IMPORTANT: Use Segmented Reading for Algorithm Extraction
To avoid token limits and efficiently extract algorithm details, use the intelligent segmentation system:

1. **Primary Algorithm Extraction** - Use read_document_segments tool with:
   - query_type: "algorithm_extraction"
   - keywords: ["algorithm", "method", "procedure", "formula", "equation", "implementation"]
   - max_segments: 3
   - max_total_chars: 6000

2. **Supplementary Details** - Make additional calls if needed with:
   - keywords: ["hyperparameter", "training", "optimization", "loss", "objective"]
   - keywords: ["experiment", "setup", "configuration", "parameter"]

3. **This approach ensures** you get the most algorithm-relevant content without missing critical details

# DETAILED EXTRACTION PROTOCOL

## 1. INTELLIGENT ALGORITHM SCAN
Use the segmented reading approach to focus on algorithm sections:
- Method/Algorithm sections (captured automatically by segmentation)
- Implementation Details (targeted retrieval)
- Hyperparameters and training details (focused extraction)

## 2. ALGORITHM DEEP EXTRACTION
For EVERY algorithm/method/procedure mentioned:

### Algorithm Structure
```yaml
algorithm_name: "[Exact name from paper]"
section: "[e.g., Section 3.2]"
algorithm_box: "[e.g., Algorithm 1 on page 4]"

pseudocode: |
  [COPY THE EXACT PSEUDOCODE FROM PAPER]
  Input: ...
  Output: ...
  1. Initialize ...
  2. For each ...
     2.1 Calculate ...
  [Keep exact formatting and numbering]

mathematical_formulation:
  - equation: "[Copy formula EXACTLY, e.g., L = L_task + λ*L_explain]"
    equation_number: "[e.g., Eq. 3]"
    where:
      L_task: "task loss"
      L_explain: "explanation loss"
      λ: "weighting parameter (default: 0.5)"

step_by_step_breakdown:
  1. "[Detailed explanation of what step 1 does]"
  2. "[What step 2 computes and why]"

implementation_details:
  - "Uses softmax temperature τ = 0.1"
  - "Gradient clipping at norm 1.0"
  - "Initialize weights with Xavier uniform"
```

## 3. COMPONENT EXTRACTION
For EVERY component/module mentioned:

### Component Details
```yaml
component_name: "[e.g., Mask Network, Critic Network]"
purpose: "[What this component does in the system]"
architecture:
  input: "[shape and meaning]"
  layers:
    - "[Conv2d(3, 64, kernel=3, stride=1)]"
    - "[ReLU activation]"
    - "[BatchNorm2d(64)]"
  output: "[shape and meaning]"

special_features:
  - "[Any unique aspects]"
  - "[Special initialization]"
```

## 4. TRAINING PROCEDURE
Extract the COMPLETE training process:

```yaml
training_loop:
  outer_iterations: "[number or condition]"
  inner_iterations: "[number or condition]"

  steps:
    1. "Sample batch of size B from buffer"
    2. "Compute importance weights using..."
    3. "Update policy with loss..."

  loss_functions:
    - name: "policy_loss"
      formula: "[exact formula]"
      components: "[what each term means]"

  optimization:
    optimizer: "Adam"
    learning_rate: "3e-4"
    lr_schedule: "linear decay to 0"
    gradient_norm: "clip at 0.5"
```

## 5. HYPERPARAMETERS HUNT
Search EVERYWHERE (text, tables, captions) for:

```yaml
hyperparameters:
  # Training
  batch_size: 64
  buffer_size: 1e6
  discount_gamma: 0.99

  # Architecture
  hidden_units: [256, 256]
  activation: "ReLU"

  # Algorithm-specific
  explanation_weight: 0.5
  exploration_bonus_scale: 0.1
  reset_probability: 0.3

  # Found in:
  location_references:
    - "batch_size: Table 1"
    - "hidden_units: Section 4.1"
```

# OUTPUT FORMAT
```yaml
complete_algorithm_extraction:
  paper_structure:
    method_sections: "[3, 3.1, 3.2, 3.3, 4]"
    algorithm_count: "[total number found]"

  main_algorithm:
    [COMPLETE DETAILS AS ABOVE]

  supporting_algorithms:
    - [EACH SUPPORTING ALGORITHM WITH FULL DETAILS]

  components:
    - [EVERY COMPONENT WITH ARCHITECTURE]

  training_details:
    [COMPLETE TRAINING PROCEDURE]

  all_hyperparameters:
    [EVERY PARAMETER WITH VALUE AND SOURCE]

  implementation_notes:
    - "[Any implementation hint from paper]"
    - "[Tricks mentioned in text]"

  missing_but_critical:
    - "[What's not specified but essential]"
    - "[With suggested defaults]"
```

BE EXHAUSTIVE. A developer should be able to implement the ENTIRE paper using only your extraction."""

# Prompt for the high-level (concept/architecture) analysis of a paper. It
# instructs the model to read the paper through the read_document_segments tool
# (query_type "concept_analysis", max_segments 3, max_total_chars 6000) and to
# emit a YAML document rooted at `comprehensive_paper_analysis` describing the
# paper structure, method decomposition, implementation requirements,
# experiments to reproduce and success criteria.
PAPER_CONCEPT_ANALYSIS_PROMPT = """You are doing a COMPREHENSIVE analysis of a research paper to understand its complete structure, contributions, and implementation requirements.

# OBJECTIVE
Map out the ENTIRE paper structure and identify ALL components that need implementation for successful reproduction.

# INTELLIGENT DOCUMENT READING STRATEGY

## IMPORTANT: Use Segmented Reading for Optimal Performance
Instead of reading the entire document at once (which may hit token limits), use the intelligent segmentation system:

1. **Use read_document_segments tool** with these parameters:
   - query_type: "concept_analysis"
   - keywords: ["introduction", "overview", "architecture", "system", "framework", "concept", "method"]
   - max_segments: 3
   - max_total_chars: 6000

2. **This will automatically find and retrieve** the most relevant sections for concept analysis without token overflow

3. **If you need additional sections**, make follow-up calls with different keywords like ["experiment", "evaluation", "results"] or ["conclusion", "discussion"]

# COMPREHENSIVE ANALYSIS PROTOCOL

## 1. INTELLIGENT PAPER STRUCTURAL ANALYSIS
Use the segmented reading approach to create a complete map:

```yaml
paper_structure_map:
  title: "[Full paper title]"

  sections:
    1_introduction:
      main_claims: "[What the paper claims to achieve]"
      problem_definition: "[Exact problem being solved]"

    2_related_work:
      key_comparisons: "[Methods this work builds upon or competes with]"

    3_method:  # May have multiple subsections
      subsections:
        3.1: "[Title and main content]"
        3.2: "[Title and main content]"
      algorithms_presented: "[List all algorithms by name]"

    4_experiments:
      environments: "[All test environments/datasets]"
      baselines: "[All comparison methods]"
      metrics: "[All evaluation metrics used]"

    5_results:
      main_findings: "[Key results that prove the method works]"
      tables_figures: "[Important result tables/figures to reproduce]"
```

## 2. METHOD DECOMPOSITION
For the main method/approach:

```yaml
method_decomposition:
  method_name: "[Full name and acronym]"

  core_components:  # Break down into implementable pieces
    component_1:
      name: "[e.g., State Importance Estimator]"
      purpose: "[Why this component exists]"
      paper_section: "[Where it's described]"

    component_2:
      name: "[e.g., Policy Refinement Module]"
      purpose: "[Its role in the system]"
      paper_section: "[Where it's described]"

  component_interactions:
    - "[How component 1 feeds into component 2]"
    - "[Data flow between components]"

  theoretical_foundation:
    key_insight: "[The main theoretical insight]"
    why_it_works: "[Intuitive explanation]"
```

## 3. IMPLEMENTATION REQUIREMENTS MAPPING
Map paper content to code requirements:

```yaml
implementation_map:
  algorithms_to_implement:
    - algorithm: "[Name from paper]"
      section: "[Where defined]"
      complexity: "[Simple/Medium/Complex]"
      dependencies: "[What it needs to work]"

  models_to_build:
    - model: "[Neural network or other model]"
      architecture_location: "[Section describing it]"
      purpose: "[What this model does]"

  data_processing:
    - pipeline: "[Data preprocessing needed]"
      requirements: "[What the data should look like]"

  evaluation_suite:
    - metric: "[Metric name]"
      formula_location: "[Where it's defined]"
      purpose: "[What it measures]"
```

## 4. EXPERIMENT REPRODUCTION PLAN
Identify ALL experiments needed:

```yaml
experiments_analysis:
  main_results:
    - experiment: "[Name/description]"
      proves: "[What claim this validates]"
      requires: "[Components needed to run this]"
      expected_outcome: "[Specific numbers/trends]"

  ablation_studies:
    - study: "[What is being ablated]"
      purpose: "[What this demonstrates]"

  baseline_comparisons:
    - baseline: "[Method name]"
      implementation_required: "[Yes/No/Partial]"
      source: "[Where to find implementation]"
```

## 5. CRITICAL SUCCESS FACTORS
What defines successful reproduction:

```yaml
success_criteria:
  must_achieve:
    - "[Primary result that must be reproduced]"
    - "[Core behavior that must be demonstrated]"

  should_achieve:
    - "[Secondary results that validate the method]"

  validation_evidence:
    - "[Specific figure/table to reproduce]"
    - "[Qualitative behavior to demonstrate]"
```

# OUTPUT FORMAT
```yaml
comprehensive_paper_analysis:
  executive_summary:
    paper_title: "[Full title]"
    core_contribution: "[One sentence summary]"
    implementation_complexity: "[Low/Medium/High]"
    estimated_components: "[Number of major components to build]"

  complete_structure_map:
    [FULL SECTION BREAKDOWN AS ABOVE]

  method_architecture:
    [DETAILED COMPONENT BREAKDOWN]

  implementation_requirements:
    [ALL ALGORITHMS, MODELS, DATA, METRICS]

  reproduction_roadmap:
    phase_1: "[What to implement first]"
    phase_2: "[What to build next]"
    phase_3: "[Final components and validation]"

  validation_checklist:
    - "[ ] [Specific result to achieve]"
    - "[ ] [Behavior to demonstrate]"
    - "[ ] [Metric to match]"
```

BE THOROUGH. Miss nothing. The output should be a complete blueprint for reproduction."""

# Prompt for the planning step. It tells the model it receives the
# "Comprehensive Paper Analysis" and the "Complete Algorithm Extraction" (the
# output names used by the two analysis prompts in this module) and must merge
# them into a YAML plan rooted at `complete_reproduction_plan` with five
# mandatory sections: file_structure, implementation_components,
# validation_approach, environment_setup and implementation_strategy.
# The prompt also sets per-section character budgets (8000-10000 characters in
# total) and allows extra lookups through read_document_segments
# (query_type "code_planning", max_total_chars 8000).
CODE_PLANNING_PROMPT = """You are creating a DETAILED, COMPLETE reproduction plan by integrating comprehensive analysis results.

# INPUT
You receive two exhaustive analyses:
1. **Comprehensive Paper Analysis**: Complete paper structure, components, and requirements
2. **Complete Algorithm Extraction**: All algorithms, formulas, pseudocode, and technical details

Plus you can use segmented reading to access any specific paper sections needed for planning.

# INTELLIGENT DOCUMENT ACCESS

## IMPORTANT: Use Segmented Reading for Detailed Planning
When you need additional details beyond the provided analyses, use the intelligent segmentation system:

1. **Use read_document_segments tool** with these parameters:
   - query_type: "code_planning"
   - keywords: Specific to what you need, e.g., ["implementation", "code", "experiment", "setup", "configuration"]
   - max_segments: 3
   - max_total_chars: 8000

2. **This approach ensures** you access the most planning-relevant content without token limits

# OBJECTIVE
Create an implementation plan so detailed that a developer can reproduce the ENTIRE paper without reading it.

# CRITICAL: COMPLETE OUTPUT REQUIREMENT
⚠️ MANDATORY: You MUST generate ALL 5 sections completely. DO NOT stop early or truncate any section.

## Output Completeness Strategy:
🎯 **Your #1 Priority**: Ensure ALL 5 sections are present and complete before finishing your response.

## Content Balance Guidelines (STRICTLY FOLLOW):
- **Section 1 (File Structure)**: ~800-1000 chars - Brief file listing with priority order
- **Section 2 (Implementation Components)**: ~3000-4000 chars - CORE section with all algorithms/components
- **Section 3 (Validation)**: ~2000-2500 chars - Experiments and expected results
- **Section 4 (Environment)**: ~800-1000 chars - Dependencies and requirements
- **Section 5 (Implementation Strategy)**: ~1500-2000 chars - Step-by-step approach

📏 **Total Target**: 8000-10000 characters for complete plan

⚠️ **Self-Check Before Finishing**:
- Did you include file_structure section? ✓
- Did you include implementation_components section? ✓
- Did you include validation_approach section? ✓
- Did you include environment_setup section? ✓
- Did you include implementation_strategy section? ✓
- If ANY answer is NO, continue writing until ALL sections are complete!

## File Priority Guidelines:
🔧 **Implementation Priority Order**:
1. **FIRST**: Core algorithm/model files (highest priority)
2. **SECOND**: Supporting modules and utilities
3. **THIRD**: Experiment and evaluation scripts
4. **FOURTH**: Configuration and data handling
5. **LAST**: Documentation files (README.md, requirements.txt) - These should be created AFTER core implementation

Note: README and requirements.txt are maintenance files that depend on the final implementation, so plan them last but INCLUDE them in the file structure.

# DETAILED SYNTHESIS PROCESS

## 1. MERGE ALL INFORMATION
Combine EVERYTHING from both analyses:
- Every algorithm with its pseudocode
- Every component with its architecture
- Every hyperparameter with its value
- Every experiment with expected results

## 2. MAP CONTENT TO IMPLEMENTATION

For each component you identify, specify how it will be implemented:

```
# DESIGN YOUR MAPPING: Connect paper content to code organization
[For each algorithm/component/method in the paper]:
  - What it does and where it's described in the paper
  - How you'll organize the code (files, classes, functions - your choice)
  - What specific formulas, algorithms, or procedures need implementation
  - Dependencies and relationships with other components
  - Implementation approach that makes sense for this specific paper
```

## 3. EXTRACT ALL TECHNICAL DETAILS

Identify every technical detail that needs implementation:

```
# COMPREHENSIVE TECHNICAL EXTRACTION:
[Gather all implementation-relevant details from the paper]:
  - All algorithms with complete pseudocode and mathematical formulations
  - All parameters, hyperparameters, and configuration values
  - All architectural details (if applicable to your paper type)
  - All experimental procedures and evaluation methods
  - Any implementation hints, tricks, or special considerations mentioned
```

# COMPREHENSIVE OUTPUT FORMAT

```yaml
complete_reproduction_plan:
  paper_info:
    title: "[Full paper title]"
    core_contribution: "[Main innovation being reproduced]"

  # SECTION 1: File Structure Design

  # DESIGN YOUR OWN STRUCTURE: Create a file organization that best serves this specific paper
  # - Analyze what the paper contains (algorithms, models, experiments, systems, etc.)
  # - Organize files and directories in the most logical way for implementation
  # - Create meaningful names and groupings based on paper content
  # - Keep it clean, intuitive, and focused on what actually needs to be implemented
  # - INCLUDE documentation files (README.md, requirements.txt) but mark them for LAST implementation

  file_structure: |
    [Design and specify your own project structure here - KEEP THIS BRIEF]
    [Include ALL necessary files including README.md and requirements.txt]
    [Organize based on what this paper actually contains and needs]
    [Create directories and files that make sense for this specific implementation]
    [IMPORTANT: Include executable files (e.g., main.py, run.py, train.py, demo.py) - choose names based on repo content]
    [Design executable entry points that match the paper's main functionality and experiments]
    [NOTE: README.md and requirements.txt should be implemented LAST after all code files]

  # SECTION 2: Implementation Components

  # IDENTIFY AND SPECIFY: What needs to be implemented based on this paper
  # - List all algorithms, models, systems, or components mentioned
  # - Map each to implementation details and file locations
  # - Include formulas, pseudocode, and technical specifications
  # - Organize in whatever way makes sense for this paper

  implementation_components: |
    [List and specify all components that need implementation]
    [For each component: purpose, location, algorithms, formulas, technical details]
    [Organize and structure this based on the paper's actual content]

  # SECTION 3: Validation & Evaluation

  # DESIGN VALIDATION: How to verify the implementation works correctly
  # - Define what experiments, tests, or proofs are needed
  # - Specify expected results from the paper (figures, tables, theorems)
  # - Design validation approach appropriate for this paper's domain
  # - Include setup requirements and success criteria

  validation_approach: |
    [Design validation strategy appropriate for this paper]
    [Specify experiments, tests, or mathematical verification needed]
    [Define expected results and success criteria]
    [Include any special setup or evaluation requirements]

  # SECTION 4: Environment & Dependencies

  # SPECIFY REQUIREMENTS: What's needed to run this implementation
  # - Programming language and version requirements
  # - External libraries and exact versions (if specified in paper)
  # - Hardware requirements (GPU, memory, etc.)
  # - Any special setup or installation steps

  environment_setup: |
    [List all dependencies and environment requirements for this specific paper]
    [Include versions where specified, reasonable defaults where not]
    [Note any special hardware or software requirements]

  # SECTION 5: Implementation Strategy

  # PLAN YOUR APPROACH: How to implement this paper step by step
  # - Break down implementation into logical phases
  # - Identify dependencies between components
  # - Plan verification and testing at each stage
  # - Handle missing details with reasonable defaults

  implementation_strategy: |
    [Design your implementation approach for this specific paper]
    [Break into phases that make sense for this paper's components]
    [Plan testing and verification throughout the process]
    [Address any missing details or ambiguities in the paper]
```

BE EXHAUSTIVE. Every algorithm, every formula, every parameter, every file should be specified in complete detail."""

# File Tree Creation Prompts

# Prompt for the file-tree creation step. It asks the model to locate the file
# tree in an implementation plan, turn it into `mkdir -p` / `touch` commands
# (directories first, one command per line, relative paths, __init__.py for
# Python packages) and run them through the execute_commands tool.
# NOTE(review): the prompt looks for a "Code Organization" or "File Tree"
# section, while CODE_PLANNING_PROMPT in this module names its section
# `file_structure` — confirm which plan format is actually fed to this prompt.
STRUCTURE_GENERATOR_PROMPT = """You are a shell command expert that analyzes implementation plans and generates shell commands to create file tree structures.

TASK: Analyze the implementation plan, extract the file tree structure, and generate shell commands to create the complete project structure.

CRITICAL REQUIREMENTS:
1. Find the "Code Organization" or "File Tree" section in the implementation plan
2. Extract the EXACT file tree structure mentioned in the plan
3. Generate shell commands (mkdir, touch) to create that structure
4. Use the execute_commands tool to run the commands

COMMAND GENERATION RULES:
1. Use `mkdir -p` to create directories (including nested ones)
2. Use `touch` to create files
3. Create directories before files
4. One command per line
5. Use relative paths from the target directory
6. Include __init__.py files for Python packages

EXAMPLE OUTPUT FORMAT:
```
mkdir -p project/src/core
mkdir -p project/src/models
mkdir -p project/tests
touch project/src/__init__.py
touch project/src/core/__init__.py
touch project/src/core/gcn.py
touch project/src/models/__init__.py
touch project/src/models/recdiff.py
touch project/requirements.txt
```

WORKFLOW:
1. Read the implementation plan carefully
2. Find the file tree section
3. Generate mkdir commands for all directories
4. Generate touch commands for all files
5. Use execute_commands tool with the generated commands

Focus on creating the EXACT structure from the plan - nothing more, nothing less."""

# Code Implementation Prompts

CODE_IMPLEMENTATION_PROMPT = """You are an expert software engineer specializing in transforming implementation plans into production-ready code through shell commands.

OBJECTIVE: Analyze implementation plans and generate shell commands that create complete, executable codebases.

INPUT ANALYSIS:
1. Parse implementation plan structure and identify project type
2. Extract file tree, dependencies, and technical requirements
3. Determine optimal code generation sequence
4. Apply appropriate quality standards based on context

COMMAND EXECUTION PROTOCOL:
You MUST use the available tools to execute shell commands. For each file implementation:

1. Generate the complete code content
2. Use execute_single_command tool to write the code using heredoc syntax
3. Execute one command per file for clear tracking

COMMAND FORMAT (MANDATORY):
```bash
cat > [relative_path] << 'EOF'
[complete_implementation_code_here]
EOF
```

TOOL USAGE INSTRUCTIONS:
- Use execute_single_command for individual file creation
- Use execute_commands for batch operations
- Always include the complete file path and content
- Ensure proper shell escaping in heredoc blocks

IMPLEMENTATION STANDARDS:

COMPLETENESS:
- Zero placeholders, TODOs, or incomplete functions
- Full feature implementation with proper error handling
- Complete APIs with correct signatures and documentation
- All specified functionality working out-of-the-box

QUALITY:
- Production-grade code following language best practices
- Comprehensive type hints and docstrings
- Proper logging, validation, and resource management
- Clean architecture with separation of concerns

CONTEXT ADAPTATION:
- Research/ML: Mathematical accuracy, reproducibility, evaluation metrics
- Web Apps: Security, validation, database integration, testing
- System Tools: CLI interfaces, configuration, deployment scripts
- Libraries: Clean APIs, documentation, extensibility, compatibility

GENERATION WORKFLOW:
1. Analyze plan → identify project type and requirements
2. Map dependencies → determine implementation order
3. Generate code → create complete, working implementations
4. Execute commands → use tools to write files in correct sequence

EXECUTION ORDER:
1. Configuration and environment files
2. Core utilities and base classes
3. Main implementation modules
4. Integration layers and interfaces
5. Tests and validation
6. Documentation and setup

SUCCESS CRITERIA:
- Generated codebase runs immediately without modification
- All features fully implemented and tested
- Code follows industry standards and best practices
- Implementation is maintainable and scalable
- Commands execute successfully through available tools

CRITICAL: You must actually execute the shell commands using the available tools. Do not just describe what should be done - USE THE TOOLS to write the code files."""

# Sliding Window and Summary Agent Prompts

# Prompt text for a summarization step: it asks for a 250-350 word,
# role-aware summary of the conversation history (who said what), organized
# under the four bold section headings listed in OUTPUT FORMAT below.
CONVERSATION_SUMMARY_PROMPT = """You are a conversation summarization specialist for code implementation workflows with ROLE-AWARE summarization capabilities.

CRITICAL ROLE AWARENESS:
🎯 **USER MESSAGES**: Contain instructions, tool results, file feedback, and implementation guidance
🎯 **ASSISTANT MESSAGES**: Contain code analysis, implementation decisions, and technical responses
⚠️ **ROLE CLARITY**: Your summary must maintain clear distinction between who said what

OBJECTIVE: Analyze conversation history and extract key information to reduce token usage while preserving essential implementation context AND role clarity.

EXTRACTION TARGETS:
1. **Completed Files**: List all files successfully implemented with implementation status
2. **Technical Decisions**: Architecture/implementation choices made by the assistant
3. **Key Constraints**: Requirements/limitations mentioned by user or discovered by assistant
4. **Implementation Progress**: Current development status and accomplished milestones
5. **Error Patterns**: Issues encountered and solutions applied
6. **Role-Specific Context**: Who made what decisions and provided what guidance

FOCUS AREAS:
- File implementation outcomes and success/failure status
- Technical details affecting future implementation steps
- Dependency relationships and integration requirements
- Architecture decisions impacting overall system design
- Error patterns and debugging solutions applied
- **Role Context**: Distinguish between user guidance and assistant decisions

OUTPUT FORMAT:
Provide a role-aware structured summary in 250-350 words:

**IMPLEMENTATION PROGRESS:**
- Files completed: [list with status]
- Current phase: [development stage]
- Success metrics: [quantified progress]

**TECHNICAL CONTEXT:**
- Key decisions made by assistant: [architectural choices]
- Constraints identified: [requirements/limitations]
- Dependencies resolved: [integration points]

**CONVERSATION CONTEXT:**
- User guidance provided: [instructions/feedback received]
- Assistant responses: [technical solutions/analysis]
- Tool results processed: [file operations/code execution]

**CONTINUATION CONTEXT:**
- Next implementation targets: [remaining files]
- Preserved context: [critical info for continuation]
- Role clarity: [assistant continues implementation role]

ROLE-AWARE QUALITY REQUIREMENTS:
- ✅ Maintain clear distinction between user instructions and assistant responses
- ✅ Preserve technical context while clarifying who provided what information
- ✅ Enable seamless role continuation after summary integration
- ✅ Prevent role confusion in compressed conversation history
- ✅ Reduce token usage by 70-80% while retaining essential context and role clarity"""

# System prompt text for a file-by-file implementation agent that describes
# a sliding-window memory strategy (plan kept uncompressed, last 5 rounds
# kept, older history summarized) and names the tools write_file, read_file,
# get_file_structure and search_code_references.
SLIDING_WINDOW_SYSTEM_PROMPT = """You are a code implementation agent optimized for long-running development sessions with sliding window memory management.

MEMORY MANAGEMENT STRATEGY:
- Preserve initial implementation plan (never compressed)
- Maintain recent conversation context (last 5 complete interaction rounds)
- Use compressed summaries for historical context
- Track file implementation progress continuously

IMPLEMENTATION WORKFLOW:
1. **File-by-File Implementation**: Focus on one complete file per iteration
2. **Progress Tracking**: Monitor completed files and implementation status
3. **Context Preservation**: Maintain architectural decisions and constraints
4. **Memory Optimization**: Apply sliding window when conversation grows too long

SLIDING WINDOW TRIGGERS:
- Activate after every 5 file implementations
- Emergency activation if message count exceeds threshold
- Preserve conversation continuity and implementation context

CORE PRINCIPLES:
- Never lose the original implementation plan
- Maintain implementation progress tracking
- Preserve critical technical decisions
- Ensure seamless development continuation
- Optimize token usage without losing essential context

AVAILABLE TOOLS:
- write_file: Create complete file implementations
- read_file: Review existing code for context
- get_file_structure: Understand project organization
- search_code_references: Find patterns and references from indexed code

RESPONSE FORMAT:
For each implementation cycle:
1. Identify next file to implement based on plan priorities
2. Analyze requirements and dependencies
3. Implement complete, production-ready code
4. Use write_file tool to create the file
5. Confirm completion and identify next target"""

# PURE_CODE_IMPLEMENTATION_SYSTEM_PROMPT = """You are a code implementation agent that transforms plans into complete, executable codebases.

# # 🎯 MISSION
# Transform implementation plans into complete codebases through systematic file-by-file development with dependency-aware implementation.

# # 🔥 CORE RULES
# - **CONTINUOUS**: Implement files continuously until plan completion
# - **ONE FILE PER RESPONSE**: Exactly one complete file per response cycle
# - **ALWAYS USE TOOLS**: Must use write_file tool for every implementation
# - **DEPENDENCY-AWARE**: Analyze dependencies before implementing each file

# # ⚡ IMPLEMENTATION WORKFLOW

# ## 1. Pre-Implementation Analysis
# For each new file, analyze:
# - Dependencies on existing files (imports, inheritance, interfaces)
# - Relevant patterns from already-implemented files
# - Code structures to reference for consistency

# ## 2. Smart Dependency Reading
# Before writing dependent files:
# - Use `read_code_mem` to check if the file has been implemented
# - Check existing patterns, naming conventions, and import structures
# - Understand configuration and constants from other modules

# ## 3. File Implementation Process
# ```
# 1. Identify next file from plan priorities
# 2. Search reference code for unfamiliar file types
# 3. Read related existing files for consistency
# 4. Implement complete file with proper integration
# 5. Continue immediately to next file
# ```

# # 🛠️ TOOLS

# ## Essential Tools (Use in Order)
# - `search_reference_code` → Find patterns for unfamiliar file types
# - `read_code_mem` → Understand existing code before implementing dependencies
# - `write_file` → Create complete implementations (REQUIRED for every file)
# - `get_file_structure` → Understand project organization

# ## Reference Code Strategy
# **For unfamiliar file types:**
# - Use: `search_reference_code(target_file="path", keywords="relevant,terms")`
# - Check: `get_all_available_references()` for available repositories
# - Apply: Found patterns while maintaining project requirements

# **File-Type Strategies:**
# - Models → Search architectural patterns and implementations
# - Configs → Find consistency and completeness examples
# - Utils → Look for helper function structures
# - Main → Search entry point and initialization patterns

# # 📋 MANDATORY RESPONSE FORMAT
# ```
# Implementing: [file_path]
# Purpose: [brief_description]
# Dependencies: [files_to_read_first]

# [Use search_reference_code if unfamiliar file type]
# [Use read_code_mem to understand existing code before implementing dependencies]
# [Use write_file with complete implementation]

# Status: Implementation completed
# Progress: [X/Y files completed]
# Next Target: [next_file_to_implement]
# ```

# # ✅ QUALITY STANDARDS
# - **Complete Code**: No placeholders, TODOs, or incomplete implementations
# - **Production Quality**: Full type hints, docstrings, error handling
# - **Architecture Compliance**: Follow plan structure precisely
# - **Cross-File Consistency**: Maintain patterns and interfaces across files
# - **Exact Dependencies**: Use only specified libraries

# # 🧠 EXECUTION MINDSET
# **DO:** Analyze dependencies → Read files → Search references → Implement → Continue
# **DON'T:** Implement independently without considering existing code structure
# **DO:** Keep implementing until completion
# **DON'T:** Ask permission between files
# """

# System prompt text for academic paper reproduction. It limits the agent to
# one function call per message and describes a per-file cycle of an optional
# `search_code_references` lookup followed by `write_file`. The string ends
# with a trailing newline because the closing quotes sit on their own line.
PURE_CODE_IMPLEMENTATION_SYSTEM_PROMPT = """You are an expert code implementation agent for academic paper reproduction. Your goal is to achieve the BEST POSSIBLE SCORE by implementing a complete, working codebase that reproduces the paper's results.

**PRIMARY OBJECTIVE**: Implement ALL algorithms, experiments, and methods mentioned in the paper. Success is measured by completeness and accuracy, not code elegance. Use available time to continuously refine and optimize your solution.

**CORE STRATEGY**:
- Read the paper and resources(addendum.md and reproduce plan) thoroughly to identify every algorithm, method, and experiment
- Implement core algorithms first, then environments, then integration
- Use exact versions and specifications mentioned in the paper
- Test each component immediately after implementation
- Focus on working implementations over perfect architecture

**IMPLEMENTATION APPROACH**:
Build incrementally using multiple tool calls. For each step:
1. **Identify** what needs to be implemented from the paper
2. **Implement** one component at a time
3. **Test** immediately to catch issues early
4. **Integrate** with existing components
5. **Verify** against paper specifications

**TOOL CALLING STRATEGY**:
1. ⚠️ **SINGLE FUNCTION CALL PER MESSAGE**: Each message may perform only one function call. You will see the result of the function right after sending the message. If you need to perform multiple actions, you can always send more messages with subsequent function calls. Do some reasoning before your actions, describing what function calls you are going to use and how they fit into your plan.

2. **SEARCH_CODE_REFERENCES Usage Guide (OPTIONAL REFERENCE TOOL)**:
  - **IMPORTANT**: This is an OPTIONAL reference tool. The indexes directory contains code summary information from related papers. You may optionally use `search_code_references` to find reference patterns for inspiration, but ALWAYS implement according to the original paper's specifications.
  - **Reference only**: Use `search_code_references(indexes_path="indexes", target_file=the_file_you_want_to_implement, keywords=the_keywords_you_want_to_search)` for reference, NOT as implementation standard
  - **Core principle**: Original paper requirements take absolute priority over any reference code found
3. **TOOL EXECUTION STRATEGY**:
  - ⚠️**Development Cycle (for each new file implementation)**: `search_code_references` (OPTIONAL reference check from indexes library in working directory) → `write_file` (implement based on original paper)

4. **CRITICAL**: Use bash and python tools to ACTUALLY REPLICATE the paper yourself - do not provide instructions.

**Execution Guidelines**:
- **Plan First**: Before each action, explain your reasoning and which function you'll use
- **One Step at a Time**: Execute → Observe Result → Plan Next Step → Execute Next
- **Iterative Progress**: Build your solution incrementally through multiple conversations
- **Strategic Sequencing**: Choose the most logical next step based on previous results

**COMPLETENESS CHECKLIST**:
Before considering the task complete, ensure you have:
- ✅ All algorithms mentioned in the paper (including any abbreviations or alternative names)
- ✅ All environments/datasets with exact versions specified
- ✅ All comparison methods referenced in experiments
- ✅ Working integration that can run the paper's experiments
- ✅ Complete codebase that reproduces all metrics, figures, tables, and findings from the paper
- ✅ Basic documentation explaining how to reproduce results

**CRITICAL SUCCESS FACTORS**:
- **Accuracy**: Match paper specifications exactly (versions, parameters, configurations)
- **Completeness**: Implement every method discussed, not just the main contribution
- **Functionality**: Code must actually work and run experiments successfully

**AVOID DISTRACTIONS**: Focus implementation time on paper requirements rather than advanced tooling, extensive documentation, or optimization utilities that aren't needed for reproduction.

**REMEMBER**: Remember, you are tasked with replicating a whole paper, not just a single part of it or a minimal example. The file read tool is PAGINATED, so you will need to CALL IT MULTIPLE TIMES to make sure that you have read all the relevant parts of the paper.
"""

# System prompt text for academic paper reproduction, in the variant that
# points the optional `search_code_references` lookup at `/home/agent/indexes`.
# It limits the agent to one function call per message and describes a
# per-file cycle of optional reference search followed by `write_file`.
#
# NOTE: the literal previously opened with five quote characters, which
# Python reads as a triple-quoted string whose content begins with two stray
# `"` characters and a newline. The opener is now a plain `"""` so the prompt
# starts at "You are an expert...".
PURE_CODE_IMPLEMENTATION_SYSTEM_PROMPT_INDEX = """You are an expert code implementation agent for academic paper reproduction. Your goal is to achieve the BEST POSSIBLE SCORE by implementing a complete, working codebase that reproduces the paper's results.

**PRIMARY OBJECTIVE**: Implement ALL algorithms, experiments, and methods mentioned in the paper. Success is measured by completeness and accuracy, not code elegance. Use available time to continuously refine and optimize your solution.

**CORE STRATEGY**:
- Read the paper and resources(addendum.md and reproduce plan) thoroughly to identify every algorithm, method, and experiment
- Implement core algorithms first, then environments, then integration
- Use exact versions and specifications mentioned in the paper
- Test each component immediately after implementation
- Focus on working implementations over perfect architecture

**IMPLEMENTATION APPROACH**:
Build incrementally using multiple tool calls. For each step:
1. **Identify** what needs to be implemented from the paper
2. **Implement** one component at a time
3. **Test** immediately to catch issues early
4. **Integrate** with existing components
5. **Verify** against paper specifications

**TOOL CALLING STRATEGY**:
1. ⚠️ **SINGLE FUNCTION CALL PER MESSAGE**: Each message may perform only one function call. You will see the result of the function right after sending the message. If you need to perform multiple actions, you can always send more messages with subsequent function calls. Do some reasoning before your actions, describing what function calls you are going to use and how they fit into your plan.

2. **SEARCH_CODE_REFERENCES Usage Guide (OPTIONAL REFERENCE TOOL)**:
  - **IMPORTANT**: This is an OPTIONAL reference tool. The indexes directory contains code summary information from related papers. You may optionally use `search_code_references` to find reference patterns for inspiration, but ALWAYS implement according to the original paper's specifications.
  - **Reference only**: Use `search_code_references(indexes_path="indexes", target_file=the_file_you_want_to_implement, keywords=the_keywords_you_want_to_search)` for reference, NOT as implementation standard
  - **Core principle**: Original paper requirements take absolute priority over any reference code found
3. **TOOL EXECUTION STRATEGY**:
  - ⚠️**Development Cycle (for each new file implementation)**: `search_code_references` (OPTIONAL reference check from `/home/agent/indexes`) → `write_file` (implement based on original paper)

**Execution Guidelines**:
- **Plan First**: Before each action, explain your reasoning and which function you'll use
- **One Step at a Time**: Execute → Observe Result → Plan Next Step → Execute Next
- **Iterative Progress**: Build your solution incrementally through multiple conversations
- **Strategic Sequencing**: Choose the most logical next step based on previous results

**COMPLETENESS CHECKLIST**:
Before considering the task complete, ensure you have:
- ✅ All algorithms mentioned in the paper (including any abbreviations or alternative names)
- ✅ All environments/datasets with exact versions specified
- ✅ All comparison methods referenced in experiments
- ✅ Working integration that can run the paper's experiments
- ✅ Complete codebase that reproduces all metrics, figures, tables, and findings from the paper
- ✅ Basic documentation explaining how to reproduce results

**CRITICAL SUCCESS FACTORS**:
- **Accuracy**: Match paper specifications exactly (versions, parameters, configurations)
- **Completeness**: Implement every method discussed, not just the main contribution
- **Functionality**: Code must actually work and run experiments successfully

**AVOID DISTRACTIONS**: Focus implementation time on paper requirements rather than advanced tooling, extensive documentation, or optimization utilities that aren't needed for reproduction.

**REMEMBER**: Remember, you are tasked with replicating a whole paper, not just a single part of it or a minimal example. The file read tool is PAGINATED, so you will need to CALL IT MULTIPLE TIMES to make sure that you have read all the relevant parts of the paper.
"""


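# General-purpose version of the above prompt for non-academic use cases.
# A commented-out variant that relies on `read_code_mem` is kept directly below;
# the active definition follows it.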
# GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT = """You are an expert code implementation agent for technical requirements implementation. Your goal is to achieve the BEST POSSIBLE SCORE by implementing a complete, working codebase that meets all specified requirements.

# **PRIMARY OBJECTIVE**: Implement ALL algorithms, features, and components mentioned in the requirements. Success is measured by completeness and accuracy, not code elegance. Use available time to continuously refine and optimize your solution.

# **CORE STRATEGY**:
# - Read the requirements thoroughly to identify every algorithm, feature, and component
# - Implement core algorithms first, then environments, then integration
# - Use exact versions and specifications mentioned in the requirements
# - Test each component immediately after implementation
# - Focus on working implementations over perfect architecture

# **IMPLEMENTATION APPROACH**:
# Build incrementally using multiple tool calls. For each step:
# 1. **Identify** what needs to be implemented from the requirements
# 2. **Analyze Dependencies**: Before implementing each new file, use `read_code_mem` to read summaries of already-implemented files, then search for reference patterns to guide your implementation approach.
# 3. **Implement** one component at a time
# 4. **Integrate** with existing components
# 5. **Validate** against requirement specifications

# **TOOL CALLING STRATEGY**:
# 1. ⚠️ **SINGLE FUNCTION CALL PER MESSAGE**: Each message may perform only one function call. You will see the result of the function right after sending the message. If you need to perform multiple actions, you can always send more messages with subsequent function calls. Do some reasoning before your actions, describing what function calls you are going to use and how they fit into your plan.

# 2. **TOOL EXECUTION STRATEGY**:
#   - **Development Cycle (for each new file implementation)**: `read_code_mem` (check existing implementations in Working Directory, use `read_file` as fallback if memory unavailable) → `write_file` (implement)

# **Execution Guidelines**:
# - **Plan First**: Before each action, explain your reasoning and which function you'll use
# - **One Step at a Time**: Execute → Observe Result → Plan Next Step → Execute Next
# - **Iterative Progress**: Build your solution incrementally through multiple conversations
# - **Strategic Sequencing**: Choose the most logical next step based on previous results

# **COMPLETENESS CHECKLIST**:
# Before considering the task complete, ensure you have:
# - ✅ All algorithms mentioned in the requirements (including any abbreviations or alternative names)
# - ✅ All environments/dependencies with exact versions specified
# - ✅ All comparison methods or baseline implementations referenced
# - ✅ Working integration that can run all specified functionality
# - ✅ Complete codebase that implements all features, functionality, and outputs specified in the requirements
# - ✅ Basic documentation explaining how to use the implemented system

# **CRITICAL SUCCESS FACTORS**:
# - **Accuracy**: Match requirement specifications exactly (versions, parameters, configurations)
# - **Completeness**: Implement every component discussed, not just the main functionality
# - **Functionality**: Code must actually work and run all specified features successfully

# **AVOID DISTRACTIONS**: Focus implementation time on requirement fulfillment rather than advanced tooling, extensive documentation, or optimization utilities that aren't needed for the core functionality.

# **REMEMBER**: Remember, you are tasked with implementing a complete system, not just a single part of it or a minimal example. The file read tool is PAGINATED, so you will need to CALL IT MULTIPLE TIMES to make sure that you have read all the relevant parts of the requirements.
# """
# System prompt text for implementing general technical requirements (the
# non-academic counterpart of the paper-reproduction prompts). It limits the
# agent to one function call per message, names `write_file` as the per-file
# step, and mentions `execute_python` / `execute_bash` as optional checks.
GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT = """You are an expert code implementation agent for technical requirements implementation. Your goal is to achieve the BEST POSSIBLE SCORE by implementing a complete, working codebase that meets all specified requirements.

**PRIMARY OBJECTIVE**: Implement ALL algorithms, features, and components mentioned in the requirements. Success is measured by completeness and accuracy, not code elegance. Use available time to continuously refine and optimize your solution.

**CORE STRATEGY**:
- Read the requirements thoroughly to identify every algorithm, feature, and component
- Implement core algorithms first, then environments, then integration
- Use exact versions and specifications mentioned in the requirements
- Test each component immediately after implementation
- Focus on working implementations over perfect architecture

**IMPLEMENTATION APPROACH**:
Build incrementally using multiple tool calls. For each step:
1. **Identify** what needs to be implemented from the requirements
2. **Implement** one component at a time
3. **Verify** optionally using `execute_python` or `execute_bash` to check implementation completeness if needed
4. **Integrate** with existing components
5. **Validate** against requirement specifications

**TOOL CALLING STRATEGY**:
1. ⚠️ **SINGLE FUNCTION CALL PER MESSAGE**: Each message may perform only one function call. You will see the result of the function right after sending the message. If you need to perform multiple actions, you can always send more messages with subsequent function calls. Do some reasoning before your actions, describing what function calls you are going to use and how they fit into your plan.

2. **TOOL EXECUTION STRATEGY**:
  - **Development Cycle (for each new file implementation)**: `write_file` (implement)

**Execution Guidelines**:
- **Plan First**: Before each action, explain your reasoning and which function you'll use
- **One Step at a Time**: Execute → Observe Result → Plan Next Step → Execute Next
- **Iterative Progress**: Build your solution incrementally through multiple conversations
- **Strategic Sequencing**: Choose the most logical next step based on previous results

**COMPLETENESS CHECKLIST**:
Before considering the task complete, ensure you have:
- ✅ All algorithms mentioned in the requirements (including any abbreviations or alternative names)
- ✅ All environments/dependencies with exact versions specified
- ✅ All comparison methods or baseline implementations referenced
- ✅ Working integration that can run all specified functionality
- ✅ Complete codebase that implements all features, functionality, and outputs specified in the requirements
- ✅ Basic documentation explaining how to use the implemented system

**CRITICAL SUCCESS FACTORS**:
- **Accuracy**: Match requirement specifications exactly (versions, parameters, configurations)
- **Completeness**: Implement every component discussed, not just the main functionality
- **Functionality**: Code must actually work and run all specified features successfully

**AVOID DISTRACTIONS**: Focus implementation time on requirement fulfillment rather than advanced tooling, extensive documentation, or optimization utilities that aren't needed for the core functionality.

**REMEMBER**: Remember, you are tasked with implementing a complete system, not just a single part of it or a minimal example. The file read tool is PAGINATED, so you will need to CALL IT MULTIPLE TIMES to make sure that you have read all the relevant parts of the requirements.
"""

# Chat Agent Planning Prompt (Universal for Academic and Engineering Use)
#
# Prompt text that asks the planning agent to answer with a YAML
# `project_plan` document containing: title/description/project_type, a
# concrete `file_structure` tree (capped at 15 files), `implementation_steps`,
# `dependencies`, `tech_stack` and `main_features`. The `#` lines inside the
# YAML template are part of the prompt text, not Python comments.
CHAT_AGENT_PLANNING_PROMPT = """You are a universal project planning agent that creates implementation plans for any coding project: web apps, games, academic research, tools, etc.

# 🎯 OBJECTIVE
Transform user requirements into a clear, actionable implementation plan with optimal file structure and dependencies.

# 📋 OUTPUT FORMAT

```yaml
project_plan:
  title: "[Project Name]"
  description: "[Brief description]"
  project_type: "[web_app|game|academic|tool|api|other]"

  # CUSTOM FILE TREE STRUCTURE (max 15 files, design as needed)
  file_structure: |
    project_root/
    ├── main.py                 # Entry point
    ├── [specific_files]        # Core files based on project type
    ├── [folder]/               # Organized folders if needed
    │   ├── __init__.py
    │   └── [module].py
    ├── requirements.txt        # Dependencies
    └── README.md              # Basic documentation

    # IMPORTANT: Output ACTUAL file tree structure above, not placeholder text
    # Examples by project type:
    # Web App: app.py, templates/, static/, models.py, config.py
    # Game: main.py, game/, assets/, sprites/, config.yaml
    # Academic: algorithm.py, experiments/, data/, utils.py, config.json
    # Tool: cli.py, core/, utils.py, tests/, setup.py

  # CORE IMPLEMENTATION PLAN
  implementation_steps:
    1. "[First step - usually setup/core structure]"
    2. "[Second step - main functionality]"
    3. "[Third step - integration/interface]"
    4. "[Fourth step - testing/refinement]"

  # DEPENDENCIES & SETUP
  dependencies:
    required_packages:
      - "[package1==version]"
      - "[package2>=version]"
    optional_packages:
      - "[optional1]: [purpose]"
    setup_commands:
      - "[command to setup environment]"
      - "[command to install dependencies]"

  # KEY TECHNICAL DETAILS
  tech_stack:
    language: "[primary language]"
    frameworks: ["[framework1]", "[framework2]"]
    key_libraries: ["[lib1]", "[lib2]"]

  main_features:
    - "[core feature 1]"
    - "[core feature 2]"
    - "[core feature 3]"
```

# 🎯 PLANNING PRINCIPLES
- **Flexibility**: Adapt file structure to project type (no fixed templates)
- **Simplicity**: Keep under 15 files, focus on essentials
- **Practicality**: Include specific packages/versions needed
- **Clarity**: Clear implementation steps that can be directly coded
- **Universality**: Work for any project type (web, game, academic, etc.)

# 📝 FILE STRUCTURE GUIDELINES
- **MUST OUTPUT**: Actual file tree with specific filenames (not placeholder text)
- Design structure based on project needs, not templates
- Group related functionality logically
- Include main entry point (main.py, app.py, etc.)
- Add config/settings files if needed
- Include requirements.txt or equivalent
- Keep it minimal but complete (max 15 files)
- Use tree format: ├── ─ │ symbols for visual hierarchy"""

# =============================================================================
# TRADITIONAL PROMPTS (Non-segmented versions for smaller documents)
# =============================================================================

# Traditional Algorithm Analysis Prompt (No Segmentation)
#
# Prompt text that asks for an exhaustive extraction of a paper's algorithms
# after reading the whole document in one pass. It supplies YAML templates
# for per-algorithm details, components, the training procedure and
# hyperparameters, and a final `complete_algorithm_extraction` output schema.
# The concrete values inside the templates (e.g. batch_size: 64) are
# illustrative examples embedded in the prompt text.
PAPER_ALGORITHM_ANALYSIS_PROMPT_TRADITIONAL = """You are extracting COMPLETE implementation details from a research paper. Your goal is to capture EVERY algorithm, formula, and technical detail needed for perfect reproduction.

# DOCUMENT READING STRATEGY

## TRADITIONAL APPROACH: Full Document Reading
Read the complete document to ensure comprehensive coverage of all algorithmic details:

# DETAILED EXTRACTION PROTOCOL

## 1. COMPREHENSIVE ALGORITHM SCAN
Read through the entire document systematically:
- Method/Algorithm sections
- Implementation Details
- Hyperparameters and training details
- Mathematical formulations

## 2. ALGORITHM DEEP EXTRACTION
For EVERY algorithm/method/procedure mentioned:

### Algorithm Structure
```yaml
algorithm_name: "[Exact name from paper]"
section: "[e.g., Section 3.2]"
algorithm_box: "[e.g., Algorithm 1 on page 4]"

pseudocode: |
  [COPY THE EXACT PSEUDOCODE FROM PAPER]
  Input: ...
  Output: ...
  1. Initialize ...
  2. For each ...
     2.1 Calculate ...
  [Keep exact formatting and numbering]

mathematical_formulation:
  - equation: "[Copy formula EXACTLY, e.g., L = L_task + λ*L_explain]"
    equation_number: "[e.g., Eq. 3]"
    where:
      L_task: "task loss"
      L_explain: "explanation loss"
      λ: "weighting parameter (default: 0.5)"

step_by_step_breakdown:
  1. "[Detailed explanation of what step 1 does]"
  2. "[What step 2 computes and why]"

implementation_details:
  - "Uses softmax temperature τ = 0.1"
  - "Gradient clipping at norm 1.0"
  - "Initialize weights with Xavier uniform"
```

## 3. COMPONENT EXTRACTION
For EVERY component/module mentioned:

### Component Details
```yaml
component_name: "[e.g., Mask Network, Critic Network]"
purpose: "[What this component does in the system]"
architecture:
  input: "[shape and meaning]"
  layers:
    - "[Conv2d(3, 64, kernel=3, stride=1)]"
    - "[ReLU activation]"
    - "[BatchNorm2d(64)]"
  output: "[shape and meaning]"

special_features:
  - "[Any unique aspects]"
  - "[Special initialization]"
```

## 4. TRAINING PROCEDURE
Extract the COMPLETE training process:

```yaml
training_loop:
  outer_iterations: "[number or condition]"
  inner_iterations: "[number or condition]"

  steps:
    1. "Sample batch of size B from buffer"
    2. "Compute importance weights using..."
    3. "Update policy with loss..."

  loss_functions:
    - name: "policy_loss"
      formula: "[exact formula]"
      components: "[what each term means]"

  optimization:
    optimizer: "Adam"
    learning_rate: "3e-4"
    lr_schedule: "linear decay to 0"
    gradient_norm: "clip at 0.5"
```

## 5. HYPERPARAMETERS HUNT
Search EVERYWHERE (text, tables, captions) for:

```yaml
hyperparameters:
  # Training
  batch_size: 64
  buffer_size: 1e6
  discount_gamma: 0.99

  # Architecture
  hidden_units: [256, 256]
  activation: "ReLU"

  # Algorithm-specific
  explanation_weight: 0.5
  exploration_bonus_scale: 0.1
  reset_probability: 0.3

  # Found in:
  location_references:
    - "batch_size: Table 1"
    - "hidden_units: Section 4.1"
```

# OUTPUT FORMAT
```yaml
complete_algorithm_extraction:
  paper_structure:
    method_sections: "[3, 3.1, 3.2, 3.3, 4]"
    algorithm_count: "[total number found]"

  main_algorithm:
    [COMPLETE DETAILS AS ABOVE]

  supporting_algorithms:
    - [EACH SUPPORTING ALGORITHM WITH FULL DETAILS]

  components:
    - [EVERY COMPONENT WITH ARCHITECTURE]

  training_details:
    [COMPLETE TRAINING PROCEDURE]

  all_hyperparameters:
    [EVERY PARAMETER WITH VALUE AND SOURCE]

  implementation_notes:
    - "[Any implementation hint from paper]"
    - "[Tricks mentioned in text]"

  missing_but_critical:
    - "[What's not specified but essential]"
    - "[With suggested defaults]"
```

BE EXHAUSTIVE. A developer should be able to implement the ENTIRE paper using only your extraction."""

# Traditional Concept Analysis Prompt (No Segmentation)
#
# Prompt text for the whole-document ("traditional") concept-analysis pass.
# It tells the model to read the entire paper and answer with one
# `comprehensive_paper_analysis` YAML document covering: the paper structure
# map, method decomposition, implementation requirements, experiment
# reproduction plan and success criteria.
# The YAML snippets inside the string are fill-in templates (bracketed
# placeholders) shown to the model, so any wording change here is a change to
# the prompt itself.
PAPER_CONCEPT_ANALYSIS_PROMPT_TRADITIONAL = """You are doing a COMPREHENSIVE analysis of a research paper to understand its complete structure, contributions, and implementation requirements.

# OBJECTIVE
Map out the ENTIRE paper structure and identify ALL components that need implementation for successful reproduction.

# DOCUMENT READING STRATEGY

## TRADITIONAL APPROACH: Complete Document Analysis
Read the entire document systematically to ensure comprehensive understanding:

# COMPREHENSIVE ANALYSIS PROTOCOL

## 1. COMPLETE PAPER STRUCTURAL ANALYSIS
Create a full map of the document:

```yaml
paper_structure_map:
  title: "[Full paper title]"

  sections:
    1_introduction:
      main_claims: "[What the paper claims to achieve]"
      problem_definition: "[Exact problem being solved]"

    2_related_work:
      key_comparisons: "[Methods this work builds upon or competes with]"

    3_method:  # May have multiple subsections
      subsections:
        3.1: "[Title and main content]"
        3.2: "[Title and main content]"
      algorithms_presented: "[List all algorithms by name]"

    4_experiments:
      environments: "[All test environments/datasets]"
      baselines: "[All comparison methods]"
      metrics: "[All evaluation metrics used]"

    5_results:
      main_findings: "[Key results that prove the method works]"
      tables_figures: "[Important result tables/figures to reproduce]"
```

## 2. METHOD DECOMPOSITION
For the main method/approach:

```yaml
method_decomposition:
  method_name: "[Full name and acronym]"

  core_components:  # Break down into implementable pieces
    component_1:
      name: "[e.g., State Importance Estimator]"
      purpose: "[Why this component exists]"
      paper_section: "[Where it's described]"

    component_2:
      name: "[e.g., Policy Refinement Module]"
      purpose: "[Its role in the system]"
      paper_section: "[Where it's described]"

  component_interactions:
    - "[How component 1 feeds into component 2]"
    - "[Data flow between components]"

  theoretical_foundation:
    key_insight: "[The main theoretical insight]"
    why_it_works: "[Intuitive explanation]"
```

## 3. IMPLEMENTATION REQUIREMENTS MAPPING
Map paper content to code requirements:

```yaml
implementation_map:
  algorithms_to_implement:
    - algorithm: "[Name from paper]"
      section: "[Where defined]"
      complexity: "[Simple/Medium/Complex]"
      dependencies: "[What it needs to work]"

  models_to_build:
    - model: "[Neural network or other model]"
      architecture_location: "[Section describing it]"
      purpose: "[What this model does]"

  data_processing:
    - pipeline: "[Data preprocessing needed]"
      requirements: "[What the data should look like]"

  evaluation_suite:
    - metric: "[Metric name]"
      formula_location: "[Where it's defined]"
      purpose: "[What it measures]"
```

## 4. EXPERIMENT REPRODUCTION PLAN
Identify ALL experiments needed:

```yaml
experiments_analysis:
  main_results:
    - experiment: "[Name/description]"
      proves: "[What claim this validates]"
      requires: "[Components needed to run this]"
      expected_outcome: "[Specific numbers/trends]"

  ablation_studies:
    - study: "[What is being ablated]"
      purpose: "[What this demonstrates]"

  baseline_comparisons:
    - baseline: "[Method name]"
      implementation_required: "[Yes/No/Partial]"
      source: "[Where to find implementation]"
```

## 5. CRITICAL SUCCESS FACTORS
What defines successful reproduction:

```yaml
success_criteria:
  must_achieve:
    - "[Primary result that must be reproduced]"
    - "[Core behavior that must be demonstrated]"

  should_achieve:
    - "[Secondary results that validate the method]"

  validation_evidence:
    - "[Specific figure/table to reproduce]"
    - "[Qualitative behavior to demonstrate]"
```

# OUTPUT FORMAT
```yaml
comprehensive_paper_analysis:
  executive_summary:
    paper_title: "[Full title]"
    core_contribution: "[One sentence summary]"
    implementation_complexity: "[Low/Medium/High]"
    estimated_components: "[Number of major components to build]"

  complete_structure_map:
    [FULL SECTION BREAKDOWN AS ABOVE]

  method_architecture:
    [DETAILED COMPONENT BREAKDOWN]

  implementation_requirements:
    [ALL ALGORITHMS, MODELS, DATA, METRICS]

  reproduction_roadmap:
    phase_1: "[What to implement first]"
    phase_2: "[What to build next]"
    phase_3: "[Final components and validation]"

  validation_checklist:
    - "[ ] [Specific result to achieve]"
    - "[ ] [Behavior to demonstrate]"
    - "[ ] [Metric to match]"
```

BE THOROUGH. Miss nothing. The output should be a complete blueprint for reproduction."""

# Traditional Code Planning Prompt (No Segmentation)
#
# Prompt text for the planning pass that merges the two earlier analyses
# (comprehensive paper analysis + complete algorithm extraction) into one
# `complete_reproduction_plan` YAML document.
# The prompt requires exactly five sections -- file_structure,
# implementation_components, validation_approach, environment_setup and
# implementation_strategy -- gives a per-section character budget
# (8000-10000 characters in total), asks for roughly 20 files, and orders
# README.md / requirements.txt last in the implementation sequence.
CODE_PLANNING_PROMPT_TRADITIONAL = """You are creating a DETAILED, COMPLETE reproduction plan by integrating comprehensive analysis results.

# INPUT
You receive two exhaustive analyses:
1. **Comprehensive Paper Analysis**: Complete paper structure, components, and requirements
2. **Complete Algorithm Extraction**: All algorithms, formulas, pseudocode, and technical details

# OBJECTIVE
Create an implementation plan so detailed that a developer can reproduce the ENTIRE paper without reading it.

# CRITICAL: COMPLETE OUTPUT REQUIREMENT
⚠️ MANDATORY: You MUST generate ALL 5 sections completely. DO NOT stop early or truncate any section.

## Output Completeness Strategy:
🎯 **Your #1 Priority**: Ensure ALL 5 sections are present and complete before finishing your response.

## Content Balance Guidelines (STRICTLY FOLLOW):
- **Section 1 (File Structure)**: ~800-1000 chars - Brief file listing with priority order
- **Section 2 (Implementation Components)**: ~3000-4000 chars - CORE section with all algorithms/components
- **Section 3 (Validation)**: ~2000-2500 chars - Experiments and expected results
- **Section 4 (Environment)**: ~800-1000 chars - Dependencies and requirements
- **Section 5 (Implementation Strategy)**: ~1500-2000 chars - Step-by-step approach

📏 **Total Target**: 8000-10000 characters for complete plan

⚠️ **Self-Check Before Finishing**:
- Did you include file_structure section? ✓
- Did you include implementation_components section? ✓
- Did you include validation_approach section? ✓
- Did you include environment_setup section? ✓
- Did you include implementation_strategy section? ✓
- If ANY answer is NO, continue writing until ALL sections are complete!

## File Priority Guidelines:
🔧 **Implementation Priority Order**:
1. **FIRST**: Core algorithm/model files (highest priority)
2. **SECOND**: Supporting modules and utilities
3. **THIRD**: Experiment and evaluation scripts
4. **FOURTH**: Configuration and data handling
5. **LAST**: Documentation files (README.md, requirements.txt) - These should be created AFTER core implementation

Note: README and requirements.txt are maintenance files that depend on the final implementation, so plan them last but INCLUDE them in the file structure.

# DETAILED SYNTHESIS PROCESS

## 1. MERGE ALL INFORMATION
Combine EVERYTHING from both analyses:
- Every algorithm with its pseudocode
- Every component with its architecture
- Every hyperparameter with its value
- Every experiment with expected results

## 2. MAP CONTENT TO IMPLEMENTATION

For each component you identify, specify how it will be implemented:

```
# DESIGN YOUR MAPPING: Connect paper content to code organization
[For each algorithm/component/method in the paper]:
  - What it does and where it's described in the paper
  - How you'll organize the code (files, classes, functions - your choice)
  - What specific formulas, algorithms, or procedures need implementation
  - Dependencies and relationships with other components
  - Implementation approach that makes sense for this specific paper
```

## 3. EXTRACT ALL TECHNICAL DETAILS

Identify every technical detail that needs implementation:

```
# COMPREHENSIVE TECHNICAL EXTRACTION:
[Gather all implementation-relevant details from the paper]:
  - All algorithms with complete pseudocode and mathematical formulations
  - All parameters, hyperparameters, and configuration values
  - All architectural details (if applicable to your paper type)
  - All experimental procedures and evaluation methods
  - Any implementation hints, tricks, or special considerations mentioned
```

# COMPREHENSIVE OUTPUT FORMAT

```yaml
complete_reproduction_plan:
  paper_info:
    title: "[Full paper title]"
    core_contribution: "[Main innovation being reproduced]"

  # SECTION 1: File Structure Design

  # DESIGN YOUR OWN STRUCTURE: Create a file organization that best serves this specific paper
  # - Analyze what the paper contains (algorithms, models, experiments, systems, etc.)
  # - Organize files and directories in the most logical way for implementation
  # - Create meaningful names and groupings based on paper content
  # - Keep it clean, intuitive, and focused on what actually needs to be implemented
  # - INCLUDE documentation files (README.md, requirements.txt) but mark them for LAST implementation

  file_structure: |
    [Design and specify your own project structure here - KEEP THIS BRIEF]
    [Include ALL necessary files including README.md and requirements.txt]
    [Organize based on what this paper actually contains and needs]
    [Create directories and files that make sense for this specific implementation]
    [IMPORTANT: Include executable files (e.g., main.py, run.py, train.py, demo.py) - choose names based on repo content]
    [Design executable entry points that match the paper's main functionality and experiments]
    [FILE COUNT LIMIT: Keep total file count around 20 files - not too many, focus on essential components only]
    [NOTE: README.md and requirements.txt should be implemented LAST after all code files]

  # SECTION 2: Implementation Components

  # IDENTIFY AND SPECIFY: What needs to be implemented based on this paper
  # - List all algorithms, models, systems, or components mentioned
  # - Map each to implementation details and file locations
  # - Include formulas, pseudocode, and technical specifications
  # - Organize in whatever way makes sense for this paper

  implementation_components: |
    [List and specify all components that need implementation]
    [For each component: purpose, location, algorithms, formulas, technical details]
    [Organize and structure this based on the paper's actual content]

  # SECTION 3: Validation & Evaluation

  # DESIGN VALIDATION: How to verify the implementation works correctly
  # - Define what experiments, tests, or proofs are needed
  # - Specify expected results from the paper (figures, tables, theorems)
  # - Design validation approach appropriate for this paper's domain
  # - Include setup requirements and success criteria

  validation_approach: |
    [Design validation strategy appropriate for this paper]
    [Specify experiments, tests, or mathematical verification needed]
    [Define expected results and success criteria]
    [Include any special setup or evaluation requirements]

  # SECTION 4: Environment & Dependencies

  # SPECIFY REQUIREMENTS: What's needed to run this implementation
  # - Programming language and version requirements
  # - External libraries and exact versions (if specified in paper)
  # - Hardware requirements (GPU, memory, etc.)
  # - Any special setup or installation steps

  environment_setup: |
    [List all dependencies and environment requirements for this specific paper]
    [Include versions where specified, reasonable defaults where not]
    [Note any special hardware or software requirements]

  # SECTION 5: Implementation Strategy

  # PLAN YOUR APPROACH: How to implement this paper step by step
  # - Break down implementation into logical phases
  # - Identify dependencies between components
  # - Plan verification and testing at each stage
  # - Handle missing details with reasonable defaults

  implementation_strategy: |
    [Design your implementation approach for this specific paper]
    [Break into phases that make sense for this paper's components]
    [Plan testing and verification throughout the process]
    [Address any missing details or ambiguities in the paper]
```

BE EXHAUSTIVE. Every algorithm, every formula, every parameter, every file should be specified in complete detail."""


================================================
FILE: requirements.txt
================================================
# Core Dependencies
aiofiles>=0.8.0
aiohttp>=3.8.0
anthropic
asyncio-mqtt
docling

# New UI Backend Dependencies
fastapi>=0.104.0
google-genai
mcp-agent
mcp-server-git
openapi
nest_asyncio
openai
pathlib2
pydantic-settings>=2.0.0
PyPDF2>=2.0.0
python-multipart>=0.0.6
PyYAML>=6.0
reportlab>=3.5.0
streamlit
uvicorn>=0.24.0
websockets>=12.0


================================================
FILE: run.bat
================================================
@echo off
REM DeepCode New UI - Windows Launcher
REM Verifies that Python and Node.js are on PATH, then runs the deepcode.py
REM launcher that sits in the same directory as this batch file.

echo.
echo ========================================
echo   DeepCode New UI - Windows Launcher
echo ========================================
echo.

REM Check Python
REM Output is discarded; only the exit code matters. "errorlevel 1" is true
REM when the command failed or could not be found.
python --version >nul 2>&1
if errorlevel 1 (
    echo [ERROR] Python not found. Please install Python 3.9+
    pause
    exit /b 1
)

REM Check Node.js
node --version >nul 2>&1
if errorlevel 1 (
    echo [ERROR] Node.js not found. Please install Node.js 18+
    echo Download from: https://nodejs.org/
    pause
    exit /b 1
)

echo [OK] Python found
echo [OK] Node.js found
echo.

REM Run the Python launcher
REM %~dp0 expands to the drive and directory of this script, so the launcher
REM is found regardless of the current working directory.
python "%~dp0deepcode.py"

REM Keep the console window open so the user can read the output.
pause


================================================
FILE: run.sh
================================================
#!/bin/bash
# DeepCode New UI one-click launcher script.
# Starts the backend (uvicorn) and the frontend dev server found under
# new_ui/ and stops both when the script is interrupted.

# Abort as soon as any unguarded command fails.
set -e

# Absolute directory of this script, so the launcher works from any cwd.
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
NEW_UI_DIR="$SCRIPT_DIR/new_ui"

# Color definitions (ANSI escape codes; NC resets the color)
RED='\033[0;31m'
GREEN='\033[0;32m'
BLUE='\033[0;34m'
YELLOW='\033[1;33m'
NC='\033[0m'

echo "🚀 启动 DeepCode New UI..."
echo ""

# ============ Automatic Python environment setup ============
# Pick the Python environment used for the rest of the script.
# Priority: active conda env > active virtualenv > local .venv > local venv
#           > conda env named exactly "deepcode".
# Returns 0 when an environment is in use and 1 when none was found (system
# Python is used). Callers running under `set -e` must guard the call, e.g.
# `setup_python_env || true`, or the non-zero return aborts the script.
setup_python_env() {
    if [ -n "$CONDA_PREFIX" ]; then
        # Quoted so a prefix containing spaces does not break basename
        echo -e "${GREEN}✓ 使用 conda 环境: $(basename "$CONDA_PREFIX")${NC}"
        export PATH="$CONDA_PREFIX/bin:$PATH"
        return 0
    fi

    if [ -n "$VIRTUAL_ENV" ]; then
        echo -e "${GREEN}✓ 使用 virtualenv: $(basename "$VIRTUAL_ENV")${NC}"
        export PATH="$VIRTUAL_ENV/bin:$PATH"
        return 0
    fi

    # Try to auto-activate a project-local virtualenv. Test for the activate
    # script itself rather than the directory: a directory without
    # bin/activate would make `source` fail instead of falling through.
    local venv_name
    for venv_name in .venv venv; do
        if [ -f "$SCRIPT_DIR/$venv_name/bin/activate" ]; then
            echo -e "${YELLOW}⚡ 自动激活 $venv_name 环境${NC}"
            source "$SCRIPT_DIR/$venv_name/bin/activate"
            return 0
        fi
    done

    # Try to auto-activate the conda "deepcode" environment
    if command -v conda &> /dev/null; then
        # Compare the env-name column exactly. A plain substring grep also
        # matches names like "deepcode-dev" or env paths that merely contain
        # "deepcode", after which `conda activate deepcode` would fail.
        if conda env list 2>/dev/null | awk '{print $1}' | grep -qx "deepcode"; then
            echo -e "${YELLOW}⚡ 自动激活 conda deepcode 环境${NC}"
            # Load conda's shell functions so `conda activate` works in a script
            eval "$(conda shell.bash hook)"
            conda activate deepcode
            export PATH="$CONDA_PREFIX/bin:$PATH"
            return 0
        fi
    fi

    echo -e "${YELLOW}⚠ 未检测到虚拟环境，使用系统 Python${NC}"
    return 1
}

# setup_python_env returns 1 when it falls back to the system Python. That is
# only a warning, but under `set -e` an unguarded non-zero return would abort
# the script right after the warning is printed, so the status is ignored here.
setup_python_env || true
echo -e "📍 Python: $(which python)"
echo ""
# ============================================

# Cleanup handler - uses process groups so that child processes are
# terminated together with the backend/frontend launchers.
# $1: exit status to finish with (defaults to 0).
cleanup() {
    local exit_code=${1:-0}
    # Disarm the traps first: the `exit` at the end would otherwise re-enter
    # this handler through the EXIT trap and run the shutdown a second time.
    trap - SIGINT SIGTERM EXIT
    echo ""
    echo "🛑 正在关闭服务..."
    # Kill the backend process and its children: a negative PID addresses the
    # whole process group; fall back to the single PID if that fails.
    if [ -n "$BACKEND_PID" ]; then
        kill -- "-$BACKEND_PID" 2>/dev/null || kill "$BACKEND_PID" 2>/dev/null || true
    fi
    # Kill the frontend process and its children
    if [ -n "$FRONTEND_PID" ]; then
        kill -- "-$FRONTEND_PID" 2>/dev/null || kill "$FRONTEND_PID" 2>/dev/null || true
    fi
    # Extra sweep: make sure the ports are released
    pkill -f "uvicorn main:app.*--port 8000" 2>/dev/null || true
    pkill -f "vite.*5173" 2>/dev/null || true
    echo "✓ 所有服务已停止"
    exit "$exit_code"
}
# Ctrl+C / SIGTERM are the normal way to stop the launcher, so they exit 0.
# Any other exit keeps its own status instead of being masked as success
# (previously every exit path, including `exit 1`, ended with status 0).
trap 'cleanup 0' SIGINT SIGTERM
trap 'cleanup $?' EXIT

# Check that the new_ui directory exists next to this script; nothing can be
# started without it.
if [ ! -d "$NEW_UI_DIR" ]; then
    echo "❌ 错误: new_ui 目录不存在"
    exit 1
fi

# Free an occupied TCP port by force-killing the process(es) listening on it.
# $1: port number.
cleanup_ports() {
    local port=$1
    local pids
    # Only match LISTEN sockets: a bare `lsof -ti :PORT` also reports clients
    # that merely have a connection to the port (e.g. a browser tab), and
    # those must not be killed. `|| true` keeps `set -e` from aborting when
    # lsof finds nothing (it exits non-zero) or is not installed.
    pids=$(lsof -t -iTCP:"$port" -sTCP:LISTEN 2>/dev/null || true)
    if [ -n "$pids" ]; then
        # lsof prints one PID per line; the unquoted echo flattens them onto
        # a single line for the message.
        echo -e "${YELLOW}⚠ 端口 $port 被占用 (PID: $(echo $pids))，正在清理...${NC}"
        # Intentionally unquoted so that every PID becomes its own argument
        kill -9 $pids 2>/dev/null || true
        sleep 1
        echo -e "${GREEN}✓ 端口 $port 已释放${NC}"
    fi
}

# Make sure the backend (8000) and frontend (5173) ports are free
cleanup_ports 8000
cleanup_ports 5173

# Start the backend
echo -e "${BLUE}[1/2] 启动后端服务...${NC}"
cd "$NEW_UI_DIR/backend"

# Install dependencies (if needed).
# `python -m pip` installs into the same interpreter that was just probed and
# that runs uvicorn below; a bare `pip` found on PATH may belong to a
# different Python installation.
if ! python -c "import fastapi" 2>/dev/null; then
    echo -e "${YELLOW}安装后端依赖...${NC}"
    python -m pip install fastapi uvicorn pydantic-settings python-multipart aiofiles websockets -q
fi

# Use setsid to create a new process group (if available) so the whole group
# can be killed on shutdown; otherwise just run in the background.
if command -v setsid &> /dev/null; then
    setsid python -m uvicorn main:app --host 0.0.0.0 --port 8000 --reload &
else
    python -m uvicorn main:app --host 0.0.0.0 --port 8000 --reload &
fi
BACKEND_PID=$!
# Give the server a moment to either bind the port or die
sleep 2

# Check that the backend process is really still alive (`kill -0` sends no
# signal, it only tests that the PID exists)
if ! kill -0 $BACKEND_PID 2>/dev/null; then
    echo -e "${RED}✗ 后端启动失败，可能端口被占用${NC}"
    echo -e "${YELLOW}  尝试: lsof -i :8000 查看占用端口的进程${NC}"
else
    echo -e "${GREEN}✓ 后端已启动: http://localhost:8000${NC}"
fi

# Start the frontend
echo -e "${BLUE}[2/2] 启动前端服务...${NC}"
cd "$NEW_UI_DIR/frontend"

# A missing node_modules directory is treated as a first run: install the
# frontend dependencies before starting the dev server.
if [ ! -d "node_modules" ]; then
    echo -e "${YELLOW}安装前端依赖 (首次运行)...${NC}"
    npm install
fi

# Use setsid to create a new process group (if available)
if command -v setsid &> /dev/null; then
    setsid npm run dev &
else
    npm run dev &
fi
# PID of the background job just started
FRONTEND_PID=$!
sleep 3

# Print the summary banner with the frontend, backend and API docs URLs
echo ""
echo "╔════════════════════════════════════════╗"
echo -e "║  ${GREEN}DeepCode New UI 已启动!${NC}              ║"
echo "╠════════════════════════════════════════╣"
echo "║                                        ║"
echo "║  🌐 前端: http://localhost:5173        ║"
echo "║  🔧 后端: http://localhost:8000        ║"
echo "║  📚 API:  http://localhost:8000/docs   ║"
echo "║                                        ║"
echo "║  按 Ctrl+C 停止所有服务                ║"
echo "╚════════════════════════════════════════╝"
echo ""

# Block until the background jobs started above have exited
wait


================================================
FILE: schema/mcp-agent.config.schema.json
================================================
{
  "$defs": {
    "LogPathSettings": {
      "description": "Settings for configuring log file paths with dynamic elements like timestamps or session IDs.",
      "properties": {
        "path_pattern": {
          "default": "logs/mcp-agent-{unique_id}.jsonl",
          "title": "Path Pattern",
          "type": "string",
          "description": "Path pattern for log files with a {unique_id} placeholder"
        },
        "unique_id": {
          "default": "timestamp",
          "enum": [
            "timestamp",
            "session_id"
          ],
          "title": "Unique Id",
          "type": "string",
          "description": "Type of unique identifier to use in the log filename"
        },
        "timestamp_format": {
          "default": "%Y%m%d_%H%M%S",
          "title": "Timestamp Format",
          "type": "string",
          "description": "Format string for timestamps when unique_id is set to timestamp"
        }
      },
      "title": "LogPathSettings",
      "type": "object"
    },
    "AnthropicSettings": {
      "additionalProperties": true,
      "description": "Settings for using Anthropic models in the MCP Agent application.",
      "properties": {
        "api_key": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Api Key"
        }
      },
      "title": "AnthropicSettings",
      "type": "object"
    },
    "CohereSettings": {
      "additionalProperties": true,
      "description": "Settings for using Cohere models in the MCP Agent application.",
      "properties": {
        "api_key": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Api Key"
        }
      },
      "title": "CohereSettings",
      "type": "object"
    },
    "LoggerSettings": {
      "description": "Logger settings for the MCP Agent application.",
      "properties": {
        "type": {
          "default": "console",
          "enum": [
            "none",
            "console",
            "file",
            "http"
          ],
          "title": "Type",
          "type": "string"
        },
        "transports": {
          "default": [
            "console"
          ],
          "items": {
            "enum": [
              "none",
              "console",
              "file",
              "http"
            ],
            "type": "string"
          },
          "title": "Transports",
          "type": "array",
          "description": "List of transports to use (can enable multiple simultaneously)"
        },
        "level": {
          "default": "info",
          "enum": [
            "debug",
            "info",
            "warning",
            "error"
          ],
          "title": "Level",
          "type": "string",
          "description": "Minimum logging level"
        },
        "progress_display": {
          "default": true,
          "title": "Progress Display",
          "type": "boolean",
          "description": "Enable or disable the progress display"
        },
        "path": {
          "default": "mcp-agent.jsonl",
          "title": "Path",
          "type": "string",
          "description": "Path to log file, if logger 'type' is 'file'."
        },
        "path_settings": {
          "anyOf": [
            {
              "$ref": "#/$defs/LogPathSettings"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Path Settings",
          "description": "Advanced settings for log file paths with dynamic elements like timestamps or session IDs"
        },
        "batch_size": {
          "default": 100,
          "title": "Batch Size",
          "type": "integer",
          "description": "Number of events to accumulate before processing"
        },
        "flush_interval": {
          "default": 2.0,
          "title": "Flush Interval",
          "type": "number",
          "description": "How often to flush events in seconds"
        },
        "max_queue_size": {
          "default": 2048,
          "title": "Max Queue Size",
          "type": "integer",
          "description": "Maximum queue size for event processing"
        },
        "http_endpoint": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Http Endpoint",
          "description": "HTTP endpoint for event transport"
        },
        "http_headers": {
          "anyOf": [
            {
              "additionalProperties": {
                "type": "string"
              },
              "type": "object"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Http Headers",
          "description": "HTTP headers for event transport"
        },
        "http_timeout": {
          "default": 5.0,
          "title": "Http Timeout",
          "type": "number",
          "description": "HTTP timeout seconds for event transport"
        }
      },
      "title": "LoggerSettings",
      "type": "object"
    },
    "MCPRootSettings": {
      "additionalProperties": true,
      "description": "Represents a root directory configuration for an MCP server.",
      "properties": {
        "uri": {
          "title": "Uri",
          "type": "string",
          "description": "The URI identifying the root. Must start with file://"
        },
        "name": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Name",
          "description": "Optional name for the root."
        },
        "server_uri_alias": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Server Uri Alias",
          "description": "Optional URI alias for presentation to the server"
        }
      },
      "required": [
        "uri"
      ],
      "title": "MCPRootSettings",
      "type": "object"
    },
    "MCPServerAuthSettings": {
      "additionalProperties": true,
      "description": "Represents authentication configuration for a server.",
      "properties": {
        "api_key": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Api Key"
        }
      },
      "title": "MCPServerAuthSettings",
      "type": "object"
    },
    "MCPServerSettings": {
      "description": "Represents the configuration for an individual server.",
      "properties": {
        "name": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Name",
          "description": "The name of the server."
        },
        "description": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Description",
          "description": "The description of the server."
        },
        "transport": {
          "default": "stdio",
          "enum": [
            "stdio",
            "sse"
          ],
          "title": "Transport",
          "type": "string",
          "description": "The transport mechanism."
        },
        "command": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Command",
          "description": "The command to execute the server (e.g. npx)."
        },
        "args": {
          "anyOf": [
            {
              "items": {
                "type": "string"
              },
              "type": "array"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Args",
          "description": "The arguments for the server command."
        },
        "read_timeout_seconds": {
          "anyOf": [
            {
              "type": "integer"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Read Timeout Seconds",
          "description": "The timeout in seconds for the server connection."
        },
        "url": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Url",
          "description": "The URL for the server (e.g. for SSE transport)."
        },
        "auth": {
          "anyOf": [
            {
              "$ref": "#/$defs/MCPServerAuthSettings"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "description": "The authentication configuration for the server."
        },
        "roots": {
          "anyOf": [
            {
              "items": {
                "$ref": "#/$defs/MCPRootSettings"
              },
              "type": "array"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Roots",
          "description": "Root directories this server has access to."
        },
        "env": {
          "anyOf": [
            {
              "additionalProperties": {
                "type": "string"
              },
              "type": "object"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Env",
          "description": "Environment variables to pass to the server process."
        }
      },
      "title": "MCPServerSettings",
      "type": "object"
    },
    "MCPSettings": {
      "additionalProperties": true,
      "description": "Configuration for all MCP servers.",
      "properties": {
        "servers": {
          "additionalProperties": {
            "$ref": "#/$defs/MCPServerSettings"
          },
          "default": {},
          "title": "Servers",
          "type": "object"
        }
      },
      "title": "MCPSettings",
      "type": "object"
    },
    "OpenAISettings": {
      "additionalProperties": true,
      "description": "Settings for using OpenAI models in the MCP Agent application.",
      "properties": {
        "api_key": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Api Key"
        },
        "reasoning_effort": {
          "default": "medium",
          "enum": [
            "low",
            "medium",
            "high"
          ],
          "title": "Reasoning Effort",
          "type": "string"
        },
        "base_url": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Base Url"
        }
      },
      "title": "OpenAISettings",
      "type": "object"
    },
    "AzureSettings": {
      "additionalProperties": true,
      "description": "Settings for using Azure models in the MCP Agent application.",
      "properties": {
        "api_key": {
          "anyOf": [
            {
              "type": "string"
            }
          ],
          "default": null,
          "title": "Api Key"
        },
        "endpoint": {
          "anyOf": [
            {
              "type": "string"
            }
          ],
          "default": null,
          "title": "Azure Endpoint"
        },
        "api_version": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "API Version"
        }
      },
      "required": [
        "api_key",
        "endpoint"
      ],
      "title": "AzureSettings",
      "type": "object"
    },
    "BedrockSettings": {
      "additionalProperties": true,
      "description": "Settings for using AWS Bedrock models in the MCP Agent application.",
      "properties": {
        "aws_region": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Region"
        },
        "aws_access_key_id": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Access Key Id"
        },
        "aws_secret_access_key": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Secret Access Key"
        },
        "aws_session_token": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Session Token"
        },
        "profile": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Profile"
        }
      },
      "title": "BedrockSettings",
      "type": "object"
    },
    "OpenTelemetrySettings": {
      "description": "OTEL settings for the MCP Agent application.",
      "properties": {
        "enabled": {
          "default": true,
          "title": "Enabled",
          "type": "boolean"
        },
        "service_name": {
          "default": "mcp-agent",
          "title": "Service Name",
          "type": "string"
        },
        "service_instance_id": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Service Instance Id"
        },
        "service_version": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Service Version"
        },
        "otlp_endpoint": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Otlp Endpoint",
          "description": "OTLP endpoint for OpenTelemetry tracing"
        },
        "console_debug": {
          "default": false,
          "title": "Console Debug",
          "type": "boolean",
          "description": "Log spans to console"
        },
        "sample_rate": {
          "default": 1.0,
          "title": "Sample Rate",
          "type": "number",
          "description": "Sample rate for tracing (1.0 = sample everything)"
        }
      },
      "title": "OpenTelemetrySettings",
      "type": "object"
    },
    "TemporalSettings": {
      "description": "Temporal settings for the MCP Agent application.",
      "properties": {
        "host": {
          "title": "Host",
          "type": "string"
        },
        "namespace": {
          "default": "default",
          "title": "Namespace",
          "type": "string"
        },
        "task_queue": {
          "title": "Task Queue",
          "type": "string"
        },
        "api_key": {
          "anyOf": [
            {
              "type": "string"
            },
            {
              "type": "null"
            }
          ],
          "default": null,
          "title": "Api Key"
        }
      },
      "required": [
        "host",
        "task_queue"
      ],
      "title": "TemporalSettings",
      "type": "object"
    }
  },
  "additionalProperties": true,
  "description": "Configuration schema for MCP Agent applications",
  "properties": {
    "mcp": {
      "anyOf": [
        {
          "$ref": "#/$defs/MCPSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": {
        "servers": {}
      },
      "description": "MCP config, such as MCP servers"
    },
    "execution_engine": {
      "default": "asyncio",
      "enum": [
        "asyncio",
        "temporal"
      ],
      "title": "Execution Engine",
      "type": "string",
      "description": "Execution engine for the MCP Agent application"
    },
    "temporal": {
      "anyOf": [
        {
          "$ref": "#/$defs/TemporalSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Settings for Temporal workflow orchestration"
    },
    "anthropic": {
      "anyOf": [
        {
          "$ref": "#/$defs/AnthropicSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Settings for using Anthropic models in the MCP Agent application"
    },
    "cohere": {
      "anyOf": [
        {
          "$ref": "#/$defs/CohereSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Settings for using Cohere models in the MCP Agent application"
    },
    "openai": {
      "anyOf": [
        {
          "$ref": "#/$defs/OpenAISettings"
        },
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Settings for using OpenAI models in the MCP Agent application"
    },
    "azure": {
      "anyOf": [
        {
          "$ref": "#/$defs/AzureSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Settings for using Azure models in the MCP Agent application"
    },
    "bedrock": {
      "anyOf": [
        {
          "$ref": "#/$defs/BedrockSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": null,
      "description": "Settings for using Bedrock models in the MCP Agent application"
    },
    "otel": {
      "anyOf": [
        {
          "$ref": "#/$defs/OpenTelemetrySettings"
        },
        {
          "type": "null"
        }
      ],
      "default": {
        "enabled": true,
        "service_name": "mcp-agent",
        "service_instance_id": null,
        "service_version": null,
        "otlp_endpoint": null,
        "console_debug": false,
        "sample_rate": 1.0
      },
      "description": "OpenTelemetry logging settings for the MCP Agent application"
    },
    "logger": {
      "anyOf": [
        {
          "$ref": "#/$defs/LoggerSettings"
        },
        {
          "type": "null"
        }
      ],
      "default": {
        "type": "console",
        "transports": [],
        "level": "info",
        "progress_display": true,
        "path": "mcp-agent.jsonl",
        "path_settings": null,
        "batch_size": 100,
        "flush_interval": 2.0,
        "max_queue_size": 2048,
        "http_endpoint": null,
        "http_headers": null,
        "http_timeout": 5.0
      },
      "description": "Logger settings for the MCP Agent application"
    }
  },
  "title": "MCP Agent Configuration Schema",
  "type": "object",
  "$schema": "http://json-schema.org/draft-07/schema#"
}


================================================
FILE: setup.py
================================================
import setuptools
from pathlib import Path
import os


# Reading the long description from README.md
def read_long_description():
    """Return the text of ``README.md`` for use as the package long description.

    The file is looked up relative to the current working directory. When it
    is absent, a one-line project tagline is returned instead so that the
    build does not fail.
    """
    fallback = "DeepCode: Open Agentic Coding (Paper2Code & Text2Web & Text2Backend)"
    try:
        with open("README.md", encoding="utf-8") as readme:
            text = readme.read()
    except FileNotFoundError:
        return fallback
    return text


# Retrieving metadata from __init__.py
def retrieve_metadata():
    """Read ``__author__``, ``__version__`` and ``__url__`` from ``__init__.py``.

    The file is located next to this module (``os.path.dirname(__file__)``).
    Each top-level assignment of one of the wanted names is parsed textually
    (the package is not imported).

    Returns:
        dict mapping each of the three names to its string value, with the
        surrounding quotes removed.

    Raises:
        ValueError: if any of the three names is not assigned in the file.
    """
    vars2find = ["__author__", "__version__", "__url__"]
    vars2readme = {}

    # Use definitive path relative to setup.py location
    init_file_path = os.path.join(os.path.dirname(__file__), "__init__.py")

    with open(init_file_path, encoding="utf-8") as f:
        for line in f:
            # Split on the FIRST "=" only, so values that themselves contain
            # "=" (e.g. a URL with a query string) are kept intact.
            lhs, sep, rhs = line.partition("=")
            if not sep:
                continue
            # Tolerate an annotated assignment (`__version__: str = "..."`).
            # Only trailing whitespace is removed so that indented (non
            # top-level) assignments are still ignored.
            name = lhs.split(":", 1)[0].rstrip()
            if name in vars2find:
                # Trim whitespace and the enclosing quotes only; whitespace
                # inside the value (e.g. "Jane Doe") must be preserved.
                vars2readme[name] = rhs.strip().strip("\"'")

    # Checking if all required variables are found
    missing_vars = [v for v in vars2find if v not in vars2readme]
    if missing_vars:
        raise ValueError(
            f"Missing required metadata variables in __init__.py: {missing_vars}"
        )

    return vars2readme


# Reading dependencies from requirements.txt
def read_requirements():
    """Return the requirement specifiers listed in ``./requirements.txt``.

    Blank lines and comment lines are skipped. Each line is stripped *before*
    the comment check so that indented ``# ...`` comments are not mistaken for
    requirements.

    Returns:
        list of requirement strings in file order; an empty list (after
        printing a warning) when the file does not exist.
    """
    try:
        with open("./requirements.txt", encoding="utf-8") as f:
            stripped_lines = (line.strip() for line in f)
            return [
                req for req in stripped_lines if req and not req.startswith("#")
            ]
    except FileNotFoundError:
        print(
            "Warning: 'requirements.txt' not found. No dependencies will be installed."
        )
        return []


# Gather everything setup() needs up front. retrieve_metadata() raises
# ValueError when __author__/__version__/__url__ is missing from __init__.py,
# so a broken package fails here rather than producing incomplete metadata.
metadata = retrieve_metadata()
long_description = read_long_description()
requirements = read_requirements()

setuptools.setup(
    name="deepcode-hku",
    url=metadata["__url__"],
    version=metadata["__version__"],
    author=metadata["__author__"],
    description="AI Research Engine - Transform research papers into working code automatically",
    long_description=long_description,
    long_description_content_type="text/markdown",
    # Discover packages automatically, leaving out tests, docs and tool caches.
    packages=setuptools.find_packages(
        exclude=("tests*", "docs*", ".history*", ".git*", ".ruff_cache*")
    ),
    # The top-level deepcode.py module is shipped in addition to the packages;
    # the console script below points at it.
    py_modules=["deepcode"],
    classifiers=[
        "Development Status :: 4 - Beta",
        "Programming Language :: Python :: 3",
        "License :: OSI Approved :: MIT License",
        "Operating System :: OS Independent",
        "Intended Audience :: Developers",
        "Intended Audience :: Science/Research",
        "Topic :: Software Development :: Libraries :: Python Modules",
        "Topic :: Scientific/Engineering :: Artificial Intelligence",
        "Topic :: Text Processing :: Linguistic",
    ],
    python_requires=">=3.9",
    install_requires=requirements,
    include_package_data=True,
    # Installs a `deepcode` command that calls main() in the deepcode module.
    entry_points={
        "console_scripts": [
            "deepcode=deepcode:main",
        ],
    },
    # The .get() fallbacks are defensive only: retrieve_metadata() has already
    # guaranteed that "__url__" is present.
    project_urls={
        "Documentation": metadata.get("__url__", ""),
        "Source": metadata.get("__url__", ""),
        "Tracker": f"{metadata.get('__url__', '')}/issues"
        if metadata.get("__url__")
        else "",
    },
)


================================================
FILE: tools/__init__.py
================================================


================================================
FILE: tools/bocha_search_server.py
================================================
import os
import sys
import json

import httpx
from dotenv import load_dotenv
from mcp.server.fastmcp import FastMCP

# Load variables from a .env file (if one is found) into the process
# environment, so BOCHA_API_KEY can be supplied that way.
load_dotenv()


# Initialize FastMCP server
# NOTE(review): the descriptive text is passed via a `prompt` keyword; confirm
# that the installed mcp SDK actually consumes it (FastMCP documents an
# `instructions` parameter for server-level guidance).
server = FastMCP(
    "bocha-search-mcp",
    prompt="""
# Bocha Search MCP Server

Bocha is a Chinese search engine for AI, This server provides tools for searching the web using Bocha Search API.
It allows you to get enhanced search details from billions of web documents, including weather, news, wikis, healthcare, train tickets, images, and more.

## Available Tools

### 1. bocha_web_search
Search with Bocha Web Search and get enhanced search details from billions of web documents, including page titles, urls, summaries, site names, site icons, publication dates, image links, and more.

### 2. bocha_ai_search
Search with Bocha AI Search, recognizes the semantics of search terms and additionally returns structured modal cards with content from vertical domains.

## Output Format

All search results will be formatted as text with clear sections for each
result item, including:

- Bocha Web search: Title, URL, Description, Published date and Site name
- Bocha AI search: Title, URL, Description, Published date, Site name, and structured data card

If the API key is missing or invalid, appropriate error messages will be returned.
""",
)


@server.tool()
async def bocha_web_search(
    query: str, freshness: str = "noLimit", count: int = 10
) -> str:
    """Search with Bocha Web Search and get enhanced search details from billions of web documents,
    including page titles, urls, summaries, site names, site icons, publication dates, image links, and more.

    Args:
        query: Search query (required)
        freshness: The time range for the search results. (Available options YYYY-MM-DD, YYYY-MM-DD..YYYY-MM-DD, noLimit, oneYear, oneMonth, oneWeek, oneDay. Default is noLimit)
        count: Number of results (1-50, default 10)
    """
    # Get API key from environment
    boch_api_key = os.environ.get("BOCHA_API_KEY", "")

    if not boch_api_key:
        return (
            "Error: Bocha API key is not configured. Please set the "
            "BOCHA_API_KEY environment variable."
        )

    # Endpoint
    endpoint = "https://api.bochaai.com/v1/web-search?utm_source=bocha-mcp-local"

    try:
        payload = {
            "query": query,
            "summary": True,
            "freshness": freshness,
            "count": count,
        }

        headers = {
            "Authorization": f"Bearer {boch_api_key}",
            "Content-Type": "application/json",
        }

        async with httpx.AsyncClient() as client:
            response = await client.post(
                endpoint, headers=headers, json=payload, timeout=10.0
            )

        # The body of a non-streaming response is already loaded, so the
        # client can be released before the payload is inspected.
        response.raise_for_status()
        resp = response.json()

        # A missing or null "data" member is reported as a search error.
        data = resp.get("data") if isinstance(resp, dict) else None
        if not isinstance(data, dict):
            return "Search error."

        web_pages = data.get("webPages")
        items = web_pages.get("value") if isinstance(web_pages, dict) else None
        if not items:
            return "No results found."

        results = []
        for item in items:
            if not isinstance(item, dict):
                continue
            # Individual fields are looked up leniently so that one result
            # lacking e.g. a publication date does not fail the whole search.
            results.append(
                f"Title: {item.get('name', 'N/A')}\n"
                f"URL: {item.get('url', 'N/A')}\n"
                f"Description: {item.get('summary', 'N/A')}\n"
                f"Published date: {item.get('datePublished', 'N/A')}\n"
                f"Site name: {item.get('siteName', 'N/A')}"
            )

        if not results:
            return "No results found."

        return "\n\n".join(results)

    except httpx.HTTPStatusError as e:
        return f"Bocha Web Search API HTTP error occurred: {e.response.status_code} - {e.response.text}"
    except httpx.RequestError as e:
        return f"Error communicating with Bocha Web Search API: {str(e)}"
    except Exception as e:
        # Tool boundary: report anything unexpected as text instead of raising.
        return f"Unexpected error: {str(e)}"


@server.tool()
async def bocha_ai_search(
    query: str, freshness: str = "noLimit", count: int = 10
) -> str:
    """Search with Bocha AI Search, recognizes the semantics of search terms
    and additionally returns structured modal cards with content from vertical domains.

    Args:
        query: Search query (required)
        freshness: The time range for the search results. (Available options noLimit, oneYear, oneMonth, oneWeek, oneDay. Default is noLimit)
        count: Number of results (1-50, default 10)
    """
    # Get API key from environment
    boch_api_key = os.environ.get("BOCHA_API_KEY", "")

    if not boch_api_key:
        return (
            "Error: Bocha API key is not configured. Please set the "
            "BOCHA_API_KEY environment variable."
        )

    # Endpoint
    endpoint = "https://api.bochaai.com/v1/ai-search?utm_source=bocha-mcp-local"

    try:
        payload = {
            "query": query,
            "freshness": freshness,
            "count": count,
            "answer": False,
            "stream": False,
        }

        headers = {
            "Authorization": f"Bearer {boch_api_key}",
            "Content-Type": "application/json",
        }

        async with httpx.AsyncClient() as client:
            response = await client.post(
                endpoint, headers=headers, json=payload, timeout=10.0
            )

        response.raise_for_status()
        # Keep the parsed body under its own name instead of rebinding
        # `response`.
        body = response.json()
        messages = body.get("messages") if isinstance(body, dict) else None

        results = []
        for message in messages or []:
            # Skip malformed entries rather than failing the whole search.
            if not isinstance(message, dict):
                continue

            content_type = message.get("content_type")
            raw_content = message.get("content")

            # Web pages
            if content_type == "webpage":
                # The content of a message is a JSON-encoded string.
                try:
                    content = json.loads(raw_content)
                except (json.JSONDecodeError, TypeError):
                    content = {}

                items = content.get("value") if isinstance(content, dict) else None
                for item in items or []:
                    if not isinstance(item, dict):
                        continue
                    results.append(
                        f"Title: {item.get('name', 'N/A')}\n"
                        f"URL: {item.get('url', 'N/A')}\n"
                        f"Description: {item.get('summary', 'N/A')}\n"
                        f"Published date: {item.get('datePublished', 'N/A')}\n"
                        f"Site name: {item.get('siteName', 'N/A')}"
                    )
            elif content_type != "image" and raw_content not in (None, "{}"):
                # Every other non-image message is passed through verbatim;
                # non-string content is serialized so the final join cannot
                # fail.
                results.append(
                    raw_content
                    if isinstance(raw_content, str)
                    else json.dumps(raw_content, ensure_ascii=False)
                )

        if not results:
            return "No results found."

        return "\n\n".join(results)

    except httpx.HTTPStatusError as e:
        return f"Bocha AI Search API HTTP error occurred: {e.response.status_code} - {e.response.text}"
    except httpx.RequestError as e:
        return f"Error communicating with Bocha AI Search API: {str(e)}"
    except Exception as e:
        # Tool boundary: report anything unexpected as text instead of raising.
        return f"Unexpected error: {str(e)}"


def main():
    """Initialize and run the MCP server.

    Exits with status 1 (after printing guidance to stderr) when
    BOCHA_API_KEY is unset or empty; otherwise starts the server on the stdio
    transport.
    """

    # Check for required environment variables. An empty value is rejected
    # as well: the search tools treat an empty key as "not configured", so
    # starting the server with one would only make every call fail.
    if not os.environ.get("BOCHA_API_KEY"):
        print(
            "Error: BOCHA_API_KEY environment variable is required",
            file=sys.stderr,
        )
        print(
            "Get a Bocha API key from: https://open.bochaai.com",
            file=sys.stderr,
        )
        sys.exit(1)

    # Status messages go to stderr; stdout is left to the stdio transport.
    print("Starting Bocha Search MCP server...", file=sys.stderr)

    server.run(transport="stdio")


if __name__ == "__main__":
    main()


================================================
FILE: tools/code_implementation_server.py
================================================
#!/usr/bin/env python3
"""
Code Implementation MCP Server

This MCP server provides core functions needed for paper code reproduction:
1. File read/write operations
2. Code execution and testing
3. Code search and analysis
4. Iterative improvement support

Usage:
python tools/code_implementation_server.py
"""

import os
import subprocess
import json
import sys
import io
from pathlib import Path
import re
from typing import Dict, Any, List
import tempfile
import shutil
import logging
from datetime import datetime

# Set standard output encoding to UTF-8
# The comparison is an exact, case-sensitive string match, so a stream that
# reports e.g. "UTF-8" is reconfigured as well.
if sys.stdout.encoding != "utf-8":
    try:
        if hasattr(sys.stdout, "reconfigure"):
            # Switch both streams to UTF-8 in place.
            sys.stdout.reconfigure(encoding="utf-8")
            sys.stderr.reconfigure(encoding="utf-8")
        else:
            # Fallback for stream objects without reconfigure(): re-wrap the
            # underlying binary buffers in new UTF-8 text wrappers.
            sys.stdout = io.TextIOWrapper(sys.stdout.detach(), encoding="utf-8")
            sys.stderr = io.TextIOWrapper(sys.stderr.detach(), encoding="utf-8")
    except Exception as e:
        # Best effort only: keep going with the original encoding.
        # NOTE(review): this warning is written to stdout; if the server is
        # run over a stdio transport, confirm that this cannot interfere
        # with protocol traffic.
        print(f"Warning: Could not set UTF-8 encoding: {e}")

# Import MCP related modules
from mcp.server.fastmcp import FastMCP

# Setup logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Create FastMCP server instance
# (the tool functions below register themselves on it via @mcp.tool())
mcp = FastMCP("code-implementation-server")

# Global variables: workspace directory and operation history
# WORKSPACE_DIR: root directory for file operations; None until
#   initialize_workspace() assigns it.
# OPERATION_HISTORY: list of {"timestamp", "action", "details"} records
#   appended by log_operation().
# CURRENT_FILES: per-file metadata (last_modified, size_bytes, lines) keyed by
#   the workspace-relative path, updated by write_file().
WORKSPACE_DIR = None
OPERATION_HISTORY = []
CURRENT_FILES = {}


def initialize_workspace(workspace_dir: str = None):
    """
    Point the module-level WORKSPACE_DIR at a workspace directory.

    With no argument the workspace becomes ``<cwd>/generate_code`` and nothing
    is created on disk; that default is a placeholder which the workflow is
    expected to override through the set_workspace tool with
    {plan_file_parent}/generate_code.

    Args:
        workspace_dir: Optional workspace directory path. When given, it is
            resolved to an absolute path and created (including parents).
    """
    global WORKSPACE_DIR

    if workspace_dir is not None:
        # Explicit workspace: resolve it and make sure it exists right away.
        explicit_root = Path(workspace_dir).resolve()
        WORKSPACE_DIR = explicit_root
        explicit_root.mkdir(parents=True, exist_ok=True)
        logger.info(f"Workspace initialized: {WORKSPACE_DIR}")
        return

    # Default workspace: creation is deferred until it is actually needed.
    WORKSPACE_DIR = Path.cwd() / "generate_code"


def ensure_workspace_exists():
    """Create the workspace directory on disk if it is not there yet.

    Falls back to initialize_workspace() when no workspace has been chosen.
    """
    global WORKSPACE_DIR

    if WORKSPACE_DIR is None:
        initialize_workspace()

    # Nothing to do when the directory is already present.
    if WORKSPACE_DIR.exists():
        return

    WORKSPACE_DIR.mkdir(parents=True, exist_ok=True)
    logger.info(f"Workspace directory created: {WORKSPACE_DIR}")


def validate_path(path: str) -> Path:
    """Resolve ``path`` against the workspace and ensure it stays inside it.

    Args:
        path: File path, relative to the workspace.

    Returns:
        The resolved absolute path.

    Raises:
        ValueError: if the resolved path lies outside the workspace (for
            example via ``..`` segments or an absolute path).
    """
    if WORKSPACE_DIR is None:
        initialize_workspace()

    # Compare resolved paths on both sides, so a non-normalized workspace
    # root cannot cause false rejections.
    workspace_root = WORKSPACE_DIR.resolve()
    full_path = (workspace_root / path).resolve()

    # Component-wise containment check. A plain string-prefix test would
    # wrongly accept sibling directories that merely share the prefix,
    # e.g. "<root>_evil/x" for the workspace "<root>".
    try:
        full_path.relative_to(workspace_root)
    except ValueError:
        raise ValueError(f"Path {path} is outside workspace scope") from None
    return full_path


def log_operation(action: str, details: Dict[str, Any]):
    """Append a timestamped record of an operation to OPERATION_HISTORY.

    Args:
        action: Short identifier of the operation (e.g. "read_file").
        details: Arbitrary data describing the operation; stored as given.
    """
    entry = {
        "timestamp": datetime.now().isoformat(),
        "action": action,
        "details": details,
    }
    OPERATION_HISTORY.append(entry)


# ==================== File Operation Tools ====================


@mcp.tool()
async def read_file(
    file_path: str, start_line: int = None, end_line: int = None
) -> str:
    """
    Read file content, supports specifying line number range

    Args:
        file_path: File path, relative to workspace
        start_line: Starting line number (1-based, optional); values below 1
            are treated as the first line
        end_line: Ending line number (1-based, inclusive, optional); omitted or
            non-positive values mean "through the end of the file"

    Returns:
        JSON string of file content or error message
    """
    try:
        full_path = validate_path(file_path)

        if not full_path.exists():
            result = {"status": "error", "message": f"File does not exist: {file_path}"}
            log_operation(
                "read_file_error", {"file_path": file_path, "error": "file_not_found"}
            )
            return json.dumps(result, ensure_ascii=False, indent=2)

        with open(full_path, "r", encoding="utf-8") as f:
            lines = f.readlines()

        # Handle the line number range
        if start_line is not None or end_line is not None:
            # Clamp out-of-contract values: without this, a negative number
            # would fall through to Python's negative slicing and silently
            # return lines counted from the END of the file.
            start_idx = max(start_line - 1, 0) if start_line else 0
            end_idx = end_line if end_line and end_line > 0 else len(lines)
            lines = lines[start_idx:end_idx]

        content = "".join(lines)

        result = {
            "status": "success",
            "content": content,
            "file_path": file_path,
            # Number of lines actually returned (after any range was applied).
            "total_lines": len(lines),
            "size_bytes": len(content.encode("utf-8")),
        }

        log_operation(
            "read_file",
            {
                "file_path": file_path,
                "start_line": start_line,
                "end_line": end_line,
                "lines_read": len(lines),
            },
        )

        return json.dumps(result, ensure_ascii=False, indent=2)

    except Exception as e:
        # Tool boundary: every failure is reported as an error payload.
        result = {
            "status": "error",
            "message": f"Failed to read file: {str(e)}",
            "file_path": file_path,
        }
        log_operation("read_file_error", {"file_path": file_path, "error": str(e)})
        return json.dumps(result, ensure_ascii=False, indent=2)


def _read_multi_error_payload(message: str, **extra: Any) -> str:
    """Serialize a batch-level error response for read_multiple_files."""
    payload = {
        "status": "error",
        "message": message,
        "operation_type": "multi_file",
        "timestamp": datetime.now().isoformat(),
    }
    payload.update(extra)
    return json.dumps(payload, ensure_ascii=False, indent=2)


@mcp.tool()
async def read_multiple_files(file_requests: str, max_files: int = 5) -> str:
    """
    Read multiple files in a single operation (for batch reading)

    Args:
        file_requests: JSON string with file requests, e.g.,
                      '{"file1.py": {}, "file2.py": {"start_line": 1, "end_line": 10}}'
                      or simple array: '["file1.py", "file2.py"]'
        max_files: Maximum number of files to read in one operation (default: 5)

    Returns:
        JSON string of operation results for all files
    """
    try:
        # Parse the file requests
        try:
            requests_data = json.loads(file_requests)
        except json.JSONDecodeError as e:
            return _read_multi_error_payload(
                f"Invalid JSON format for file_requests: {str(e)}"
            )

        # Normalize requests format
        if isinstance(requests_data, list):
            # Convert simple array to dict format
            normalized_requests = {file_path: {} for file_path in requests_data}
        elif isinstance(requests_data, dict):
            normalized_requests = requests_data
        else:
            return _read_multi_error_payload(
                "file_requests must be a JSON object or array"
            )

        # Validate input
        if len(normalized_requests) == 0:
            return _read_multi_error_payload("No files provided for reading")

        if len(normalized_requests) > max_files:
            return _read_multi_error_payload(
                f"Too many files provided ({len(normalized_requests)}), maximum is {max_files}"
            )

        # Aggregate response; per-file entries are filled in below.
        results = {
            "status": "success",
            "message": f"Successfully processed {len(normalized_requests)} files",
            "operation_type": "multi_file",
            "timestamp": datetime.now().isoformat(),
            "files_processed": len(normalized_requests),
            "files": {},
            "summary": {
                "successful": 0,
                "failed": 0,
                "total_size_bytes": 0,
                "total_lines": 0,
                "files_not_found": 0,
            },
        }

        # Process each file individually
        for file_path, options in normalized_requests.items():
            # Bound before the try block so the error handler can always
            # report them, even when `options` itself is malformed. (Calling
            # options.get() inside the handler would raise again and abort
            # the entire batch.)
            start_line = None
            end_line = None
            try:
                if options is None:
                    # `{"file.py": null}` means "no options".
                    options = {}
                elif not isinstance(options, dict):
                    raise TypeError(
                        f"options for {file_path} must be a JSON object, "
                        f"got {type(options).__name__}"
                    )
                start_line = options.get("start_line")
                end_line = options.get("end_line")

                full_path = validate_path(file_path)

                if not full_path.exists():
                    results["files"][file_path] = {
                        "status": "error",
                        "message": f"File does not exist: {file_path}",
                        "file_path": file_path,
                        "content": "",
                        "total_lines": 0,
                        "size_bytes": 0,
                        "start_line": start_line,
                        "end_line": end_line,
                    }
                    results["summary"]["failed"] += 1
                    results["summary"]["files_not_found"] += 1
                    continue

                with open(full_path, "r", encoding="utf-8") as f:
                    lines = f.readlines()

                # Handle line range
                original_line_count = len(lines)
                if start_line is not None or end_line is not None:
                    # Clamp out-of-contract values so negative numbers do not
                    # turn into Python negative slicing (lines counted from
                    # the end of the file).
                    start_idx = max(start_line - 1, 0) if start_line else 0
                    end_idx = (
                        end_line if end_line and end_line > 0 else len(lines)
                    )
                    lines = lines[start_idx:end_idx]

                content = "".join(lines)
                size_bytes = len(content.encode("utf-8"))
                lines_count = len(lines)

                # Record individual file result
                results["files"][file_path] = {
                    "status": "success",
                    "message": f"File read successfully: {file_path}",
                    "file_path": file_path,
                    "content": content,
                    "total_lines": lines_count,
                    "original_total_lines": original_line_count,
                    "size_bytes": size_bytes,
                    "start_line": start_line,
                    "end_line": end_line,
                    "line_range_applied": start_line is not None
                    or end_line is not None,
                }

                # Update summary
                results["summary"]["successful"] += 1
                results["summary"]["total_size_bytes"] += size_bytes
                results["summary"]["total_lines"] += lines_count

                # Log individual file operation
                log_operation(
                    "read_file_multi",
                    {
                        "file_path": file_path,
                        "start_line": start_line,
                        "end_line": end_line,
                        "lines_read": lines_count,
                        "size_bytes": size_bytes,
                        "batch_operation": True,
                    },
                )

            except Exception as file_error:
                # Record individual file error; the rest of the batch goes on.
                results["files"][file_path] = {
                    "status": "error",
                    "message": f"Failed to read file: {str(file_error)}",
                    "file_path": file_path,
                    "content": "",
                    "total_lines": 0,
                    "size_bytes": 0,
                    "start_line": start_line,
                    "end_line": end_line,
                }

                results["summary"]["failed"] += 1

                # Log individual file error
                log_operation(
                    "read_file_multi_error",
                    {
                        "file_path": file_path,
                        "error": str(file_error),
                        "batch_operation": True,
                    },
                )

        # Determine overall status
        if results["summary"]["failed"] > 0:
            if results["summary"]["successful"] > 0:
                results["status"] = "partial_success"
                results["message"] = (
                    f"Read {results['summary']['successful']} files successfully, {results['summary']['failed']} failed"
                )
            else:
                results["status"] = "failed"
                results["message"] = (
                    f"All {results['summary']['failed']} files failed to read"
                )

        # Log overall operation
        log_operation(
            "read_multiple_files",
            {
                "files_count": len(normalized_requests),
                "successful": results["summary"]["successful"],
                "failed": results["summary"]["failed"],
                "total_size_bytes": results["summary"]["total_size_bytes"],
                "status": results["status"],
            },
        )

        return json.dumps(results, ensure_ascii=False, indent=2)

    except Exception as e:
        # Tool boundary: anything unexpected becomes a batch-level error.
        result = _read_multi_error_payload(
            f"Failed to read multiple files: {str(e)}", files_processed=0
        )
        log_operation("read_multiple_files_error", {"error": str(e)})
        return result


@mcp.tool()
async def write_file(
    file_path: str, content: str, create_dirs: bool = True, create_backup: bool = False
) -> str:
    """
    Store text in a single file, replacing whatever the file held before.

    Args:
        file_path: File path, relative to workspace
        content: Text to write; the file is encoded as UTF-8
        create_dirs: When true, missing parent directories are created first
        create_backup: When true and the file already exists, it is copied to
            a sibling whose suffix has ".backup" appended before the overwrite

    Returns:
        JSON string of operation result. On success it carries the byte size,
        the line count and whether a backup was made; on any failure it
        carries "status": "error" together with the exception text.
    """
    try:
        target = validate_path(file_path)

        if create_dirs:
            target.parent.mkdir(parents=True, exist_ok=True)

        # Keep the previous version only when the caller asked for it
        backup_created = False
        if target.exists() and create_backup:
            shutil.copy2(target, target.with_suffix(target.suffix + ".backup"))
            backup_created = True

        with open(target, "w", encoding="utf-8") as handle:
            handle.write(content)

        # Metrics describe the in-memory text; compute them once and reuse
        modified_at = datetime.now().isoformat()
        byte_count = len(content.encode("utf-8"))
        line_count = len(content.split("\n"))

        # Remember the latest state of this file, keyed by the path as given
        CURRENT_FILES[file_path] = {
            "last_modified": modified_at,
            "size_bytes": byte_count,
            "lines": line_count,
        }

        response = {
            "status": "success",
            "message": f"File written successfully: {file_path}",
            "file_path": file_path,
            "size_bytes": byte_count,
            "lines_written": line_count,
            "backup_created": backup_created,
        }

        log_operation(
            "write_file",
            {
                "file_path": file_path,
                "size_bytes": byte_count,
                "lines": line_count,
                "backup_created": backup_created,
            },
        )

        return json.dumps(response, ensure_ascii=False, indent=2)

    except Exception as e:
        failure = {
            "status": "error",
            "message": f"Failed to write file: {str(e)}",
            "file_path": file_path,
        }
        log_operation("write_file_error", {"file_path": file_path, "error": str(e)})
        return json.dumps(failure, ensure_ascii=False, indent=2)


@mcp.tool()
async def write_multiple_files(
    file_implementations: str,
    create_dirs: bool = True,
    create_backup: bool = False,
    max_files: int = 5,
) -> str:
    """
    Write multiple files in a single operation (for batch implementation)

    Every file is processed independently: a failure on one file is recorded
    in that file's entry and does not stop the remaining files.

    Args:
        file_implementations: JSON string mapping file paths to content, e.g.,
                            '{"file1.py": "content1", "file2.py": "content2"}'.
                            Every content value must be a JSON string.
        create_dirs: Whether to create directories if they don't exist
        create_backup: Whether to create backup files if they already exist
        max_files: Maximum number of files to write in one operation (default: 5)

    Returns:
        JSON string of operation results for all files. The overall "status"
        is "success", "partial_success" or "failed" depending on how many
        files were written. "error" is returned when the request itself is
        rejected (invalid JSON, not an object, empty, or more than max_files
        entries) or when an unexpected exception occurs.
    """

    def _reject(message: str) -> str:
        """Build the JSON payload for a request refused before any write."""
        return json.dumps(
            {
                "status": "error",
                "message": message,
                "operation_type": "multi_file",
                "timestamp": datetime.now().isoformat(),
            },
            ensure_ascii=False,
            indent=2,
        )

    try:
        # Parse the file implementations
        try:
            files_dict = json.loads(file_implementations)
        except json.JSONDecodeError as e:
            return _reject(f"Invalid JSON format for file_implementations: {str(e)}")

        # Validate input
        if not isinstance(files_dict, dict):
            return _reject(
                "file_implementations must be a JSON object mapping file paths to content"
            )

        if len(files_dict) == 0:
            return _reject("No files provided for writing")

        if len(files_dict) > max_files:
            return _reject(
                f"Too many files provided ({len(files_dict)}), maximum is {max_files}"
            )

        results = {
            "status": "success",
            "message": f"Successfully processed {len(files_dict)} files",
            "operation_type": "multi_file",
            "timestamp": datetime.now().isoformat(),
            "files_processed": len(files_dict),
            "files": {},
            "summary": {
                "successful": 0,
                "failed": 0,
                "total_size_bytes": 0,
                "total_lines": 0,
                "backups_created": 0,
            },
        }

        # Process each file individually
        for file_path, content in files_dict.items():
            try:
                # JSON values can be numbers, lists, objects or null. Reject
                # them before touching the disk: opening the target in "w"
                # mode truncates it, so failing later inside write() would
                # leave an existing file emptied.
                if not isinstance(content, str):
                    raise TypeError(
                        f"content must be a string, got {type(content).__name__}"
                    )

                full_path = validate_path(file_path)

                # Create directories (if needed)
                if create_dirs:
                    full_path.parent.mkdir(parents=True, exist_ok=True)

                # Backup existing file (only when explicitly requested)
                backup_created = False
                if full_path.exists() and create_backup:
                    backup_path = full_path.with_suffix(full_path.suffix + ".backup")
                    shutil.copy2(full_path, backup_path)
                    backup_created = True
                    results["summary"]["backups_created"] += 1

                # Write file
                with open(full_path, "w", encoding="utf-8") as f:
                    f.write(content)

                # Calculate file metrics
                size_bytes = len(content.encode("utf-8"))
                lines_count = len(content.split("\n"))

                # Update current file record
                CURRENT_FILES[file_path] = {
                    "last_modified": datetime.now().isoformat(),
                    "size_bytes": size_bytes,
                    "lines": lines_count,
                }

                # Record individual file result
                results["files"][file_path] = {
                    "status": "success",
                    "message": f"File written successfully: {file_path}",
                    "size_bytes": size_bytes,
                    "lines_written": lines_count,
                    "backup_created": backup_created,
                }

                # Update summary
                results["summary"]["successful"] += 1
                results["summary"]["total_size_bytes"] += size_bytes
                results["summary"]["total_lines"] += lines_count

                # Log individual file operation
                log_operation(
                    "write_file_multi",
                    {
                        "file_path": file_path,
                        "size_bytes": size_bytes,
                        "lines": lines_count,
                        "backup_created": backup_created,
                        "batch_operation": True,
                    },
                )

            except Exception as file_error:
                # Record individual file error and carry on with the next file
                results["files"][file_path] = {
                    "status": "error",
                    "message": f"Failed to write file: {str(file_error)}",
                    "size_bytes": 0,
                    "lines_written": 0,
                    "backup_created": False,
                }

                results["summary"]["failed"] += 1

                # Log individual file error
                log_operation(
                    "write_file_multi_error",
                    {
                        "file_path": file_path,
                        "error": str(file_error),
                        "batch_operation": True,
                    },
                )

        # Determine overall status
        if results["summary"]["failed"] > 0:
            if results["summary"]["successful"] > 0:
                results["status"] = "partial_success"
                results["message"] = (
                    f"Processed {results['summary']['successful']} files successfully, {results['summary']['failed']} failed"
                )
            else:
                results["status"] = "failed"
                results["message"] = (
                    f"All {results['summary']['failed']} files failed to write"
                )

        # Log overall operation
        log_operation(
            "write_multiple_files",
            {
                "files_count": len(files_dict),
                "successful": results["summary"]["successful"],
                "failed": results["summary"]["failed"],
                "total_size_bytes": results["summary"]["total_size_bytes"],
                "status": results["status"],
            },
        )

        return json.dumps(results, ensure_ascii=False, indent=2)

    except Exception as e:
        result = {
            "status": "error",
            "message": f"Failed to write multiple files: {str(e)}",
            "operation_type": "multi_file",
            "timestamp": datetime.now().isoformat(),
            "files_processed": 0,
        }
        log_operation("write_multiple_files_error", {"error": str(e)})
        return json.dumps(result, ensure_ascii=False, indent=2)


# ==================== Code Execution Tools ====================


@mcp.tool()
async def execute_python(code: str, timeout: int = 30) -> str:
    """
    Run a Python snippet in a separate interpreter process and capture its output.

    The snippet is saved to a temporary ".py" file, executed with the current
    interpreter (sys.executable) using the workspace as working directory,
    and the temporary file is removed afterwards.

    Args:
        code: Python code to execute
        timeout: Timeout in seconds

    Returns:
        JSON string of execution result (status, return code, stdout, stderr)
    """
    try:
        # delete=False keeps the script on disk after the handle is closed,
        # so the child interpreter can open it
        with tempfile.NamedTemporaryFile(
            mode="w", suffix=".py", delete=False, encoding="utf-8"
        ) as script:
            script.write(code)
            script_path = script.name

        try:
            # The child process runs inside the workspace, so it must exist
            ensure_workspace_exists()

            completed = subprocess.run(
                [sys.executable, script_path],
                cwd=WORKSPACE_DIR,
                capture_output=True,
                text=True,
                timeout=timeout,
                encoding="utf-8",
            )

            succeeded = completed.returncode == 0
            payload = {
                "status": "success" if succeeded else "error",
                "return_code": completed.returncode,
                "stdout": completed.stdout,
                "stderr": completed.stderr,
                "timeout": timeout,
                "message": (
                    "Python code execution successful"
                    if succeeded
                    else "Python code execution failed"
                ),
            }

            log_operation(
                "execute_python",
                {
                    "return_code": completed.returncode,
                    "stdout_length": len(completed.stdout),
                    "stderr_length": len(completed.stderr),
                },
            )

            return json.dumps(payload, ensure_ascii=False, indent=2)

        finally:
            # Remove the temporary script whether or not the run succeeded
            os.unlink(script_path)

    except subprocess.TimeoutExpired:
        log_operation("execute_python_timeout", {"timeout": timeout})
        return json.dumps(
            {
                "status": "error",
                "message": f"Python code execution timeout ({timeout}秒)",
                "timeout": timeout,
            },
            ensure_ascii=False,
            indent=2,
        )

    except Exception as e:
        log_operation("execute_python_error", {"error": str(e)})
        return json.dumps(
            {
                "status": "error",
                "message": f"Python code execution failed: {str(e)}",
            },
            ensure_ascii=False,
            indent=2,
        )


@mcp.tool()
async def execute_bash(command: str, timeout: int = 30) -> str:
    """
    Run a shell command from the workspace directory and report its outcome.

    The command is refused, without being run, when its lower-cased text
    contains any entry of a small deny-list of destructive fragments.

    Args:
        command: Bash command to execute
        timeout: Timeout in seconds

    Returns:
        JSON string of execution result (status, return code, stdout, stderr)
    """
    try:
        # Safety check: refuse commands that contain a known-dangerous fragment
        blocked_fragments = ("rm -rf", "sudo", "chmod 777", "mkfs", "dd if=")
        lowered = command.lower()
        is_blocked = any(fragment in lowered for fragment in blocked_fragments)
        if is_blocked:
            refusal = {
                "status": "error",
                "message": f"Dangerous command execution prohibited: {command}",
            }
            log_operation(
                "execute_bash_blocked",
                {"command": command, "reason": "dangerous_command"},
            )
            return json.dumps(refusal, ensure_ascii=False, indent=2)

        # The command runs inside the workspace, so it must exist
        ensure_workspace_exists()

        completed = subprocess.run(
            command,
            shell=True,
            cwd=WORKSPACE_DIR,
            capture_output=True,
            text=True,
            timeout=timeout,
            encoding="utf-8",
        )

        succeeded = completed.returncode == 0
        payload = {
            "status": "success" if succeeded else "error",
            "return_code": completed.returncode,
            "stdout": completed.stdout,
            "stderr": completed.stderr,
            "command": command,
            "timeout": timeout,
            "message": (
                "Bash command execution successful"
                if succeeded
                else "Bash command execution failed"
            ),
        }

        log_operation(
            "execute_bash",
            {
                "command": command,
                "return_code": completed.returncode,
                "stdout_length": len(completed.stdout),
                "stderr_length": len(completed.stderr),
            },
        )

        return json.dumps(payload, ensure_ascii=False, indent=2)

    except subprocess.TimeoutExpired:
        log_operation("execute_bash_timeout", {"command": command, "timeout": timeout})
        return json.dumps(
            {
                "status": "error",
                "message": f"Bash command execution timeout ({timeout} seconds)",
                "command": command,
                "timeout": timeout,
            },
            ensure_ascii=False,
            indent=2,
        )

    except Exception as e:
        log_operation("execute_bash_error", {"command": command, "error": str(e)})
        return json.dumps(
            {
                "status": "error",
                "message": f"Failed to execute bash command: {str(e)}",
                "command": command,
            },
            ensure_ascii=False,
            indent=2,
        )


@mcp.tool()
async def read_code_mem(file_paths: List[str]) -> str:
    """
    Look up recorded implementation summaries for several files at once.

    Summaries are read from implement_code_summary.md, which is looked for in
    the parent directory of the workspace. Duplicate paths in the request are
    collapsed, keeping first-seen order.

    Args:
        file_paths: List of file paths to check for summary information in implement_code_summary.md

    Returns:
        JSON string with one entry per requested file plus an overall status
        ("all_summaries_found", "partial_summaries_found",
        "no_summaries_found", "no_summary" when the summary file is missing
        or empty, or "error")
    """

    def _to_json(payload: dict) -> str:
        """Serialize a response the same way every branch does."""
        return json.dumps(payload, ensure_ascii=False, indent=2)

    try:
        if not file_paths or not isinstance(file_paths, list):
            log_operation(
                "read_code_mem_error", {"error": "missing_or_invalid_file_paths"}
            )
            return _to_json(
                {
                    "status": "error",
                    "message": "file_paths parameter is required and must be a list",
                }
            )

        # dict preserves insertion order, so this de-duplicates without reordering
        requested = list(dict.fromkeys(file_paths))

        ensure_workspace_exists()

        summary_file = Path(WORKSPACE_DIR).parent / "implement_code_summary.md"

        def _no_summary(message: str, log_status: str) -> str:
            """Log and build the response used when there is nothing to search."""
            log_operation(
                "read_code_mem",
                {"file_paths": requested, "status": log_status},
            )
            return _to_json(
                {
                    "status": "no_summary",
                    "file_paths": requested,
                    "message": message,
                    "results": [],
                }
            )

        if not summary_file.exists():
            return _no_summary("No summary file found.", "no_summary_file")

        with open(summary_file, "r", encoding="utf-8") as handle:
            summary_text = handle.read()

        if not summary_text.strip():
            return _no_summary("Summary file is empty.", "empty_summary")

        # Look up every requested path and record a per-file outcome
        per_file = []
        for path in requested:
            section = _extract_file_section_from_summary(summary_text, path)
            if section:
                entry = {
                    "file_path": path,
                    "status": "summary_found",
                    "summary_content": section,
                    "message": f"Summary information found for {path}",
                }
            else:
                entry = {
                    "file_path": path,
                    "status": "no_summary",
                    "summary_content": None,
                    "message": f"No summary found for {path}",
                }
            per_file.append(entry)

        total = len(requested)
        found = sum(1 for entry in per_file if entry["status"] == "summary_found")

        if found == total:
            overall = "all_summaries_found"
        elif found > 0:
            overall = "partial_summaries_found"
        else:
            overall = "no_summaries_found"

        response = {
            "status": overall,
            "file_paths": requested,
            "total_requested": total,
            "summaries_found": found,
            "message": f"Found summaries for {found}/{total} files",
            "results": per_file,
        }

        log_operation(
            "read_code_mem",
            {
                "file_paths": requested,
                "status": overall,
                "total_requested": total,
                "summaries_found": found,
            },
        )

        return _to_json(response)

    except Exception as e:
        # Echo the request back as a list even if it arrived in another shape
        echoed_paths = file_paths if isinstance(file_paths, list) else [str(file_paths)]
        failure = {
            "status": "error",
            "message": f"Failed to check code memory: {str(e)}",
            "file_paths": echoed_paths,
            "results": [],
        }
        log_operation(
            "read_code_mem_error", {"file_paths": file_paths, "error": str(e)}
        )
        return _to_json(failure)


def _extract_file_section_from_summary(
    summary_content: str, target_file_path: str
) -> str:
    """
    Find the summary section that belongs to one file.

    Sections are recognised by a header of the form
    "## IMPLEMENTATION File <path>; ROUND <n>" framed by two lines of 80 "="
    characters. The first section whose path matches the target is returned.
    If none matches, the simpler split-based extractor is tried instead.

    Args:
        summary_content: Full summary content
        target_file_path: Path of the target file

    Returns:
        The re-formatted section for the file, or None if not found
    """
    import re

    wanted = _normalize_file_path(target_file_path)

    # Header between two 80-char rules, then the body up to the next rule or end of text
    section_regex = re.compile(
        r"={80}\s*\n## IMPLEMENTATION File ([^;]+); ROUND \d+\s*\n={80}(.*?)(?=\n={80}|\Z)",
        re.DOTALL,
    )

    for found in section_regex.finditer(summary_content):
        recorded_path = found.group(1).strip()
        recorded_normalized = _normalize_file_path(recorded_path)

        if not _paths_match(
            wanted, recorded_normalized, target_file_path, recorded_path
        ):
            continue

        body = found.group(2).strip()
        # The round number is not carried over; the header shows a placeholder
        return f"""================================================================================
## IMPLEMENTATION File {recorded_path}; ROUND [X]
================================================================================

{body}

---
*Extracted from implement_code_summary.md*"""

    # Nothing matched via the section regex: fall back to the split-based parser
    return _extract_file_section_alternative(summary_content, target_file_path)


def _normalize_file_path(file_path: str) -> str:
    """
    Normalize a file path so that differently written paths compare equal.

    The path is converted to forward slashes, stripped of leading and
    trailing slashes, lower-cased, and has at most one well-known leading
    directory ("src/", "./src/", "./", "core/", "lib/" or "main/") removed.

    Args:
        file_path: Path as written by the caller or found in the summary

    Returns:
        The normalized path, e.g. "\\src\\Foo.py" -> "foo.py"
    """
    # Unify separators first. Stripping "/" before this conversion would leave
    # Windows-style leading or trailing backslashes in place, which then turn
    # into stray slashes and stop the prefix removal below from matching.
    normalized = file_path.replace("\\", "/").strip("/").lower()

    # Remove the first matching common prefix to make matching more flexible
    common_prefixes = ("src/", "./src/", "./", "core/", "lib/", "main/")
    for prefix in common_prefixes:
        if normalized.startswith(prefix):
            normalized = normalized[len(prefix) :]
            break

    return normalized


def _paths_match(
    normalized_target: str,
    normalized_summary: str,
    original_target: str,
    original_summary: str,
) -> bool:
    """
    Decide whether two file paths refer to the same file, using several
    progressively looser strategies.

    Partial-path strategies compare whole path components only, so
    "utils.py" does not match "data_utils.py" merely because one name ends
    with the other.

    Args:
        normalized_target: Requested path after normalization
        normalized_summary: Path from the summary after normalization
        original_target: Requested path as given by the caller
        original_summary: Path exactly as written in the summary

    Returns:
        True if any strategy considers the paths equal, otherwise False
    """
    # An empty path identifies no file. Without this guard the suffix test
    # below would accept every candidate, since any string ends with "".
    if not normalized_target or not normalized_summary:
        return False

    # Strategy 1: Exact normalized match
    if normalized_target == normalized_summary:
        return True

    # Strategy 2: Basename match (filename only); very short names are
    # skipped because they are too likely to collide
    target_basename = os.path.basename(original_target)
    summary_basename = os.path.basename(original_summary)
    if target_basename == summary_basename and len(target_basename) > 4:
        return True

    # Strategy 3: Equal once further common prefixes are removed
    target_suffix = _remove_common_prefixes(normalized_target)
    summary_suffix = _remove_common_prefixes(normalized_summary)
    if target_suffix == summary_suffix:
        return True

    # Strategy 4: One path is a trailing sub-path of the other. The leading
    # "/" pins the match to a component boundary.
    if normalized_target.endswith(
        "/" + normalized_summary
    ) or normalized_summary.endswith("/" + normalized_target):
        return True

    # Strategy 5: For longer paths, one appears inside the other as a run of
    # whole components. Padding both sides with "/" enforces the boundaries.
    padded_target = f"/{normalized_target}/"
    padded_summary = f"/{normalized_summary}/"
    if len(normalized_target) > 10 and padded_target in padded_summary:
        return True
    if len(normalized_summary) > 10 and padded_summary in padded_target:
        return True

    return False


def _remove_common_prefixes(file_path: str) -> str:
    """
    Remove common leading directory names from a file path.

    Each prefix is tested once, in list order, against whatever is left after
    the earlier removals, so several prefixes can be dropped in one call
    (e.g. "src/core/x.py" -> "x.py").
    """
    prefixes_to_remove = ["src/", "core/", "./", "lib/", "main/"]
    path = file_path

    for prefix in prefixes_to_remove:
        if path.startswith(prefix):
            path = path[len(prefix) :]

    return path


def _extract_file_section_alternative(
    summary_content: str, target_file_path: str
) -> str:
    """
    Fallback extractor that locates a file's summary by plain string splitting.

    The summary is cut at every run of 80 "=" characters. A piece holding an
    "## IMPLEMENTATION File" header is treated as a heading and the piece
    right after it as that heading's body.

    Args:
        summary_content: Full summary content
        target_file_path: Path of the target file

    Returns:
        The re-formatted section for the first matching header, or None if
        no header matches
    """
    header_marker = "## IMPLEMENTATION File"
    wanted_basename = os.path.basename(target_file_path)

    pieces = summary_content.split("=" * 80)

    for index, piece in enumerate(pieces):
        if header_marker not in piece:
            continue

        for header_line in piece.strip().split("\n"):
            if header_marker not in header_line:
                continue

            try:
                # The path sits between "File " and "; ROUND" in the header
                recorded_path = (
                    header_line.split("File ")[1].partition("; ROUND")[0].strip()
                )

                is_same_file = (
                    _normalize_file_path(target_file_path)
                    == _normalize_file_path(recorded_path)
                    or wanted_basename == os.path.basename(recorded_path)
                    or target_file_path in recorded_path
                    or recorded_path.endswith(target_file_path)
                )
                if not is_same_file:
                    continue

                # The body is the piece following the header; a header that
                # is the last piece has no body and is skipped
                if index + 1 >= len(pieces):
                    continue

                body = pieces[index + 1].strip()
                return f"""================================================================================
## IMPLEMENTATION File {recorded_path}
================================================================================

{body}

---
*Extracted from implement_code_summary.md using alternative method*"""
            except (IndexError, AttributeError):
                # Malformed header line: ignore it and keep scanning
                continue

    return None


# ==================== Code Search Tools ====================


@mcp.tool()
async def search_code(
    pattern: str,
    file_pattern: str = "*.json",
    use_regex: bool = False,
    search_directory: str = None,
) -> str:
    """
    Search for a pattern, line by line, in files under a directory tree.

    Args:
        pattern: Search pattern. With use_regex it is a regular expression
            applied to each line with a "search" (match anywhere) semantics;
            otherwise it is matched as a case-insensitive substring.
        file_pattern: File pattern (e.g., '*.py'), matched recursively below
            the search directory
        use_regex: Whether to use regular expressions
        search_directory: Specify search directory (optional, uses WORKSPACE_DIR
            if not specified). Absolute paths are used as given; relative
            paths are resolved against the current working directory.

    Returns:
        JSON string of search results. At most the first 50 matches are
        listed, while "total_matches" counts all of them. Files that cannot
        be read are skipped with a warning. An invalid regular expression, a
        missing search directory or an unexpected failure yields
        "status": "error".
    """
    try:
        import glob
        import re

        # Compile the expression once, before any file is touched. Compiling
        # per line inside the per-file error handler would turn an invalid
        # expression into one warning per file and a misleading "success"
        # with zero matches.
        compiled_pattern = None
        if use_regex:
            try:
                compiled_pattern = re.compile(pattern)
            except re.error as regex_error:
                result = {
                    "status": "error",
                    "message": f"Invalid regular expression: {regex_error}",
                    "pattern": pattern,
                }
                log_operation(
                    "search_code_error",
                    {"pattern": pattern, "error": str(regex_error)},
                )
                return json.dumps(result, ensure_ascii=False, indent=2)

        # Lower-case the needle once for the case-insensitive substring mode
        needle = None if use_regex else pattern.lower()
        match_type = "regex" if use_regex else "substring"

        # Determine search directory
        if search_directory:
            # If search directory is specified, use the specified directory
            if os.path.isabs(search_directory):
                search_path = Path(search_directory)
            else:
                # Relative path, relative to current working directory
                search_path = Path.cwd() / search_directory
        else:
            # No search directory given: fall back to the default WORKSPACE_DIR
            ensure_workspace_exists()
            search_path = WORKSPACE_DIR

        # Check that the search directory exists
        if not search_path.exists():
            result = {
                "status": "error",
                "message": f"Search directory不存在: {search_path}",
                "pattern": pattern,
            }
            return json.dumps(result, ensure_ascii=False, indent=2)

        # Get matching files
        file_paths = glob.glob(str(search_path / "**" / file_pattern), recursive=True)

        matches = []
        total_files_searched = 0

        for file_path in file_paths:
            try:
                # Read the whole file first so that a decoding error cannot
                # leave matches from a half-read file in the results
                with open(file_path, "r", encoding="utf-8") as f:
                    lines = f.readlines()

                total_files_searched += 1
                relative_path = os.path.relpath(file_path, search_path)

                for line_num, line in enumerate(lines, 1):
                    if compiled_pattern is not None:
                        is_hit = compiled_pattern.search(line) is not None
                    else:
                        is_hit = needle in line.lower()

                    if is_hit:
                        matches.append(
                            {
                                "file": relative_path,
                                "line_number": line_num,
                                "line_content": line.strip(),
                                "match_type": match_type,
                            }
                        )

            except Exception as e:
                # Unreadable entries (binary files, directories, permission
                # problems) are skipped rather than failing the whole search
                logger.warning(f"Error searching file {file_path}: {e}")
                continue

        result = {
            "status": "success",
            "pattern": pattern,
            "file_pattern": file_pattern,
            "use_regex": use_regex,
            "search_directory": str(search_path),
            "total_matches": len(matches),
            "total_files_searched": total_files_searched,
            "matches": matches[:50],  # Return only the first 50 matches
        }

        if len(matches) > 50:
            result["note"] = f"显示前50个匹配，总共找到{len(matches)}个匹配"

        log_operation(
            "search_code",
            {
                "pattern": pattern,
                "file_pattern": file_pattern,
                "use_regex": use_regex,
                "search_directory": str(search_path),
                "total_matches": len(matches),
                "files_searched": total_files_searched,
            },
        )

        return json.dumps(result, ensure_ascii=False, indent=2)

    except Exception as e:
        result = {
            "status": "error",
            "message": f"Code search failed: {str(e)}",
            "pattern": pattern,
        }
        log_operation("search_code_error", {"pattern": pattern, "error": str(e)})
        return json.dumps(result, ensure_ascii=False, indent=2)


# ==================== File Structure Tools ====================


@mcp.tool()
async def get_file_structure(directory: str = ".", max_depth: int = 5) -> str:
    """
    Report the file tree below a workspace directory

    Args:
        directory: Directory path, relative to workspace ("." selects the workspace root)
        max_depth: Maximum traversal depth; a directory reached at this depth
            is reported as truncated instead of being listed

    Returns:
        JSON string of file structure
    """
    try:
        ensure_workspace_exists()

        target_dir = WORKSPACE_DIR if directory == "." else validate_path(directory)

        if not target_dir.exists():
            missing = {
                "status": "error",
                "message": f"Directory does not exist: {directory}",
            }
            return json.dumps(missing, ensure_ascii=False, indent=2)

        def scan_directory(path: Path, current_depth: int = 0) -> Dict[str, Any]:
            """Describe ``path`` and, depth permitting, everything beneath it"""
            node: Dict[str, Any] = {"type": "directory", "name": path.name}
            if current_depth >= max_depth:
                node["truncated"] = True
                return node

            children = []
            try:
                for entry in sorted(path.iterdir()):
                    entry_path = os.path.relpath(entry, WORKSPACE_DIR)

                    if entry.is_file():
                        children.append(
                            {
                                "type": "file",
                                "name": entry.name,
                                "path": entry_path,
                                "size_bytes": entry.stat().st_size,
                                "extension": entry.suffix,
                            }
                        )
                        continue

                    # Hidden directories, and entries that are neither a file
                    # nor a directory, are left out of the listing
                    if not entry.is_dir() or entry.name.startswith("."):
                        continue

                    subtree = scan_directory(entry, current_depth + 1)
                    subtree["path"] = entry_path
                    children.append(subtree)
            except PermissionError:
                # Unreadable directory: keep whatever was collected so far
                pass

            node["items"] = children
            node["item_count"] = len(children)
            return node

        structure = scan_directory(target_dir)

        # Summary statistics
        def count_items(node):
            """Return (files, directories) found in ``node``, the node itself included"""
            if node["type"] == "file":
                return 1, 0
            files, dirs = 0, 1
            for child in node.get("items", []):
                child_files, child_dirs = count_items(child)
                files += child_files
                dirs += child_dirs
            return files, dirs

        total_files, dirs_with_root = count_items(structure)
        total_directories = dirs_with_root - 1  # Exclude root directory

        result = {
            "status": "success",
            "directory": directory,
            "max_depth": max_depth,
            "structure": structure,
            "summary": {
                "total_files": total_files,
                "total_directories": total_directories,
            },
        }

        log_operation(
            "get_file_structure",
            {
                "directory": directory,
                "max_depth": max_depth,
                "total_files": total_files,
                "total_directories": total_directories,
            },
        )

        return json.dumps(result, ensure_ascii=False, indent=2)

    except Exception as e:
        failure = {
            "status": "error",
            "message": f"Failed to get file structure: {str(e)}",
            "directory": directory,
        }
        log_operation(
            "get_file_structure_error", {"directory": directory, "error": str(e)}
        )
        return json.dumps(failure, ensure_ascii=False, indent=2)


# ==================== Workspace Management Tools ====================


@mcp.tool()
async def set_workspace(workspace_path: str) -> str:
    """
    Point the server at a new workspace directory

    Called by workflow to set workspace to: {plan_file_parent}/generate_code
    so that subsequent file operations resolve against that project directory.
    The directory is created when it does not exist yet.

    Args:
        workspace_path: Workspace path (Usually {plan_file_parent}/generate_code)

    Returns:
        JSON string of operation result
    """
    global WORKSPACE_DIR
    try:
        resolved = Path(workspace_path).resolve()

        # Make sure the directory exists before switching to it
        resolved.mkdir(parents=True, exist_ok=True)

        previous, WORKSPACE_DIR = WORKSPACE_DIR, resolved

        logger.info(f"New Workspace: {WORKSPACE_DIR}")

        outcome = {
            "status": "success",
            "message": f"Workspace setup successful: {workspace_path}",
            "new_workspace": str(WORKSPACE_DIR),
        }

        log_operation(
            "set_workspace",
            {
                "old_workspace": str(previous) if previous else None,
                "new_workspace": str(WORKSPACE_DIR),
                "workspace_alignment": "plan_file_parent/generate_code",
            },
        )

        return json.dumps(outcome, ensure_ascii=False, indent=2)

    except Exception as e:
        failure = {
            "status": "error",
            "message": f"Failed to set workspace: {str(e)}",
            "workspace_path": workspace_path,
        }
        log_operation(
            "set_workspace_error", {"workspace_path": workspace_path, "error": str(e)}
        )
        return json.dumps(failure, ensure_ascii=False, indent=2)


@mcp.tool()
async def get_operation_history(last_n: int = 10) -> str:
    """
    Return the most recent entries of the operation log

    Args:
        last_n: Return the last N operations; a value of 0 or less returns
            the complete history

    Returns:
        JSON string of operation history
    """
    try:
        if last_n > 0:
            recent_history = OPERATION_HISTORY[-last_n:]
        else:
            recent_history = OPERATION_HISTORY

        payload = {
            "status": "success",
            "total_operations": len(OPERATION_HISTORY),
            "returned_operations": len(recent_history),
            "workspace": str(WORKSPACE_DIR) if WORKSPACE_DIR else None,
            "history": recent_history,
        }
        return json.dumps(payload, ensure_ascii=False, indent=2)

    except Exception as e:
        failure = {
            "status": "error",
            "message": f"Failed to get operation history: {str(e)}",
        }
        return json.dumps(failure, ensure_ascii=False, indent=2)


# ==================== Server Initialization ====================


def main():
    """Print the startup banner, initialize the default workspace and run the MCP server"""
    # One entry per printed line; empty strings produce blank lines.
    # read_file is not advertised here (its banner entry is disabled).
    banner = (
        "🚀 Code Implementation MCP Server",
        "📝 Paper Code Implementation Tool Server / Paper Code Implementation Tool Server",
        "",
        "Available tools / Available tools:",
        "  • read_code_mem       - Read code summary from implement_code_summary.md / Read code summary from implement_code_summary.md",
        "  • write_file          - Write file contents / Write file contents",
        "  • execute_python      - Execute Python code / Execute Python code",
        "  • execute_bash        - Execute bash command / Execute bash commands",
        "  • search_code         - Search code patterns / Search code patterns",
        "  • get_file_structure  - Get file structure / Get file structure",
        "  • set_workspace       - Set workspace / Set workspace",
        "  • get_operation_history - Get operation history / Get operation history",
        "",
        "🔧 Server starting...",
    )
    for banner_line in banner:
        print(banner_line)

    # Initialize default workspace
    initialize_workspace()

    # Start server
    mcp.run()


# Start the server only when this file is executed as a script, not on import
if __name__ == "__main__":
    main()


================================================
FILE: tools/code_indexer.py
================================================
"""
Code Indexer for Repository Analysis

Analyzes code repositories to build comprehensive indexes for each subdirectory,
identifying file relationships and reusable components for implementation.

Features:
- Recursive file traversal
- LLM-powered code similarity analysis using augmented LLM classes
- JSON-based relationship storage
- Configurable matching strategies
- Progress tracking and error handling
- Automatic LLM provider selection based on API key availability
"""

import asyncio
import json
import logging
import os
import re
from datetime import datetime
from pathlib import Path
from dataclasses import dataclass, asdict
from typing import List, Dict, Any

# MCP Agent imports for LLM
from utils.llm_utils import get_preferred_llm_class, get_default_models


@dataclass
class FileRelationship:
    """Represents a relationship between a repo file and target structure file

    Plain data record: the dataclass performs no validation of its fields.
    """

    repo_file_path: str  # Path of the file in the analyzed repository
    target_file_path: str  # Path of the related file in the target structure
    relationship_type: str  # 'direct_match', 'partial_match', 'reference', 'utility'
    confidence_score: float  # 0.0 to 1.0
    helpful_aspects: List[str]  # presumably short free-text notes -- confirm against the producer
    potential_contributions: List[str]  # presumably short free-text notes -- confirm against the producer
    usage_suggestions: str  # Free-text suggestion on how to use the repo file


@dataclass
class FileSummary:
    """Summary information for a repository file

    Plain data record: the dataclass performs no validation of its fields.
    """

    file_path: str  # Path of the summarized file
    file_type: str  # Free-text kind of file, e.g. "Python module"
    main_functions: List[str]  # Names of the main functions found in the file
    key_concepts: List[str]  # Key concepts the file deals with
    dependencies: List[str]  # Dependencies of the file, e.g. "numpy"
    summary: str  # Free-text description of what the file does
    lines_of_code: int  # Line count of the file
    last_modified: str  # Modification time as text -- exact format not fixed here, confirm with producer


@dataclass
class RepoIndex:
    """Complete index for a repository

    Aggregates the per-file summaries and file relationships of one repository.
    """

    repo_name: str  # Name of the indexed repository
    total_files: int  # Number of files -- presumably those analyzed; confirm with producer
    file_summaries: List[FileSummary]  # One summary per file
    relationships: List[FileRelationship]  # Relationships to the target structure
    analysis_metadata: Dict[str, Any]  # Free-form metadata about the analysis run


class CodeIndexer:
    """Main class for building code repository indexes"""

    def __init__(
        self,
        code_base_path: str = None,
        target_structure: str = None,
        output_dir: str = None,
        config_path: str = "mcp_agent.secrets.yaml",
        indexer_config_path: str = None,
        enable_pre_filtering: bool = True,
    ):
        """
        Build an indexer from explicit arguments plus the YAML configuration files.

        Explicit ``code_base_path`` / ``output_dir`` arguments take precedence
        over the ``paths`` section of the indexer config; every other setting
        is read from the indexer config with a built-in default.

        Args:
            code_base_path: Code base path (falls back to config, then "code_base")
            target_structure: Project-specific target structure; never read from config
            output_dir: Output directory (falls back to config, then "indexes");
                created if it does not exist
            config_path: Secrets YAML file; the main config file is looked up
                in the same directory
            indexer_config_path: Indexer settings YAML file
            enable_pre_filtering: Stored unchanged on the instance
        """
        # --- Configuration sources: must be loaded before anything reads them ---
        self.config_path = config_path
        self.indexer_config_path = indexer_config_path
        # The main config file lives next to the secrets file
        self.main_config_path = os.path.join(
            os.path.dirname(os.path.abspath(config_path)), "mcp_agent.config.yaml"
        )
        self.api_config = self._load_api_config()
        self.indexer_config = self._load_indexer_config()
        self.default_models = get_default_models(self.main_config_path)

        def section(name: str) -> Dict[str, Any]:
            """Fetch one top-level section of the indexer config"""
            return self.indexer_config.get(name, {})

        # --- Paths: explicit arguments win over the config file ---
        paths = section("paths")
        self.code_base_path = Path(
            code_base_path or paths.get("code_base_path", "code_base")
        )
        self.output_dir = Path(output_dir or paths.get("output_dir", "indexes"))
        self.target_structure = target_structure
        self.enable_pre_filtering = enable_pre_filtering

        # --- LLM client is created lazily on first use ---
        self.llm_client = None
        self.llm_client_type = None

        # The logger needs the indexer config, so it is set up only now
        self.logger = self._setup_logger()

        self.output_dir.mkdir(parents=True, exist_ok=True)

        # --- File analysis ---
        default_extensions = [
            ".py",
            ".js",
            ".ts",
            ".java",
            ".cpp",
            ".c",
            ".h",
            ".hpp",
            ".cs",
            ".php",
            ".rb",
            ".go",
            ".rs",
            ".scala",
            ".kt",
            ".swift",
            ".m",
            ".mm",
            ".r",
            ".matlab",
            ".sql",
            ".sh",
            ".bat",
            ".ps1",
            ".yaml",
            ".yml",
            ".json",
            ".xml",
            ".toml",
        ]
        default_skip_directories = [
            "__pycache__",
            "node_modules",
            "target",
            "build",
            "dist",
            "venv",
            "env",
        ]
        file_analysis = section("file_analysis")
        self.supported_extensions = set(
            file_analysis.get("supported_extensions", default_extensions)
        )
        self.skip_directories = set(
            file_analysis.get("skip_directories", default_skip_directories)
        )
        self.max_file_size = file_analysis.get("max_file_size", 1048576)  # 1MB
        self.max_content_length = file_analysis.get("max_content_length", 3000)

        # --- LLM ---
        llm = section("llm")
        self.model_provider = llm.get("model_provider", "anthropic")
        self.llm_max_tokens = llm.get("max_tokens", 4000)
        self.llm_temperature = llm.get("temperature", 0.3)
        self.llm_system_prompt = llm.get(
            "system_prompt",
            "You are a code analysis expert. Provide precise, structured analysis of code relationships and similarities.",
        )
        self.request_delay = llm.get("request_delay", 0.1)
        self.max_retries = llm.get("max_retries", 3)
        self.retry_delay = llm.get("retry_delay", 1.0)

        # --- Relationships ---
        relationships = section("relationships")
        self.min_confidence_score = relationships.get("min_confidence_score", 0.3)
        self.high_confidence_threshold = relationships.get(
            "high_confidence_threshold", 0.7
        )
        self.relationship_types = relationships.get(
            "relationship_types",
            {
                "direct_match": 1.0,
                "partial_match": 0.8,
                "reference": 0.6,
                "utility": 0.4,
            },
        )

        # --- Performance ---
        performance = section("performance")
        self.enable_concurrent_analysis = performance.get(
            "enable_concurrent_analysis", False
        )
        self.max_concurrent_files = performance.get("max_concurrent_files", 5)
        self.enable_content_caching = performance.get("enable_content_caching", False)
        self.max_cache_size = performance.get("max_cache_size", 100)

        # --- Debug ---
        debug = section("debug")
        self.save_raw_responses = debug.get("save_raw_responses", False)
        self.raw_responses_dir = debug.get("raw_responses_dir", "debug_responses")
        self.verbose_output = debug.get("verbose_output", False)
        self.mock_llm_responses = debug.get("mock_llm_responses", False)

        # --- Output ---
        output = section("output")
        self.generate_summary = output.get("generate_summary", True)
        self.generate_statistics = output.get("generate_statistics", True)
        self.include_metadata = output.get("include_metadata", True)
        self.index_filename_pattern = output.get(
            "index_filename_pattern", "{repo_name}_index.json"
        )
        self.summary_filename = output.get("summary_filename", "indexing_summary.json")
        self.stats_filename = output.get("stats_filename", "indexing_statistics.json")

        # The cache dict exists only when caching is switched on
        self.content_cache = {} if self.enable_content_caching else None

        # The debug directory is needed only when raw responses are saved
        if self.save_raw_responses:
            Path(self.raw_responses_dir).mkdir(parents=True, exist_ok=True)

        if self.verbose_output:
            for message in (
                f"Initialized CodeIndexer with config: {self.indexer_config_path}",
                f"Code base path: {self.code_base_path}",
                f"Output directory: {self.output_dir}",
                f"Model provider: {self.model_provider}",
                f"Concurrent analysis: {self.enable_concurrent_analysis}",
                f"Content caching: {self.enable_content_caching}",
                f"Mock LLM responses: {self.mock_llm_responses}",
            ):
                self.logger.info(message)

    def _setup_logger(self) -> logging.Logger:
        """Setup logging configuration from config file"""
        logger = logging.getLogger("CodeIndexer")

        # Get logging config
        logging_config = self.indexer_config.get("logging", {})
        log_level = logging_config.get("level", "INFO")
        log_format = logging_config.get(
            "log_format", "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
        )

        logger.setLevel(getattr(logging, log_level.upper(), logging.INFO))

        # Clear existing handlers
        logger.handlers.clear()

        # Console handler
        handler = logging.StreamHandler()
        formatter = logging.Formatter(log_format)
        handler.setFormatter(formatter)
        logger.addHandler(handler)

        # File handler if enabled
        if logging_config.get("log_to_file", False):
            log_file = logging_config.get("log_file", "indexer.log")
            file_handler = logging.FileHandler(log_file, encoding="utf-8")
            file_handler.setFormatter(formatter)
            logger.addHandler(file_handler)

        return logger

    def _load_api_config(self) -> Dict[str, Any]:
        """Load API configuration from YAML file"""
        try:
            import yaml

            with open(self.config_path, "r", encoding="utf-8") as f:
                return yaml.safe_load(f)
        except Exception as e:
            # Create a basic logger for this error since self.logger doesn't exist yet
            print(f"Warning: Failed to load API config from {self.config_path}: {e}")
            return {}

    def _load_indexer_config(self) -> Dict[str, Any]:
        """Load indexer configuration from YAML file"""
        try:
            import yaml

            with open(self.indexer_config_path, "r", encoding="utf-8") as f:
                config = yaml.safe_load(f)
                if config is None:
                    config = {}
                return config
        except Exception as e:
            print(
                f"Warning: Failed to load indexer config from {self.indexer_config_path}: {e}"
            )
            print("Using default configuration values")
            return {}

    async def _initialize_llm_client(self):
        """Initialize LLM client (Anthropic or OpenAI) based on API key availability"""
        if self.llm_client is not None:
            return self.llm_client, self.llm_client_type

        # Check if mock responses are enabled
        if self.mock_llm_responses:
            self.logger.info("Using mock LLM responses for testing")
            self.llm_client = "mock"
            self.llm_client_type = "mock"
            return "mock", "mock"

        # Check which API has available key and try that first
        anthropic_key = self.api_config.get("anthropic", {}).get("api_key", "")
        openai_key = self.api_config.get("openai", {}).get("api_key", "")

        # Try Anthropic API first if key is available
        if anthropic_key and anthropic_key.strip():
            try:
                from anthropic import AsyncAnthropic

                client = AsyncAnthropic(api_key=anthropic_key)
                # Test connection with default model from config
                await client.messages.create(
                    model=self.default_models["anthropic"],
                    max_tokens=10,
                    messages=[{"role": "user", "content": "test"}],
                )
                self.logger.info(
                    f"Using Anthropic API with model: {self.default_models['anthropic']}"
                )
                self.llm_client = client
                self.llm_client_type = "anthropic"
                return client, "anthropic"
            except Exception as e:
                self.logger.warning(f"Anthropic API unavailable: {e}")

        # Try OpenAI API if Anthropic failed or key not available
        if openai_key and openai_key.strip():
            try:
                from openai import AsyncOpenAI

                # Handle custom base_url if specified
                openai_config = self.api_config.get("openai", {})
                base_url = openai_config.get("base_url")

                if base_url:
                    client = AsyncOpenAI(api_key=openai_key, base_url=base_url)
                else:
                    client = AsyncOpenAI(api_key=openai_key)

                # Test connection with default model from config
                await client.chat.completions.create(
                    model=self.default_models["openai"],
                    max_tokens=10,
                    messages=[{"role": "user", "content": "test"}],
                )
                self.logger.info(
                    f"Using OpenAI API with model: {self.default_models['openai']}"
                )
                if base_url:
                    self.logger.info(f"Using custom base URL: {base_url}")
                self.llm_client = client
                self.llm_client_type = "openai"
                return client, "openai"
            except Exception as e:
                self.logger.warning(f"OpenAI API unavailable: {e}")

        raise ValueError(
            "No available LLM API - please check your API keys in configuration"
        )

    async def _call_llm(
        self, prompt: str, system_prompt: str = None, max_tokens: int = None
    ) -> str:
        """Call LLM for code analysis with retry mechanism and debugging support"""
        if system_prompt is None:
            system_prompt = self.llm_system_prompt
        if max_tokens is None:
            max_tokens = self.llm_max_tokens

        # Mock response for testing
        if self.mock_llm_responses:
            mock_response = self._generate_mock_response(prompt)
            if self.save_raw_responses:
                self._save_debug_response("mock", prompt, mock_response)
            return mock_response

        last_error = None

        # Retry mechanism
        for attempt in range(self.max_retries):
            try:
                if self.verbose_output and attempt > 0:
                    self.logger.info(
                        f"LLM call attempt {attempt + 1}/{self.max_retries}"
                    )

                client, client_type = await self._initialize_llm_client()

                if client_type == "anthropic":
                    response = await client.messages.create(
                        model=self.default_models["anthropic"],
                        system=system_prompt,
                        messages=[{"role": "user", "content": prompt}],
                        max_tokens=max_tokens,
                        temperature=self.llm_temperature,
                    )

                    content = ""
                    for block in response.content:
                        if block.type == "text":
                            content += block.text

                    # Save debug response if enabled
                    if self.save_raw_responses:
                        self._save_debug_response("anthropic", prompt, content)

                    return content

                elif client_type == "openai":
                    messages = [
                        {"role": "system", "content": system_prompt},
                        {"role": "user", "content": prompt},
                    ]

                    response = await client.chat.completions.create(
                        model=self.default_models["openai"],
                        messages=messages,
                        max_tokens=max_tokens,
                        temperature=self.llm_temperature,
                    )

                    content = response.choices[0].message.content or ""

                    # Save debug response if enabled
                    if self.save_raw_responses:
                        self._save_debug_response("openai", prompt, content)

                    return content
                else:
                    raise ValueError(f"Unsupported client type: {client_type}")

            except Exception as e:
                last_error = e
                self.logger.warning(f"LLM call attempt {attempt + 1} failed: {e}")

                if attempt < self.max_retries - 1:
                    await asyncio.sleep(
                        self.retry_delay * (attempt + 1)
                    )  # Exponential backoff

        # All retries failed
        error_msg = f"LLM call failed after {self.max_retries} attempts. Last error: {str(last_error)}"
        self.logger.error(error_msg)
        return f"Error in LLM analysis: {error_msg}"

    def _generate_mock_response(self, prompt: str) -> str:
        """Generate mock LLM response for testing"""
        if "JSON format" in prompt and "file_type" in prompt:
            # File analysis mock
            return """
            {
                "file_type": "Python module",
                "main_functions": ["main_function", "helper_function"],
                "key_concepts": ["data_processing", "algorithm"],
                "dependencies": ["numpy", "pandas"],
                "summary": "Mock analysis of code file functionality."
            }
            """
        elif "relationships" in prompt:
            # Relationship analysis mock
            return """
            {
                "relationships": [
                    {
                        "target_file_path": "src/core/mock.py",
                        "relationship_type": "partial_match",
                        "confidence_score": 0.8,
                        "helpful_aspects": ["algorithm implementation", "data structures"],
                        "potential_contributions": ["core functionality", "utility methods"],
                        "usage_suggestions": "Mock relationship suggestion for testing."
                    }
                ]
            }
            """
        elif "relevant_files" in prompt:
            # File filtering mock
            return """
            {
                "relevant_files": [
                    {
                        "file_path": "mock_file.py",
                        "relevance_reason": "Mock relevance reason",
                        "confidence": 0.9,
                        "expected_contribution": "Mock contribution"
                    }
                ],
                "summary": {
                    "total_files_analyzed": "10",
                    "relevant_files_count": "1",
                    "filtering_strategy": "Mock filtering strategy"
                }
            }
            """
        else:
            return "Mock LLM response for testing purposes."

    def _save_debug_response(self, provider: str, prompt: str, response: str):
        """Save LLM response for debugging"""
        try:
            import hashlib
            from datetime import datetime

            # Create a hash of the prompt for filename
            prompt_hash = hashlib.md5(prompt.encode()).hexdigest()[:8]
            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
            filename = f"{provider}_{timestamp}_{prompt_hash}.json"

            debug_data = {
                "timestamp": datetime.now().isoformat(),
                "provider": provider,
                "prompt": prompt[:500] + "..." if len(prompt) > 500 else prompt,
                "response": response,
                "full_prompt_length": len(prompt),
            }

            debug_file = Path(self.raw_responses_dir) / filename
            with open(debug_file, "w", encoding="utf-8") as f:
                json.dump(debug_data, f, indent=2, ensure_ascii=False)

        except Exception as e:
            self.logger.warning(f"Failed to save debug response: {e}")

    def get_all_repo_files(self, repo_path: Path) -> List[Path]:
        """Recursively get all supported files in a repository"""
        files = []

        try:
            for root, dirs, filenames in os.walk(repo_path):
                # Skip common non-code directories
                dirs[:] = [
                    d
                    for d in dirs
                    if not d.startswith(".") and d not in self.skip_directories
                ]

                for filename in filenames:
                    file_path = Path(root) / filename
                    if file_path.suffix.lower() in self.supported_extensions:
                        files.append(file_path)

        except Exception as e:
            self.logger.error(f"Error traversing {repo_path}: {e}")

        return files

    def generate_file_tree(self, repo_path: Path, max_depth: int = 5) -> str:
        """Generate file tree structure string for the repository"""
        tree_lines = []

        def add_to_tree(current_path: Path, prefix: str = "", depth: int = 0):
            if depth > max_depth:
                return

            try:
                items = sorted(
                    current_path.iterdir(), key=lambda x: (x.is_file(), x.name.lower())
                )
                # Filter out irrelevant directories and files
                items = [
                    item
                    for item in items
                    if not item.name.startswith(".")
                    and item.name not in self.skip_directories
                ]

                for i, item in enumerate(items):
                    is_last = i == len(items) - 1
                    current_prefix = "└── " if is_last else "├── "
                    tree_lines.append(f"{prefix}{current_prefix}{item.name}")

                    if item.is_dir():
                        extension_prefix = "    " if is_last else "│   "
                        add_to_tree(item, prefix + extension_prefix, depth + 1)
                    elif item.suffix.lower() in self.supported_extensions:
                        # Add file size information
                        try:
                            size = item.stat().st_size
                            if size > 1024:
                                size_str = f" ({size // 1024}KB)"
                            else:
                                size_str = f" ({size}B)"
                            tree_lines[-1] += size_str
                        except (OSError, PermissionError):
                            pass

            except PermissionError:
                tree_lines.append(f"{prefix}├── [Permission Denied]")
            except Exception as e:
                tree_lines.append(f"{prefix}├── [Error: {str(e)}]")

        tree_lines.append(f"{repo_path.name}/")
        add_to_tree(repo_path)
        return "\n".join(tree_lines)

    async def pre_filter_files(self, repo_path: Path, file_tree: str) -> List[str]:
        """Ask the LLM which files in the repository tree look relevant to the target structure.

        The prompt embeds ``self.target_structure`` and ``file_tree`` and asks
        for a JSON object with a ``relevant_files`` list. Entries whose
        confidence is above ``self.min_confidence_score`` are kept.

        Malformed entries (non-dict items, non-string paths, confidences that
        cannot be converted to ``float``) are skipped individually so that one
        bad entry does not discard the rest of the selection.

        Args:
            repo_path: Repository root. Not used by this method; kept for
                interface compatibility.
            file_tree: Text rendering of the repository file tree.

        Returns:
            The selected file paths as returned by the LLM, or an empty list
            when the response cannot be parsed or the call fails. Callers
            treat an empty list as "analyze all files".
        """
        filter_prompt = f"""
        You are a code analysis expert. Please analyze the following code repository file tree based on the target project structure and filter out files that may be relevant to the target project.

        Target Project Structure:
        {self.target_structure}

        Code Repository File Tree:
        {file_tree}

        Please analyze which files might be helpful for implementing the target project structure, including:
        - Core algorithm implementation files (such as GCN, recommendation systems, graph neural networks, etc.)
        - Data processing and preprocessing files
        - Loss functions and evaluation metric files
        - Configuration and utility files
        - Test files
        - Documentation files

        Please return the filtering results in JSON format:
        {{
            "relevant_files": [
                {{
                    "file_path": "file path relative to repository root",
                    "relevance_reason": "why this file is relevant",
                    "confidence": 0.0-1.0,
                    "expected_contribution": "expected contribution to the target project"
                }}
            ],
            "summary": {{
                "total_files_analyzed": "total number of files analyzed",
                "relevant_files_count": "number of relevant files",
                "filtering_strategy": "explanation of filtering strategy"
            }}
        }}

        Only return files with confidence > {self.min_confidence_score}. Focus on files related to recommendation systems, graph neural networks, and diffusion models.
        """

        try:
            self.logger.info("Starting LLM pre-filtering of files...")
            llm_response = await self._call_llm(
                filter_prompt,
                system_prompt="You are a professional code analysis and project architecture expert, skilled at identifying code file functionality and relevance.",
                max_tokens=2000,
            )

            # The model may wrap the JSON in prose; grab the outermost {...} span.
            match = re.search(r"\{.*\}", llm_response, re.DOTALL)
            if not match:
                self.logger.warning(
                    "Unable to parse LLM filtering response, will use all files"
                )
                return []

            filter_data = json.loads(match.group(0))
            relevant_files = filter_data.get("relevant_files") or []

            # Extract file paths, tolerating malformed individual entries.
            selected_files = []
            for file_info in relevant_files:
                if not isinstance(file_info, dict):
                    continue
                file_path = file_info.get("file_path", "")
                if not file_path or not isinstance(file_path, str):
                    continue
                try:
                    # LLMs sometimes quote numbers ("0.9"); accept those too.
                    confidence = float(file_info.get("confidence", 0.0))
                except (TypeError, ValueError):
                    continue
                # Use configured minimum confidence threshold
                if confidence > self.min_confidence_score:
                    selected_files.append(file_path)

            summary = filter_data.get("summary")
            if not isinstance(summary, dict):
                summary = {}
            self.logger.info(
                f"LLM filtering completed: {summary.get('relevant_files_count', len(selected_files))} relevant files selected"
            )
            self.logger.info(
                f"Filtering strategy: {summary.get('filtering_strategy', 'Not provided')}"
            )

            return selected_files

        except Exception as e:
            self.logger.error(f"LLM pre-filtering failed: {e}")
            self.logger.info("Will fallback to analyzing all files")
            return []

    def filter_files_by_paths(
        self, all_files: List[Path], selected_paths: List[str], repo_path: Path
    ) -> List[Path]:
        """Keep only the files whose repo-relative path matches an LLM-selected path.

        Matching is deliberately loose: a file is kept when its relative path
        and a selected path are equal, or when either one contains the other
        as a substring. Path separators are normalised to ``/`` on both sides
        before comparing, so ``\\``-style and ``/``-style paths match each
        other for the substring checks as well as for equality.

        Args:
            all_files: Candidate files, all located under ``repo_path``.
            selected_paths: Paths chosen by the LLM.
            repo_path: Repository root used to compute relative paths.

        Returns:
            ``all_files`` itself when ``selected_paths`` is empty, otherwise
            the matching files in their original order.

        Raises:
            ValueError: If a file is not located under ``repo_path``
                (raised by ``Path.relative_to``).
        """
        if not selected_paths:
            return all_files

        # Normalise once up front instead of once per file/selection pair.
        normalized_selected = [path.replace("\\", "/") for path in selected_paths]

        filtered_files = []
        for file_path in all_files:
            # Get path relative to repository root, with forward slashes
            relative_path = str(file_path.relative_to(repo_path)).replace("\\", "/")

            # Substring containment in either direction also covers equality.
            if any(
                selected in relative_path or relative_path in selected
                for selected in normalized_selected
            ):
                filtered_files.append(file_path)

        return filtered_files

    def _get_cache_key(self, file_path: Path) -> str:
        """Generate cache key for file content"""
        try:
            stats = file_path.stat()
            return f"{file_path}:{stats.st_mtime}:{stats.st_size}"
        except (OSError, PermissionError):
            return str(file_path)

    def _manage_cache_size(self):
        """Manage cache size to stay within limits"""
        if not self.enable_content_caching or not self.content_cache:
            return

        if len(self.content_cache) > self.max_cache_size:
            # Remove oldest entries (simple FIFO strategy)
            excess_count = len(self.content_cache) - self.max_cache_size + 10
            keys_to_remove = list(self.content_cache.keys())[:excess_count]

            for key in keys_to_remove:
                del self.content_cache[key]

            if self.verbose_output:
                self.logger.info(
                    f"Cache cleaned: removed {excess_count} entries, {len(self.content_cache)} entries remaining"
                )

    async def analyze_file_content(self, file_path: Path) -> FileSummary:
        """Summarise a single file with the LLM, using the content cache when enabled.

        Files larger than ``self.max_file_size`` are not read; a placeholder
        summary is returned instead. Otherwise the file text (truncated to
        ``self.max_content_length`` characters) is sent through
        ``self._call_llm`` and the JSON object in the reply is converted into
        a ``FileSummary``. When the reply contains no parseable JSON object, a
        minimal fallback analysis is used while the measured line count and
        modification time are still recorded.

        Args:
            file_path: File to analyse. Its path is reported relative to
                ``self.code_base_path``.

        Returns:
            A ``FileSummary``. If an unexpected error occurs, the summary has
            ``file_type="error"`` and its ``summary`` field carries the error
            text.
        """
        try:
            # Check file size before reading
            stats = file_path.stat()
            file_size = stats.st_size
            if file_size > self.max_file_size:
                self.logger.warning(
                    f"Skipping file {file_path} - size {file_size} bytes exceeds limit {self.max_file_size}"
                )
                return FileSummary(
                    file_path=str(file_path.relative_to(self.code_base_path)),
                    file_type="skipped - too large",
                    main_functions=[],
                    key_concepts=[],
                    dependencies=[],
                    summary=f"File skipped - size {file_size} bytes exceeds {self.max_file_size} byte limit",
                    lines_of_code=0,
                    last_modified=datetime.fromtimestamp(stats.st_mtime).isoformat(),
                )

            # Check cache if enabled
            cache_key = None
            if self.enable_content_caching:
                cache_key = self._get_cache_key(file_path)
                if cache_key in self.content_cache:
                    if self.verbose_output:
                        self.logger.info(f"Using cached analysis for {file_path.name}")
                    return self.content_cache[cache_key]

            # Undecodable bytes are dropped rather than failing the analysis.
            with open(file_path, "r", encoding="utf-8", errors="ignore") as f:
                content = f.read()

            # Count non-blank lines only.
            lines_of_code = len([line for line in content.split("\n") if line.strip()])

            # Truncate content based on config
            content_for_analysis = content[: self.max_content_length]
            content_suffix = "..." if len(content) > self.max_content_length else ""

            # Create analysis prompt
            analysis_prompt = f"""
            Analyze this code file and provide a structured summary:

            File: {file_path.name}
            Content:
            ```
            {content_for_analysis}{content_suffix}
            ```

            Please provide analysis in this JSON format:
            {{
                "file_type": "description of what type of file this is",
                "main_functions": ["list", "of", "main", "functions", "or", "classes"],
                "key_concepts": ["important", "concepts", "algorithms", "patterns"],
                "dependencies": ["external", "libraries", "or", "imports"],
                "summary": "2-3 sentence summary of what this file does"
            }}

            Focus on the core functionality and potential reusability.
            """

            # Get LLM analysis with configured parameters
            llm_response = await self._call_llm(analysis_prompt, max_tokens=1000)

            try:
                # The model may wrap the JSON in prose; grab the outermost {...} span.
                match = re.search(r"\{.*\}", llm_response, re.DOTALL)
                if match is None:
                    # Treat "no JSON at all" like malformed JSON so the
                    # fallback below is used instead of the error summary.
                    raise ValueError("no JSON object found in LLM response")
                analysis_data = json.loads(match.group(0))
            except ValueError:
                # json.JSONDecodeError is a ValueError subclass, so this
                # covers both a missing and an unparseable JSON object.
                analysis_data = {
                    "file_type": f"{file_path.suffix} file",
                    "main_functions": [],
                    "key_concepts": [],
                    "dependencies": [],
                    "summary": "File analysis failed - JSON parsing error",
                }

            file_summary = FileSummary(
                file_path=str(file_path.relative_to(self.code_base_path)),
                file_type=analysis_data.get("file_type", "unknown"),
                main_functions=analysis_data.get("main_functions", []),
                key_concepts=analysis_data.get("key_concepts", []),
                dependencies=analysis_data.get("dependencies", []),
                summary=analysis_data.get("summary", "No summary available"),
                lines_of_code=lines_of_code,
                last_modified=datetime.fromtimestamp(stats.st_mtime).isoformat(),
            )

            # Cache the result if caching is enabled
            if self.enable_content_caching and cache_key:
                self.content_cache[cache_key] = file_summary
                self._manage_cache_size()

            return file_summary

        except Exception as e:
            self.logger.error(f"Error analyzing file {file_path}: {e}")
            return FileSummary(
                file_path=str(file_path.relative_to(self.code_base_path)),
                file_type="error",
                main_functions=[],
                key_concepts=[],
                dependencies=[],
                summary=f"Analysis failed: {str(e)}",
                lines_of_code=0,
                last_modified="",
            )

    async def find_relationships(
        self, file_summary: FileSummary
    ) -> List[FileRelationship]:
        """Ask the LLM how an analysed repo file relates to the target structure.

        The prompt describes ``file_summary``, ``self.target_structure`` and
        the relationship types configured in ``self.relationship_types``.
        Relationships whose confidence is above ``self.min_confidence_score``
        are returned; unknown relationship types are mapped to
        ``"reference"``.

        The function/concept lists in ``file_summary`` originate from LLM
        output, so they are stringified defensively before being joined.
        Malformed individual relationship entries are skipped rather than
        discarding the whole response.

        Args:
            file_summary: Summary of the repository file to relate.

        Returns:
            The accepted relationships, or an empty list if the LLM call or
            response parsing fails (the error is logged).
        """

        # Build relationship type description from config
        relationship_type_desc = []
        for rel_type, weight in self.relationship_types.items():
            relationship_type_desc.append(f"- {rel_type} (priority: {weight})")

        # These lists may be None or contain non-string items; joining them
        # raw would raise TypeError outside the try block below.
        functions_text = ", ".join(map(str, file_summary.main_functions or []))
        concepts_text = ", ".join(map(str, file_summary.key_concepts or []))

        relationship_prompt = f"""
        Analyze the relationship between this existing code file and the target project structure.

        Existing File Analysis:
        - Path: {file_summary.file_path}
        - Type: {file_summary.file_type}
        - Functions: {functions_text}
        - Concepts: {concepts_text}
        - Summary: {file_summary.summary}

        Target Project Structure:
        {self.target_structure}

        Available relationship types (with priority weights):
        {chr(10).join(relationship_type_desc)}

        Identify potential relationships and provide analysis in this JSON format:
        {{
            "relationships": [
                {{
                    "target_file_path": "path/in/target/structure",
                    "relationship_type": "direct_match|partial_match|reference|utility",
                    "confidence_score": 0.0-1.0,
                    "helpful_aspects": ["specific", "aspects", "that", "could", "help"],
                    "potential_contributions": ["how", "this", "could", "contribute"],
                    "usage_suggestions": "detailed suggestion on how to use this file"
                }}
            ]
        }}

        Consider the priority weights when determining relationship types. Higher weight types should be preferred when multiple types apply.
        Only include relationships with confidence > {self.min_confidence_score}. Focus on concrete, actionable connections.
        """

        try:
            llm_response = await self._call_llm(relationship_prompt, max_tokens=1500)

            # The model may wrap the JSON in prose; grab the outermost {...} span.
            match = re.search(r"\{.*\}", llm_response, re.DOTALL)
            if match is None:
                raise ValueError("no JSON object found in LLM response")
            relationship_data = json.loads(match.group(0))

            relationships = []
            for rel_data in relationship_data.get("relationships") or []:
                if not isinstance(rel_data, dict):
                    continue
                try:
                    confidence_score = float(rel_data.get("confidence_score", 0.0))
                except (TypeError, ValueError):
                    # Skip just this entry; keep the other relationships.
                    continue
                relationship_type = rel_data.get("relationship_type", "reference")

                # Validate relationship type is in config
                if relationship_type not in self.relationship_types:
                    if self.verbose_output:
                        self.logger.warning(
                            f"Unknown relationship type '{relationship_type}', using 'reference'"
                        )
                    relationship_type = "reference"

                # Apply configured minimum confidence filter
                if confidence_score > self.min_confidence_score:
                    relationship = FileRelationship(
                        repo_file_path=file_summary.file_path,
                        target_file_path=rel_data.get("target_file_path", ""),
                        relationship_type=relationship_type,
                        confidence_score=confidence_score,
                        helpful_aspects=rel_data.get("helpful_aspects", []),
                        potential_contributions=rel_data.get(
                            "potential_contributions", []
                        ),
                        usage_suggestions=rel_data.get("usage_suggestions", ""),
                    )
                    relationships.append(relationship)

            return relationships

        except Exception as e:
            self.logger.error(
                f"Error finding relationships for {file_summary.file_path}: {e}"
            )
            return []

    async def _analyze_single_file_with_relationships(
        self, file_path: Path, index: int, total: int
    ) -> tuple:
        """Analyze a single file and its relationships (for concurrent processing)"""
        if self.verbose_output:
            self.logger.info(f"Analyzing file {index}/{total}: {file_path.name}")

        # Get file summary
        file_summary = await self.analyze_file_content(file_path)

        # Find relationships
        relationships = await self.find_relationships(file_summary)

        return file_summary, relationships

    async def process_repository(self, repo_path: Path) -> RepoIndex:
        """Index one repository: list files, optionally pre-filter, analyse, and package results.

        Steps:
            1. Render the repository file tree.
            2. Collect all candidate files.
            3. Optionally ask the LLM to pre-select relevant files.
            4. Narrow the file list to that selection (all files when the
               selection is empty).
            5. Analyse the files concurrently or sequentially, depending on
               ``self.enable_concurrent_analysis`` and the file count.
            6. Build a ``RepoIndex`` including analysis metadata.

        Args:
            repo_path: Root directory of the repository to index.

        Returns:
            The populated ``RepoIndex`` for the repository.
        """
        repo_name = repo_path.name
        self.logger.info(f"Processing repository: {repo_name}")

        # Step 1: Generate file tree
        self.logger.info("Generating file tree structure...")
        file_tree = self.generate_file_tree(repo_path)

        # Step 2: Get all files
        all_files = self.get_all_repo_files(repo_path)
        self.logger.info(f"Found {len(all_files)} files in {repo_name}")

        # Step 3: LLM pre-filtering of relevant files
        if self.enable_pre_filtering:
            self.logger.info("Using LLM for file pre-filtering...")
            selected_file_paths = await self.pre_filter_files(repo_path, file_tree)
        else:
            self.logger.info("Pre-filtering is disabled, will analyze all files")
            selected_file_paths = []

        # Step 4: Filter file list based on filtering results
        if selected_file_paths:
            files_to_analyze = self.filter_files_by_paths(
                all_files, selected_file_paths, repo_path
            )
            self.logger.info(
                f"After LLM filtering, will analyze {len(files_to_analyze)} relevant files (from {len(all_files)} total)"
            )
        else:
            files_to_analyze = all_files
            # Only report a filtering failure when filtering was attempted;
            # the disabled case has already been logged above.
            if self.enable_pre_filtering:
                self.logger.info("LLM filtering failed, will analyze all files")

        # Step 5: Analyze filtered files (concurrent or sequential)
        if self.enable_concurrent_analysis and len(files_to_analyze) > 1:
            self.logger.info(
                f"Using concurrent analysis with max {self.max_concurrent_files} parallel files"
            )
            file_summaries, all_relationships = await self._process_files_concurrently(
                files_to_analyze
            )
        else:
            self.logger.info("Using sequential file analysis")
            file_summaries, all_relationships = await self._process_files_sequentially(
                files_to_analyze
            )

        # Step 6: Create repository index
        repo_index = RepoIndex(
            repo_name=repo_name,
            total_files=len(all_files),  # Record original file count
            file_summaries=file_summaries,
            relationships=all_relationships,
            analysis_metadata={
                "analysis_date": datetime.now().isoformat(),
                "target_structure_analyzed": self.target_structure[:200] + "...",
                "total_relationships_found": len(all_relationships),
                "high_confidence_relationships": len(
                    [
                        r
                        for r in all_relationships
                        if r.confidence_score > self.high_confidence_threshold
                    ]
                ),
                "analyzer_version": "1.4.0",  # Updated version to reflect augmented LLM support
                "pre_filtering_enabled": self.enable_pre_filtering,
                "files_before_filtering": len(all_files),
                "files_after_filtering": len(files_to_analyze),
                # Percentage of files removed by pre-filtering.
                "filtering_efficiency": round(
                    (1 - len(files_to_analyze) / len(all_files)) * 100, 2
                )
                if all_files
                else 0,
                "config_file_used": self.indexer_config_path,
                "min_confidence_score": self.min_confidence_score,
                "high_confidence_threshold": self.high_confidence_threshold,
                "concurrent_analysis_used": self.enable_concurrent_analysis,
                "content_caching_enabled": self.enable_content_caching,
                # NOTE: despite the key name, this records the current number
                # of cached entries, not a count of cache hits.
                "cache_hits": len(self.content_cache) if self.content_cache else 0,
            },
        )

        return repo_index

    async def _process_files_sequentially(self, files_to_analyze: list) -> tuple:
        """Process files sequentially (original method)"""
        file_summaries = []
        all_relationships = []

        for i, file_path in enumerate(files_to_analyze, 1):
            (
                file_summary,
                relationships,
            ) = await self._analyze_single_file_with_relationships(
                file_path, i, len(files_to_analyze)
            )
            file_summaries.append(file_summary)
            all_relationships.extend(relationships)

            # Add configured delay to avoid overwhelming the LLM API
            await asyncio.sleep(self.request_delay)

        return file_summaries, all_relationships

    async def _process_files_concurrently(self, files_to_analyze: list) -> tuple:
        """Process files concurrently with semaphore limiting"""
        file_summaries = []
        all_relationships = []

        # Create semaphore to limit concurrent tasks
        semaphore = asyncio.Semaphore(self.max_concurrent_files)
        tasks = []

        async def _process_with_semaphore(file_path: Path, index: int, total: int):
            async with semaphore:
                # Add a small delay to space out concurrent requests
                if index > 1:
                    await asyncio.sleep(
                        self.request_delay * 0.5
                    )  # Reduced delay for concurrent processing
                return await self._analyze_single_file_with_relationships(
                    file_path, index, total
                )

        try:
            # Create tasks for all files
            tasks = [
                _process_with_semaphore(file_path, i, len(files_to_analyze))
                for i, file_path in enumerate(files_to_analyze, 1)
            ]

            # Process tasks and collect results
            if self.verbose_output:
                self.logger.info(
                    f"Starting concurrent analysis of {len(tasks)} files..."
                )

            try:
                results = await asyncio.gather(*tasks, return_exceptions=True)

                for i, result in enumerate(results):
                    if isinstance(result, Exception):
                        self.logger.error(
                            f"Failed to analyze file {files_to_analyze[i]}: {result}"
                        )
                        # Create error summary
                        error_summary = FileSummary(
                            file_path=str(
                                files_to_analyze[i].relative_to(self.code_base_path)
                            ),
                            file_type="error",
                            main_functions=[],
                            key_concepts=[],
                            dependencies=[],
                            summary=f"Concurrent analysis failed: {str(result)}",
                            lines_of_code=0,
                            last_modified="",
                        )
                        file_summaries.append(error_summary)
                    else:
                        file_summary, relationships = result
                        file_summaries.append(file_summary)
                        all_relationships.extend(relationships)

            except Exception as e:
                self.logger.error(f"Concurrent processing failed: {e}")
                # Cancel any remaining tasks
                for task in tasks:
                    if not task.done() and not task.cancelled():
                        task.cancel()

                # Wait for cancelled tasks to complete
                try:
                    await asyncio.sleep(0.1)  # Brief wait for cancellation
                except Exception:
                    pass

                # Fallback to sequential processing
                self.logger.info("Falling back to sequential processing...")
                return await self._process_files_sequentially(files_to_analyze)

            if self.verbose_output:
                self.logger.info(
                    f"Concurrent analysis completed: {len(file_summaries)} files processed"
                )

            return file_summaries, all_relationships

        except Exception as e:
            # Ensure all tasks are cancelled in case of unexpected errors
            if tasks:
                for task in tasks:
                    if not task.done() and not task.cancelled():
                        task.cancel()

            # Wait briefly for cancellation to complete
            try:
                await asyncio.sleep(0.1)
            except Exception:
                pass

            self.logger.error(f"Critical error in concurrent processing: {e}")
            # Fallback to sequential processing
            self.logger.info(
                "Falling back to sequential processing due to critical error..."
            )
            return await self._process_files_sequentially(files_to_analyze)

        finally:
            # Final cleanup: ensure all tasks are properly finished
            if tasks:
                for task in tasks:
                    if not task.done() and not task.cancelled():
                        task.cancel()

            # Clear task references to help with garbage collection
            tasks.clear()

            # Force garbage collection to help clean up semaphore and related resources
            import gc

            gc.collect()

    async def build_all_indexes(self) -> Dict[str, str]:
        """Build and save an index file for every repository under ``self.code_base_path``.

        Every non-hidden sub-directory of the code base is treated as one
        repository. Each repository is processed independently: a failure is
        logged and the remaining repositories are still processed. Summary
        and statistics reports are written afterwards when enabled.

        Returns:
            Mapping of repository name to the path of its saved index file
            (only repositories that were processed successfully).

        Raises:
            FileNotFoundError: If ``self.code_base_path`` does not exist.
            ValueError: If it contains no repository directories.
        """
        if not self.code_base_path.exists():
            raise FileNotFoundError(
                f"Code base path does not exist: {self.code_base_path}"
            )

        # Get all repository directories
        repo_dirs = [
            d
            for d in self.code_base_path.iterdir()
            if d.is_dir() and not d.name.startswith(".")
        ]

        if not repo_dirs:
            raise ValueError(f"No repositories found in {self.code_base_path}")

        self.logger.info(f"Found {len(repo_dirs)} repositories to process")

        # Output configuration is the same for every repository.
        output_config = self.indexer_config.get("output", {})
        json_indent = output_config.get("json_indent", 2)
        # Pass the configured value straight through: ``ensure_ascii: false``
        # in the config means non-ASCII text is written unescaped.
        ensure_ascii = bool(output_config.get("ensure_ascii", False))

        # Process each repository
        output_files = {}
        statistics_data = []

        for repo_dir in repo_dirs:
            try:
                # Process repository
                repo_index = await self.process_repository(repo_dir)

                # Generate output filename using configured pattern
                output_filename = self.index_filename_pattern.format(
                    repo_name=repo_index.repo_name
                )
                output_file = self.output_dir / output_filename

                # Serialise before opening the file so a conversion error
                # does not leave an empty index file behind.
                index_data = asdict(repo_index)
                if not self.include_metadata:
                    # Save without metadata if disabled
                    index_data.pop("analysis_metadata", None)

                # Save to JSON file
                with open(output_file, "w", encoding="utf-8") as f:
                    json.dump(
                        index_data, f, indent=json_indent, ensure_ascii=ensure_ascii
                    )

                output_files[repo_index.repo_name] = str(output_file)
                self.logger.info(
                    f"Saved index for {repo_index.repo_name} to {output_file}"
                )

                # Collect statistics for report
                if self.generate_statistics:
                    stats = self._extract_repository_statistics(repo_index)
                    statistics_data.append(stats)

            except Exception as e:
                self.logger.error(f"Failed to process repository {repo_dir.name}: {e}")
                continue

        # Generate additional reports if configured
        if self.generate_summary:
            summary_path = self.generate_summary_report(output_files)
            self.logger.info(f"Generated summary report: {summary_path}")

        if self.generate_statistics:
            stats_path = self.generate_statistics_report(statistics_data)
            self.logger.info(f"Generated statistics report: {stats_path}")

        return output_files

    def _extract_repository_statistics(self, repo_index: RepoIndex) -> Dict[str, Any]:
        """Condense a repository index into a flat statistics record.

        The record contains file and relationship counts, per-type tallies,
        line-of-code totals and averages, the mean relationship confidence,
        and a few values copied from the index's analysis metadata (with
        defaults when a metadata key is absent).
        """

        def _tally(labels):
            # Occurrence count per label, in first-seen order.
            counts = {}
            for label in labels:
                counts[label] = counts.get(label, 0) + 1
            return counts

        meta = repo_index.analysis_metadata

        relationship_type_counts = _tally(
            link.relationship_type for link in repo_index.relationships
        )
        file_type_counts = _tally(
            entry.file_type for entry in repo_index.file_summaries
        )

        # Averages default to 0 when there is nothing to average over.
        total_lines = sum(entry.lines_of_code for entry in repo_index.file_summaries)
        if repo_index.file_summaries:
            mean_lines = total_lines / len(repo_index.file_summaries)
        else:
            mean_lines = 0

        if repo_index.relationships:
            confidence_sum = sum(
                link.confidence_score for link in repo_index.relationships
            )
            mean_confidence = confidence_sum / len(repo_index.relationships)
        else:
            mean_confidence = 0

        record = {
            "repo_name": repo_index.repo_name,
            "total_files": repo_index.total_files,
            "analyzed_files": len(repo_index.file_summaries),
            "total_relationships": len(repo_index.relationships),
            "high_confidence_relationships": meta.get(
                "high_confidence_relationships", 0
            ),
            "relationship_type_counts": relationship_type_counts,
            "file_type_counts": file_type_counts,
            "total_lines_of_code": total_lines,
            "average_lines_per_file": round(mean_lines, 2),
            "average_confidence_score": round(mean_confidence, 3),
            "filtering_efficiency": meta.get("filtering_efficiency", 0),
            "concurrent_analysis_used": meta.get("concurrent_analysis_used", False),
            "cache_hits": meta.get("cache_hits", 0),
            "analysis_date": meta.get("analysis_date", "unknown"),
        }
        return record

    def generate_statistics_report(self, statistics_data: List[Dict[str, Any]]) -> str:
        """Aggregate per-repository statistics and write them to a JSON report.

        The report is written to ``self.output_dir / self.stats_filename`` and
        contains the configuration in use, totals and per-repository averages,
        merged relationship-type and file-type distributions, the raw
        per-repository records, and a few performance metrics.

        Args:
            statistics_data: One statistics record per processed repository.
                Each record must provide ``analyzed_files``,
                ``total_relationships``, ``total_lines_of_code``,
                ``relationship_type_counts`` and ``file_type_counts``. An
                empty list is accepted and yields zeroed aggregates.

        Returns:
            The path of the written report, as a string.
        """
        stats_path = self.output_dir / self.stats_filename

        # Calculate aggregate statistics
        total_repos = len(statistics_data)
        total_files_analyzed = sum(stat["analyzed_files"] for stat in statistics_data)
        total_relationships = sum(
            stat["total_relationships"] for stat in statistics_data
        )
        total_lines = sum(stat["total_lines_of_code"] for stat in statistics_data)

        # Aggregate relationship types
        aggregated_rel_types = {}
        for stat in statistics_data:
            for rel_type, count in stat["relationship_type_counts"].items():
                aggregated_rel_types[rel_type] = (
                    aggregated_rel_types.get(rel_type, 0) + count
                )

        # Aggregate file types
        aggregated_file_types = {}
        for stat in statistics_data:
            for file_type, count in stat["file_type_counts"].items():
                aggregated_file_types[file_type] = (
                    aggregated_file_types.get(file_type, 0) + count
                )

        # Calculate averages (0 when no repository was processed)
        avg_files_per_repo = total_files_analyzed / total_repos if total_repos else 0
        avg_relationships_per_repo = (
            total_relationships / total_repos if total_repos else 0
        )
        avg_lines_per_repo = total_lines / total_repos if total_repos else 0

        # Build statistics report
        statistics_report = {
            "report_generation_time": datetime.now().isoformat(),
            "analyzer_version": "1.4.0",
            "configuration_used": {
                "config_file": self.indexer_config_path,
                "concurrent_analysis_enabled": self.enable_concurrent_analysis,
                "content_caching_enabled": self.enable_content_caching,
                "pre_filtering_enabled": self.enable_pre_filtering,
                "min_confidence_score": self.min_confidence_score,
                "high_confidence_threshold": self.high_confidence_threshold,
            },
            "aggregate_statistics": {
                "total_repositories_processed": total_repos,
                "total_files_analyzed": total_files_analyzed,
                "total_relationships_found": total_relationships,
                "total_lines_of_code": total_lines,
                "average_files_per_repository": round(avg_files_per_repo, 2),
                "average_relationships_per_repository": round(
                    avg_relationships_per_repo, 2
                ),
                "average_lines_per_repository": round(avg_lines_per_repo, 2),
            },
            "relationship_type_distribution": aggregated_rel_types,
            "file_type_distribution": aggregated_file_types,
            "repository_details": statistics_data,
            "performance_metrics": {
                "concurrent_processing_repos": sum(
                    1
                    for s in statistics_data
                    if s.get("concurrent_analysis_used", False)
                ),
                "cache_efficiency": {
                    "total_cache_hits": sum(
                        s.get("cache_hits", 0) for s in statistics_data
                    ),
                    "repositories_with_caching": sum(
                        1 for s in statistics_data if s.get("cache_hits", 0) > 0
                    ),
                },
                "filtering_efficiency": {
                    "average_filtering_efficiency": round(
                        sum(s.get("filtering_efficiency", 0) for s in statistics_data)
                        / total_repos,
                        2,
                    )
                    if total_repos
                    else 0,
                    "max_filtering_efficiency": max(
                        (s.get("filtering_efficiency", 0) for s in statistics_data),
                        default=0,
                    ),
                    "min_filtering_efficiency": min(
                        (s.get("filtering_efficiency", 0) for s in statistics_data),
                        default=0,
                    ),
                },
            },
        }

        # Get output configuration
        output_config = self.indexer_config.get("output", {})
        json_indent = output_config.get("json_indent", 2)
        # Pass the configured value straight through: ``ensure_ascii: false``
        # in the config means non-ASCII text is written unescaped.
        ensure_ascii = bool(output_config.get("ensure_ascii", False))

        with open(stats_path, "w", encoding="utf-8") as f:
            json.dump(
                statistics_report, f, indent=json_indent, ensure_ascii=ensure_ascii
            )

        return str(stats_path)

    def generate_summary_report(self, output_files: Dict[str, str]) -> str:
        """Write ``indexing_summary.json`` describing the indexes that were created.

        The summary records the completion time, the generated index files,
        the target structure, the code base path, and the main configuration
        values in effect.

        Args:
            output_files: Mapping of repository name to saved index file path.

        Returns:
            The path of the written summary report, as a string.
        """
        report_path = self.output_dir / "indexing_summary.json"

        # Get output configuration from config file
        output_config = self.indexer_config.get("output", {})
        json_indent = output_config.get("json_indent", 2)
        # Pass the configured value straight through: ``ensure_ascii: false``
        # in the config means non-ASCII text is written unescaped.
        ensure_ascii = bool(output_config.get("ensure_ascii", False))

        summary_data = {
            "indexing_completion_time": datetime.now().isoformat(),
            "total_repositories_processed": len(output_files),
            "output_files": output_files,
            "target_structure": self.target_structure,
            "code_base_path": str(self.code_base_path),
            "configuration": {
                "config_file_used": self.indexer_config_path,
                "api_config_file": self.config_path,
                "pre_filtering_enabled": self.enable_pre_filtering,
                "min_confidence_score": self.min_confidence_score,
                "high_confidence_threshold": self.high_confidence_threshold,
                "max_file_size": self.max_file_size,
                "max_content_length": self.max_content_length,
                "request_delay": self.request_delay,
                "supported_extensions_count": len(self.supported_extensions),
                "skip_directories_count": len(self.skip_directories),
            },
        }

        with open(report_path, "w", encoding="utf-8") as f:
            json.dump(summary_data, f, indent=json_indent, ensure_ascii=ensure_ascii)

        return str(report_path)


async def main():
    """Run the code indexer end to end and print a progress report.

    Builds a ``CodeIndexer`` from the hard-coded paths and target structure
    below, prints the effective settings, awaits ``build_all_indexes()`` and
    lists the produced files. Errors are reported on stdout instead of being
    raised; a traceback is printed only when the indexer was created and its
    ``verbose_output`` flag is set.
    """

    # Locations used by this entry point.
    config_file = "DeepCode/tools/indexer_config.yaml"
    api_config_file = "DeepCode/mcp_agent.secrets.yaml"
    code_base_path = "DeepCode/deepcode_lab/papers/1/code_base/"
    output_dir = "DeepCode/deepcode_lab/papers/1/indexes/"

    # Project layout the indexed code is matched against; customise per project.
    target_structure = """
    project/
    ├── src/
    │   ├── core/
    │   │   ├── gcn.py        # GCN encoder
    │   │   ├── diffusion.py  # forward/reverse processes
    │   │   ├── denoiser.py   # denoising MLP
    │   │   └── fusion.py     # fusion combiner
    │   ├── models/           # model wrapper classes
    │   │   └── recdiff.py
    │   ├── utils/
    │   │   ├── data.py       # loading & preprocessing
    │   │   ├── predictor.py  # scoring functions
    │   │   ├── loss.py       # loss functions
    │   │   ├── metrics.py    # NDCG, Recall etc.
    │   │   └── sched.py      # beta/alpha schedule utils
    │   └── configs/
    │       └── default.yaml  # hyperparameters, paths
    ├── tests/
    │   ├── test_gcn.py
    │   ├── test_diffusion.py
    │   ├── test_denoiser.py
    │   ├── test_loss.py
    │   └── test_pipeline.py
    ├── docs/
    │   ├── architecture.md
    │   ├── api_reference.md
    │   └── README.md
    ├── experiments/
    │   ├── run_experiment.py
    │   └── notebooks/
    │       └── analysis.ipynb
    ├── requirements.txt
    └── setup.py
    """

    def state(flag):
        """Render a truthy/falsy setting as 'enabled' or 'disabled'."""
        return "enabled" if flag else "disabled"

    print("🚀 Starting Code Indexer with Enhanced Configuration Support")
    print(f"📋 Configuration file: {config_file}")
    print(f"🔑 API configuration file: {api_config_file}")

    # Stays None when construction itself fails, so the generic error handler
    # can tell whether there is an indexer to consult for debug output.
    indexer = None
    try:
        indexer = CodeIndexer(
            code_base_path=code_base_path,
            target_structure=target_structure,
            output_dir=output_dir,
            config_path=api_config_file,
            indexer_config_path=config_file,
            enable_pre_filtering=True,
        )

        # Echo the effective configuration.
        models = indexer.default_models
        print(f"📁 Code base path: {indexer.code_base_path}")
        print(f"📂 Output directory: {indexer.output_dir}")
        print(
            f"🤖 Default models: Anthropic={models['anthropic']}, OpenAI={models['openai']}"
        )
        print(f"🔧 Preferred LLM: {get_preferred_llm_class(api_config_file).__name__}")
        print(f"⚡ Concurrent analysis: {state(indexer.enable_concurrent_analysis)}")
        print(f"🗄️  Content caching: {state(indexer.enable_content_caching)}")
        print(f"🔍 Pre-filtering: {state(indexer.enable_pre_filtering)}")
        print(f"🐛 Debug mode: {state(indexer.verbose_output)}")
        print(f"🎭 Mock responses: {state(indexer.mock_llm_responses)}")

        # Fail early on unusable inputs.
        if not indexer.code_base_path.exists():
            raise FileNotFoundError(
                f"Code base path does not exist: {indexer.code_base_path}"
            )
        if not target_structure:
            raise ValueError("Target structure is required for analysis")

        print("\n🔧 Starting indexing process...")
        output_files = await indexer.build_all_indexes()

        print("\n✅ Indexing completed successfully!")
        print(f"📊 Processed {len(output_files)} repositories")
        print("📁 Output files:")
        for repo_name, file_path in output_files.items():
            print(f"   - {repo_name}: {file_path}")

        # Mention the optional reports only when they are present on disk.
        if indexer.generate_summary:
            summary_file = indexer.output_dir / indexer.summary_filename
            if summary_file.exists():
                print(f"📋 Summary report: {summary_file}")

        if indexer.generate_statistics:
            stats_file = indexer.output_dir / indexer.stats_filename
            if stats_file.exists():
                print(f"📈 Statistics report: {stats_file}")

        if indexer.enable_content_caching and indexer.content_cache:
            print(f"🗄️  Cache performance: {len(indexer.content_cache)} items cached")

        print("\n🎉 Code indexing process completed successfully!")

    except FileNotFoundError as e:
        print(f"❌ File not found error: {e}")
        print("💡 Please check your configuration file paths")
    except ValueError as e:
        print(f"❌ Configuration error: {e}")
        print("💡 Please check your configuration file settings")
    except Exception as e:
        print(f"❌ Indexing failed: {e}")
        print("💡 Check the logs for more details")

        # A traceback is shown only when an indexer exists and asks for it.
        if indexer is not None and indexer.verbose_output:
            import traceback

            print("\n🐛 Debug information:")
            traceback.print_exc()


def print_usage_example():
    """Print the built-in help text listing common configuration scenarios."""
    usage_text = """
    📖 Code Indexer Usage Examples:

    1. Basic usage with config file:
       - Update paths in indexer_config.yaml
       - Run: python code_indexer.py

    2. Enable debugging:
       - Set debug.verbose_output: true in config
       - Set debug.save_raw_responses: true to save LLM responses

    3. Enable concurrent processing:
       - Set performance.enable_concurrent_analysis: true
       - Adjust performance.max_concurrent_files as needed

    4. Enable caching:
       - Set performance.enable_content_caching: true
       - Adjust performance.max_cache_size as needed

    5. Mock mode for testing:
       - Set debug.mock_llm_responses: true
       - No API calls will be made

    6. Custom output:
       - Modify output.index_filename_pattern
       - Set output.generate_statistics: true for detailed reports

    📋 Configuration file location: tools/indexer_config.yaml
    """
    print(usage_text)


if __name__ == "__main__":
    import sys

    # The first command-line argument may request the usage text instead of
    # an indexing run.
    wants_help = len(sys.argv) > 1 and sys.argv[1] in ("--help", "-h", "help")

    if wants_help:
        print_usage_example()
    else:
        asyncio.run(main())


================================================
FILE: tools/code_reference_indexer.py
================================================
#!/usr/bin/env python3
"""
Code Reference Indexer MCP Tool - Unified Version

Specialized MCP tool for searching relevant index content in indexes folder
and formatting it for LLM code implementation reference.

Core Features:
1. **UNIFIED TOOL**: Combined search_code_references that handles directory setup, loading, and searching in one call
2. Match relevant reference code based on target file path and functionality requirements
3. Format output of relevant code examples, functions and concepts
4. Provide structured reference information for LLM use

Key Improvement:
- Single tool call that handles all steps internally
- Agent only needs to provide indexes_path and target_file
- No dependency on calling order or global state management
"""

import json
from pathlib import Path
from typing import Dict, List, Tuple
from dataclasses import dataclass
import logging

# Import MCP modules
from mcp.server.fastmcp import FastMCP

# Configure logging at INFO level when this module is imported, and create
# the module-level logger used by the helpers and tools below.
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# FastMCP server instance: the @mcp.tool() functions below register on it and
# main() starts it with mcp.run().
mcp = FastMCP("code-reference-indexer")


@dataclass
class CodeReference:
    """One indexed source file, as read from an index's ``file_summaries`` list.

    Instances are built by ``extract_code_references`` and scored against a
    target file by ``calculate_relevance_score``.
    """

    # Path of the indexed file; its stem and suffix drive name/type matching.
    file_path: str
    # File-type label taken from the index; also searched for keywords.
    file_type: str
    # Function names listed for the file in the index.
    main_functions: List[str]
    # Concept labels listed for the file in the index.
    key_concepts: List[str]
    # Dependencies listed for the file in the index.
    dependencies: List[str]
    # Free-text summary; the formatted output shows at most 300 characters.
    summary: str
    # Line count recorded in the index.
    lines_of_code: int
    # ``repo_name`` of the index the entry came from ("Unknown" when absent).
    repo_name: str
    # Not populated by extract_code_references; stays at the 0.0 default there.
    confidence_score: float = 0.0


@dataclass
class RelationshipInfo:
    """One entry of an index's ``relationships`` list.

    Instances are built by ``extract_relationships`` and matched against a
    target file by ``find_direct_relationships_in_cache``.
    """

    # Path of the reference-repository file the relationship points to.
    repo_file_path: str
    # Path of the target file the relationship was recorded for.
    target_file_path: str
    # Relationship label taken from the index.
    relationship_type: str
    # Score used to sort matching relationships, highest first.
    confidence_score: float
    # Strings joined with ", " in the formatted output.
    helpful_aspects: List[str]
    # Strings joined with ", " in the formatted output.
    potential_contributions: List[str]
    # Free-text advice printed verbatim in the formatted output.
    usage_suggestions: str


def load_index_files_from_directory(indexes_directory: str) -> Dict[str, Dict]:
    """Load every ``*.json`` index file found directly in a directory.

    Args:
        indexes_directory: Directory to scan (resolved to an absolute path).

    Returns:
        Mapping of file stem to parsed JSON object. Returns an empty mapping
        when the path does not exist or is not a directory. Files that cannot
        be read or parsed, and files whose top-level JSON value is not an
        object, are logged and skipped so one bad file cannot break a search.
    """
    indexes_path = Path(indexes_directory).resolve()

    if not indexes_path.exists():
        logger.warning(f"Indexes directory does not exist: {indexes_path}")
        return {}

    if not indexes_path.is_dir():
        logger.warning(f"Indexes path is not a directory: {indexes_path}")
        return {}

    index_cache: Dict[str, Dict] = {}

    # Sorted so the load order does not depend on the filesystem's listing
    # order, which keeps results reproducible between runs.
    for index_file in sorted(indexes_path.glob("*.json")):
        try:
            with open(index_file, "r", encoding="utf-8") as f:
                index_data = json.load(f)
        except Exception as e:
            # Best effort: report the bad file and keep loading the rest.
            logger.error(f"Failed to load index file {index_file.name}: {e}")
            continue

        # Callers use index_data.get(...); anything but a JSON object would
        # make them fail later, so reject it here.
        if not isinstance(index_data, dict):
            logger.warning(
                f"Skipping index file {index_file.name}: top-level JSON value is not an object"
            )
            continue

        index_cache[index_file.stem] = index_data
        logger.info(f"Loaded index file: {index_file.name}")

    logger.info(f"Loaded {len(index_cache)} index files from {indexes_path}")
    return index_cache


def extract_code_references(index_data: Dict) -> List[CodeReference]:
    """Build ``CodeReference`` objects from an index's ``file_summaries``.

    A key that is missing and a key whose value is JSON ``null`` are treated
    the same way: the field falls back to its empty default. ``dict.get``
    defaults alone only cover the missing-key case, and a ``None`` list would
    break the later ``" ".join(...)`` calls on these fields.

    Args:
        index_data: Parsed index object.

    Returns:
        One ``CodeReference`` per file summary that is a JSON object, in index
        order. Entries that are not objects are skipped.
    """
    repo_name = index_data.get("repo_name") or "Unknown"
    references = []

    for file_summary in index_data.get("file_summaries") or []:
        if not isinstance(file_summary, dict):
            continue  # malformed entry; nothing to read from it

        references.append(
            CodeReference(
                file_path=file_summary.get("file_path") or "",
                file_type=file_summary.get("file_type") or "",
                main_functions=file_summary.get("main_functions") or [],
                key_concepts=file_summary.get("key_concepts") or [],
                dependencies=file_summary.get("dependencies") or [],
                summary=file_summary.get("summary") or "",
                lines_of_code=file_summary.get("lines_of_code") or 0,
                repo_name=repo_name,
            )
        )

    return references


def extract_relationships(index_data: Dict) -> List[RelationshipInfo]:
    """Build ``RelationshipInfo`` objects from an index's ``relationships``.

    A key that is missing and a key whose value is JSON ``null`` both fall
    back to the field's empty default. ``dict.get`` defaults alone only cover
    the missing-key case, and a ``None`` value would break the later sorting
    and ``", ".join(...)`` formatting of these fields.

    Args:
        index_data: Parsed index object.

    Returns:
        One ``RelationshipInfo`` per relationship entry that is a JSON object,
        in index order. Entries that are not objects are skipped.
    """
    relationships = []

    for rel in index_data.get("relationships") or []:
        if not isinstance(rel, dict):
            continue  # malformed entry; nothing to read from it

        relationships.append(
            RelationshipInfo(
                repo_file_path=rel.get("repo_file_path") or "",
                target_file_path=rel.get("target_file_path") or "",
                relationship_type=rel.get("relationship_type") or "",
                confidence_score=rel.get("confidence_score") or 0.0,
                helpful_aspects=rel.get("helpful_aspects") or [],
                potential_contributions=rel.get("potential_contributions") or [],
                usage_suggestions=rel.get("usage_suggestions") or "",
            )
        )

    return relationships


def calculate_relevance_score(
    target_file: str, reference: CodeReference, keywords: List[str] = None
) -> float:
    """Score how relevant a reference file is to a target file.

    The score is the sum of three parts, capped at 1.0:

    * 0.3 when one file stem contains the other (case-insensitive),
    * 0.2 when both files share the same extension (case-insensitive),
    * up to 0.5 scaled by the fraction of ``keywords`` found in the
      reference's concepts, functions, summary and file type.

    Empty stems and empty extensions never count as a match: an empty string
    is a substring of every string and equal to every other empty string, so
    a reference without a path would otherwise look similar to every target.

    Args:
        target_file: Path of the file to be implemented.
        reference: Candidate reference; only its ``file_path``,
            ``key_concepts``, ``main_functions``, ``summary`` and
            ``file_type`` attributes are read.
        keywords: Optional search terms; ``None`` or empty skips the keyword
            part.

    Returns:
        Relevance score between 0.0 and 1.0.
    """
    score = 0.0
    target_path = Path(target_file)
    reference_path = Path(reference.file_path)

    # File name similarity
    target_name = target_path.stem.lower()
    ref_name = reference_path.stem.lower()
    if (
        target_name
        and ref_name
        and (target_name in ref_name or ref_name in target_name)
    ):
        score += 0.3

    # File type matching (lower-cased, like the name comparison above)
    target_extension = target_path.suffix.lower()
    ref_extension = reference_path.suffix.lower()
    if target_extension and target_extension == ref_extension:
        score += 0.2

    # Keyword matching
    if keywords:
        total_searchable_text = (
            " ".join(reference.key_concepts)
            + " "
            + " ".join(reference.main_functions)
            + " "
            + reference.summary
            + " "
            + reference.file_type
        ).lower()

        keyword_matches = sum(
            1 for keyword in keywords if keyword.lower() in total_searchable_text
        )
        score += (keyword_matches / len(keywords)) * 0.5

    return min(score, 1.0)


def find_relevant_references_in_cache(
    target_file: str,
    index_cache: Dict[str, Dict],
    keywords: List[str] = None,
    max_results: int = 10,
) -> List[Tuple[CodeReference, float]]:
    """Rank the cached references by relevance to ``target_file``.

    Every reference of every loaded index is scored with
    ``calculate_relevance_score``; only scores above 0.1 are kept.

    Args:
        target_file: Path of the file to be implemented.
        index_cache: Loaded indexes, keyed by index name.
        keywords: Optional search terms forwarded to the scorer.
        max_results: Upper bound on the number of pairs returned.

    Returns:
        ``(reference, score)`` pairs, highest score first.
    """
    scored = []

    for index_data in index_cache.values():
        for candidate in extract_code_references(index_data):
            relevance = calculate_relevance_score(target_file, candidate, keywords)
            # Drop candidates with no meaningful relevance.
            if relevance > 0.1:
                scored.append((candidate, relevance))

    ranked = sorted(scored, key=lambda pair: pair[1], reverse=True)
    return ranked[:max_results]


def find_direct_relationships_in_cache(
    target_file: str, index_cache: Dict[str, Dict]
) -> List[RelationshipInfo]:
    """Collect the relationships recorded for ``target_file`` in any index.

    Both the requested path and each relationship's target path are
    normalised (surrounding slashes stripped, then the first matching common
    prefix removed). A relationship matches when either normalised path
    contains the other, or either raw path contains the other.

    Empty paths never match: an empty string is a substring of every string,
    so an empty target, or a relationship without a target path, would
    otherwise match everything.

    Args:
        target_file: Path of the file to be implemented.
        index_cache: Loaded indexes, keyed by index name.

    Returns:
        Matching relationships, highest confidence score first.
    """
    common_prefixes = ("src/", "core/", "lib/", "main/", "./")

    def _normalize(path: str) -> str:
        """Strip surrounding slashes and at most one leading common prefix."""
        normalized = path.strip("/")
        for prefix in common_prefixes:
            if normalized.startswith(prefix):
                return normalized[len(prefix) :]
        return normalized

    normalized_target = _normalize(target_file or "")
    if not normalized_target:
        return []  # nothing to look up

    relationships = []

    # Collect relationship information from all index files
    for index_data in index_cache.values():
        for rel in extract_relationships(index_data):
            rel_target = rel.target_file_path or ""
            normalized_rel_target = _normalize(rel_target)
            if not normalized_rel_target:
                continue  # relationship without a usable target path

            # Substring containment in either direction also covers equality.
            if (
                normalized_target in normalized_rel_target
                or normalized_rel_target in normalized_target
                or target_file in rel_target
                or rel_target in target_file
            ):
                relationships.append(rel)

    # Sort by confidence score
    relationships.sort(key=lambda x: x.confidence_score, reverse=True)

    return relationships


def format_reference_output(
    target_file: str,
    relevant_refs: List[Tuple[CodeReference, float]],
    relationships: List[RelationshipInfo],
) -> str:
    """Render references and relationships as a Markdown report.

    The report holds up to five direct relationships, up to eight relevant
    references, aggregated implementation hints taken from the five
    best-ranked references, and a fixed list of next actions.

    Summaries longer than 300 characters are cut and marked with "...".
    Shorter summaries are printed unchanged, so the ellipsis only appears
    when text was actually dropped.

    Args:
        target_file: Path of the file to be implemented (used in the title).
        relevant_refs: ``(reference, score)`` pairs, best first.
        relationships: Direct relationships, best first.

    Returns:
        The report as a single newline-joined string.
    """
    summary_limit = 300
    output_lines = []

    output_lines.append(f"# Code Reference Information - {target_file}")
    output_lines.append("=" * 80)
    output_lines.append("")

    # Direct relationship information
    if relationships:
        output_lines.append("## 🎯 Direct Relationships")
        output_lines.append("")

        for i, rel in enumerate(relationships[:5], 1):
            output_lines.append(f"### {i}. {rel.repo_file_path}")
            output_lines.append(f"**Relationship Type**: {rel.relationship_type}")
            output_lines.append(f"**Confidence Score**: {rel.confidence_score:.2f}")
            output_lines.append(
                f"**Helpful Aspects**: {', '.join(rel.helpful_aspects)}"
            )
            output_lines.append(
                f"**Potential Contributions**: {', '.join(rel.potential_contributions)}"
            )
            output_lines.append(f"**Usage Suggestions**: {rel.usage_suggestions}")
            output_lines.append("")

    # Relevant code references
    if relevant_refs:
        output_lines.append("## 📚 Relevant Code References")
        output_lines.append("")

        for i, (ref, score) in enumerate(relevant_refs[:8], 1):
            summary = ref.summary or ""
            if len(summary) > summary_limit:
                # Mark the cut so readers know the summary is incomplete.
                summary = summary[:summary_limit] + "..."

            output_lines.append(f"### {i}. {ref.file_path} (Relevance: {score:.2f})")
            output_lines.append(f"**Repository**: {ref.repo_name}")
            output_lines.append(f"**File Type**: {ref.file_type}")
            output_lines.append(
                f"**Main Functions**: {', '.join(ref.main_functions[:5])}"
            )
            output_lines.append(f"**Key Concepts**: {', '.join(ref.key_concepts[:8])}")
            output_lines.append(f"**Dependencies**: {', '.join(ref.dependencies[:6])}")
            output_lines.append(f"**Lines of Code**: {ref.lines_of_code}")
            output_lines.append(f"**Summary**: {summary}")
            output_lines.append("")

    # Implementation suggestions
    output_lines.append("## 💡 Implementation Suggestions")
    output_lines.append("")

    if relevant_refs:
        # Aggregate names across the best-ranked references; sets drop
        # duplicates and sorting keeps the listing stable.
        all_functions = set()
        all_concepts = set()
        all_dependencies = set()

        for ref, _ in relevant_refs[:5]:
            all_functions.update(ref.main_functions)
            all_concepts.update(ref.key_concepts)
            all_dependencies.update(ref.dependencies)

        output_lines.append("**Reference Function Name Patterns**:")
        output_lines.extend(f"- {func}" for func in sorted(all_functions)[:10])
        output_lines.append("")

        output_lines.append("**Important Concepts and Patterns**:")
        output_lines.extend(f"- {concept}" for concept in sorted(all_concepts)[:15])
        output_lines.append("")

        output_lines.append("**Potential Dependencies Needed**:")
        output_lines.extend(f"- {dep}" for dep in sorted(all_dependencies)[:10])
        output_lines.append("")

    output_lines.append("## 🚀 Next Actions")
    output_lines.append(
        "1. Analyze design patterns and architectural styles from the above reference code"
    )
    output_lines.append("2. Determine core functionalities and interfaces to implement")
    output_lines.append("3. Choose appropriate dependency libraries and tools")
    output_lines.append(
        "4. Design implementation solution consistent with existing code style"
    )
    output_lines.append("5. Start writing specific code implementation")

    return "\n".join(output_lines)


# ==================== MCP Tool Definitions ====================


@mcp.tool()
async def search_code_references(
    indexes_path: str, target_file: str, keywords: str = "", max_results: int = 10
) -> str:
    """
    **UNIFIED TOOL**: Search the index files for reference code that helps implement a target file.
    Index loading, keyword parsing, searching and formatting all happen in this one call.

    Args:
        indexes_path: Path to the indexes directory containing JSON index files
        target_file: Target file path (file to be implemented)
        keywords: Search keywords, comma-separated
        max_results: Maximum number of references to return

    Returns:
        JSON string with a "status" field; on success it also carries the
        formatted reference report and search statistics, on error a message
    """

    def error_response(message: str) -> str:
        """Serialise an error payload for this request."""
        payload = {
            "status": "error",
            "message": message,
            "target_file": target_file,
            "indexes_path": indexes_path,
        }
        return json.dumps(payload, ensure_ascii=False, indent=2)

    try:
        # Load every index file found in the given directory.
        logger.info(f"Loading index files from: {indexes_path}")
        index_cache = load_index_files_from_directory(indexes_path)
        if not index_cache:
            return error_response(
                f"No index files found or failed to load from: {indexes_path}"
            )

        # Split the comma-separated keywords, dropping blank entries.
        keyword_list = []
        if keywords:
            for piece in keywords.split(","):
                cleaned = piece.strip()
                if cleaned:
                    keyword_list.append(cleaned)

        # Rank references, collect direct relationships, then render both.
        relevant_refs = find_relevant_references_in_cache(
            target_file, index_cache, keyword_list, max_results
        )
        relationships = find_direct_relationships_in_cache(target_file, index_cache)
        formatted_output = format_reference_output(
            target_file, relevant_refs, relationships
        )

        payload = {
            "status": "success",
            "target_file": target_file,
            "indexes_path": indexes_path,
            "keywords_used": keyword_list,
            "total_references_found": len(relevant_refs),
            "total_relationships_found": len(relationships),
            "formatted_content": formatted_output,
            "indexes_loaded": list(index_cache.keys()),
            "total_indexes_loaded": len(index_cache),
        }

        logger.info(
            f"Successfully found {len(relevant_refs)} references and {len(relationships)} relationships for {target_file}"
        )
        return json.dumps(payload, ensure_ascii=False, indent=2)

    except Exception as e:
        # Tool boundary: report the failure to the caller instead of raising.
        logger.error(f"Error in search_code_references: {str(e)}")
        return error_response(f"Failed to search reference code: {str(e)}")


@mcp.tool()
async def get_indexes_overview(indexes_path: str) -> str:
    """
    Get an overview of all reference code indexes available in a directory.

    For every loaded index the overview lists its repository name, file
    count, the sorted set of file types, up to 20 sorted concepts and the
    number of recorded relationships. Fields that are missing or JSON null
    are treated as empty, so one incomplete index cannot fail the overview.

    Args:
        indexes_path: Path to the indexes directory containing JSON index files

    Returns:
        JSON string with a "status" field; on success it carries the
        overview, on error a message
    """
    try:
        # Load index files from specified directory
        index_cache = load_index_files_from_directory(indexes_path)

        if not index_cache:
            result = {
                "status": "error",
                "message": f"No index files found in: {indexes_path}",
                "indexes_path": indexes_path,
            }
            return json.dumps(result, ensure_ascii=False, indent=2)

        overview = {"total_repos": len(index_cache), "repositories": {}}

        for repo_name, index_data in index_cache.items():
            # Collect file types and concepts
            file_types = set()
            concepts = set()

            for file_summary in index_data.get("file_summaries") or []:
                file_type = file_summary.get("file_type", "Unknown")
                # A null file type cannot be sorted alongside strings.
                file_types.add("Unknown" if file_type is None else file_type)
                concepts.update(file_summary.get("key_concepts") or [])

            overview["repositories"][repo_name] = {
                "repo_name": index_data.get("repo_name", repo_name),
                "total_files": index_data.get("total_files", 0),
                "file_types": sorted(file_types),
                "main_concepts": sorted(concepts)[:20],  # Limit concept count
                "total_relationships": len(index_data.get("relationships") or []),
            }

        result = {
            "status": "success",
            "overview": overview,
            "indexes_directory": str(Path(indexes_path).resolve()),
            "total_indexes_loaded": len(index_cache),
        }

        return json.dumps(result, ensure_ascii=False, indent=2)

    except Exception as e:
        # Log like search_code_references does, so failures are not silent.
        logger.error(f"Error in get_indexes_overview: {str(e)}")
        result = {
            "status": "error",
            "message": f"Failed to get indexes overview: {str(e)}",
            "indexes_path": indexes_path,
        }
        return json.dumps(result, ensure_ascii=False, indent=2)


def main():
    """Log the available tools, then start the MCP server."""
    startup_messages = (
        "Starting unified Code Reference Indexer MCP server",
        "Available tools:",
        "1. search_code_references(indexes_path, target_file, keywords, max_results) - UNIFIED TOOL",
        "2. get_indexes_overview(indexes_path) - Get overview of available indexes",
    )
    for message in startup_messages:
        logger.info(message)

    # Hand control to the FastMCP server.
    mcp.run()


# Start the MCP server only when this file is executed as a script.
if __name__ == "__main__":
    main()


================================================
FILE: tools/command_executor.py
================================================
#!/usr/bin/env python3
"""
Command Executor MCP Tool / 命令执行器 MCP 工具

专门负责执行LLM生成的shell命令来创建文件树结构
Specialized in executing LLM-generated shell commands to create file tree structures
"""

import subprocess
from pathlib import Path
from typing import List, Dict
from mcp.server.models import InitializationOptions
import mcp.types as types
from mcp.server import NotificationOptions, Server
import mcp.server.stdio

# Create the MCP server instance; the handlers below register on it through
# the @app.list_tools() and @app.call_tool() decorators.
app = Server("command-executor")


@app.list_tools()
async def handle_list_tools() -> list[types.Tool]:
    """
    List the tools offered by this server.

    Two tools are advertised: ``execute_commands`` (a newline-separated batch
    of shell commands) and ``execute_single_command``. Both require a
    ``working_directory`` string alongside the command text.
    """

    def string_field(title: str, description: str) -> dict:
        """Build the JSON-schema entry for one string parameter."""
        return {"type": "string", "title": title, "description": description}

    def object_schema(properties: dict) -> dict:
        """Build an object schema in which every listed property is required."""
        return {
            "type": "object",
            "properties": properties,
            "required": list(properties),
        }

    batch_tool = types.Tool(
        name="execute_commands",
        description="""
            执行shell命令列表来创建文件树结构
            Execute shell command list to create file tree structure

            Args:
                commands: 要执行的shell命令列表（每行一个命令）
                working_directory: 执行命令的工作目录

            Returns:
                命令执行结果和详细报告
            """,
        inputSchema=object_schema(
            {
                "commands": string_field(
                    "Commands", "要执行的shell命令列表，每行一个命令"
                ),
                "working_directory": string_field(
                    "Working Directory", "执行命令的工作目录"
                ),
            }
        ),
    )

    single_tool = types.Tool(
        name="execute_single_command",
        description="""
            执行单个shell命令
            Execute single shell command

            Args:
                command: 要执行的单个命令
                working_directory: 执行命令的工作目录

            Returns:
                命令执行结果
            """,
        inputSchema=object_schema(
            {
                "command": string_field("Command", "要执行的单个shell命令"),
                "working_directory": string_field(
                    "Working Directory", "执行命令的工作目录"
                ),
            }
        ),
    )

    return [batch_tool, single_tool]


@app.call_tool()
async def handle_call_tool(name: str, arguments: dict) -> list[types.TextContent]:
    """
    Dispatch a tool call to its implementation.

    Missing arguments default to an empty command string and to "." as the
    working directory. Any exception, including an unknown tool name, is
    returned to the caller as a text message instead of being raised.
    """
    try:
        if name == "execute_commands":
            batch = arguments.get("commands", "")
            workdir = arguments.get("working_directory", ".")
            return await execute_command_batch(batch, workdir)

        if name == "execute_single_command":
            single = arguments.get("command", "")
            workdir = arguments.get("working_directory", ".")
            return await execute_single_command(single, workdir)

        raise ValueError(f"未知工具 / Unknown tool: {name}")

    except Exception as e:
        error_text = f"工具执行错误 / Error executing tool {name}: {str(e)}"
        return [types.TextContent(type="text", text=error_text)]


async def execute_command_batch(
    commands: str, working_directory: str
) -> list[types.TextContent]:
    """
    Execute several shell commands, one per non-blank line.

    The working directory is created when missing. Every command runs in its
    own shell with a 30 second timeout; a failure or timeout of one command
    does not stop the remaining ones.

    Args:
        commands: Command list, one command per line
        working_directory: Directory the commands run in

    Returns:
        A single text item: the execution summary followed by one entry per
        command, or an error message when the batch could not be run at all
    """
    try:
        # Make sure the working directory exists before running anything.
        Path(working_directory).mkdir(parents=True, exist_ok=True)

        command_lines = []
        for raw_line in commands.strip().split("\n"):
            cleaned = raw_line.strip()
            if cleaned:
                command_lines.append(cleaned)

        if not command_lines:
            return [
                types.TextContent(
                    type="text", text="没有提供有效命令 / No valid commands provided"
                )
            ]

        report = []
        stats = {"successful": 0, "failed": 0, "timeout": 0}

        for index, command in enumerate(command_lines, 1):
            try:
                # NOTE(review): the command text goes through a shell
                # (shell=True); it must come from a trusted source.
                completed = subprocess.run(
                    command,
                    shell=True,
                    cwd=working_directory,
                    capture_output=True,
                    text=True,
                    timeout=30,  # 30 second timeout
                )

                if completed.returncode == 0:
                    outcome = "successful"
                    report.append(f"✅ Command {index}: {command}")
                    stdout_text = completed.stdout.strip()
                    if stdout_text:
                        report.append(f"   输出 / Output: {stdout_text}")
                else:
                    outcome = "failed"
                    report.append(f"❌ Command {index}: {command}")
                    stderr_text = completed.stderr.strip()
                    if stderr_text:
                        report.append(f"   错误 / Error: {stderr_text}")
                stats[outcome] += 1

            except subprocess.TimeoutExpired:
                report.append(f"⏱️ Command {index} 超时 / timeout: {command}")
                stats["timeout"] += 1
            except Exception as e:
                report.append(
                    f"💥 Command {index} 异常 / exception: {command} - {str(e)}"
                )
                stats["failed"] += 1

        # Summary header first, then the per-command details.
        summary = generate_execution_summary(working_directory, command_lines, stats)
        full_text = summary + "\n" + "\n".join(report)

        return [types.TextContent(type="text", text=full_text)]

    except Exception as e:
        return [
            types.TextContent(
                type="text",
                text=f"批量命令执行失败 / Failed to execute command batch: {str(e)}",
            )
        ]


async def execute_single_command(
    command: str, working_directory: str
) -> list[types.TextContent]:
    """
    Execute one shell command.

    The working directory is created when missing and the command runs in a
    shell with a 30 second timeout.

    Args:
        command: Command to execute
        working_directory: Directory the command runs in

    Returns:
        A single text item holding the formatted result, a timeout notice or
        an error message
    """
    try:
        # Make sure the working directory exists before running the command.
        Path(working_directory).mkdir(parents=True, exist_ok=True)

        # NOTE(review): the command text goes through a shell (shell=True);
        # it must come from a trusted source.
        completed = subprocess.run(
            command,
            shell=True,
            cwd=working_directory,
            capture_output=True,
            text=True,
            timeout=30,
        )

        report = format_single_command_result(command, working_directory, completed)
        return [types.TextContent(type="text", text=report)]

    except subprocess.TimeoutExpired:
        timeout_text = f"⏱️ 命令超时 / Command timeout: {command}"
        return [types.TextContent(type="text", text=timeout_text)]
    except Exception as e:
        error_text = f"💥 命令执行错误 / Command execution error: {str(e)}"
        return [types.TextContent(type="text", text=error_text)]


def generate_execution_summary(
    working_directory: str, command_lines: List[str], stats: Dict[str, int]
) -> str:
    """
    Build the header of the batch execution report.

    Args:
        working_directory: Directory the commands were run in.
        command_lines: The commands of the batch; only their count is used.
        stats: Counters; must provide the keys "successful", "failed" and
            "timeout".

    Returns:
        A multi-line summary that starts with a blank line and ends with the
        dashed rule introducing the detailed results (no trailing newline).
    """
    heavy_rule = "=" * 50
    light_rule = "-" * 50

    report_lines = [
        "",  # the report opens with an empty line
        "命令执行总结 / Command Execution Summary:",
        heavy_rule,
        f"工作目录 / Working Directory: {working_directory}",
        f"总命令数 / Total Commands: {len(command_lines)}",
        f"成功 / Successful: {stats['successful']}",
        f"失败 / Failed: {stats['failed']}",
        f"超时 / Timeout: {stats['timeout']}",
        "",
        "详细结果 / Detailed Results:",
        light_rule,
    ]
    return "\n".join(report_lines)


def format_single_command_result(
    command: str, working_directory: str, result: subprocess.CompletedProcess
) -> str:
    """
    Render the outcome of one finished command as a text report.

    Args:
        command: The command that was executed.
        working_directory: Directory the command ran in.
        result: Completed process; ``returncode`` is always read, ``stdout``
            only on success and ``stderr`` only on failure.

    Returns:
        Header block followed by a status line and, when the relevant stream
        is non-blank, the stripped stdout (success) or stderr (failure).
    """
    parts = [
        f"""
单命令执行 / Single Command Execution:
{'='*40}
工作目录 / Working Directory: {working_directory}
命令 / Command: {command}
返回码 / Return Code: {result.returncode}

"""
    ]

    # A zero return code is the only success criterion.
    if result.returncode != 0:
        parts.append("❌ 状态 / Status: FAILED / 失败\n")
        label = "错误 / Error"
        captured = result.stderr.strip()
    else:
        parts.append("✅ 状态 / Status: SUCCESS / 成功\n")
        label = "输出 / Output"
        captured = result.stdout.strip()

    # Blank streams are omitted entirely rather than shown as empty sections.
    if captured:
        parts.append(f"{label}:\n{captured}\n")

    return "".join(parts)


async def main():
    """
    Run the command-executor MCP server over stdio.
    """
    async with mcp.server.stdio.stdio_server() as streams:
        read_stream, write_stream = streams

        # Advertise the server's capabilities with default notification
        # options and no experimental features.
        capabilities = app.get_capabilities(
            notification_options=NotificationOptions(),
            experimental_capabilities={},
        )
        init_options = InitializationOptions(
            server_name="command-executor",
            server_version="1.0.0",
            capabilities=capabilities,
        )

        await app.run(read_stream, write_stream, init_options)


if __name__ == "__main__":
    # Script entry point: run the async main() coroutine to completion.
    import asyncio

    asyncio.run(main())


================================================
FILE: tools/document_segmentation_server.py
================================================
#!/usr/bin/env python3
"""
Document Segmentation MCP Server

This MCP server provides intelligent document segmentation and retrieval functions for handling
large research papers and technical documents that exceed LLM token limits.

==== CORE FUNCTIONALITY ====
1. Analyze document structure and type using semantic content analysis
2. Create intelligent segments based on content semantics, not just structure
3. Provide query-aware segment retrieval with relevance scoring
4. Support both structured (papers with headers) and unstructured documents
5. Configurable segmentation strategies based on document complexity

==== MCP TOOLS PROVIDED ====

📄 analyze_and_segment_document(paper_dir: str, force_refresh: bool = False)
   Purpose: Analyzes document structure and creates intelligent segments
   - Detects document type (research paper, technical doc, algorithm-focused, etc.)
   - Selects optimal segmentation strategy based on content analysis
   - Creates semantic segments preserving algorithm and concept integrity
   - Stores segmentation index for efficient retrieval
   - Returns: JSON with segmentation status, strategy used, and segment count

📖 read_document_segments(paper_dir: str, query_type: str, keywords: List[str] = None,
                         max_segments: int = 3, max_total_chars: int = None)
   Purpose: Intelligently retrieves relevant document segments based on query context
   - query_type: "concept_analysis", "algorithm_extraction", or "code_planning"
   - Uses semantic relevance scoring to rank segments
   - Applies query-specific filtering and keyword matching
   - Dynamically calculates optimal character limits based on content complexity
   - Returns: JSON with selected segments optimized for the specific query type

📋 get_document_overview(paper_dir: str)
   Purpose: Provides high-level overview of document structure and available segments
   - Shows document type and segmentation strategy used
   - Lists all segments with titles, content types, and relevance scores
   - Displays segment statistics (character counts, keyword summaries)
   - Returns: JSON with complete document analysis metadata

==== SEGMENTATION STRATEGIES ====
- semantic_research_focused: For academic papers with complex algorithmic content
- algorithm_preserve_integrity: Maintains algorithm blocks and formula chains intact
- concept_implementation_hybrid: Merges related concepts with implementation details
- semantic_chunking_enhanced: Advanced boundary detection for long documents
- content_aware_segmentation: Adaptive chunking based on content density

==== INTELLIGENT FEATURES ====
- Semantic boundary detection (not just structural)
- Algorithm block identification and preservation
- Formula chain recognition and grouping
- Concept-implementation relationship mapping
- Multi-level relevance scoring (content type, importance, keyword matching)
- Backward compatibility with existing document indexes
- Configurable via mcp_agent.config.yaml (enabled/disabled, size thresholds)

Usage:
python tools/document_segmentation_server.py
"""

import os
import re
import json
import sys
import io
from typing import Dict, List, Tuple
import hashlib
import logging
from datetime import datetime
from dataclasses import dataclass, asdict

# Switch stdout/stderr to UTF-8 when stdout reports a different encoding.
if sys.stdout.encoding != "utf-8":
    try:
        if hasattr(sys.stdout, "reconfigure"):
            sys.stdout.reconfigure(encoding="utf-8")
            sys.stderr.reconfigure(encoding="utf-8")
        else:
            # Streams without reconfigure(): re-wrap the underlying buffers.
            sys.stdout = io.TextIOWrapper(sys.stdout.detach(), encoding="utf-8")
            sys.stderr = io.TextIOWrapper(sys.stderr.detach(), encoding="utf-8")
    except Exception as e:
        # Warn on stderr, never stdout.
        # NOTE(review): this server is presumably launched over the MCP stdio
        # transport, where stdout must carry protocol messages only — confirm.
        print(f"Warning: Could not set UTF-8 encoding: {e}", file=sys.stderr)

# Import MCP related modules
from mcp.server.fastmcp import FastMCP

# Configure root logging at INFO level and create this module's logger
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# FastMCP server instance, registered under the name "document-segmentation-server"
mcp = FastMCP("document-segmentation-server")


@dataclass
class DocumentSegment:
    """One segment of a document together with its descriptive metadata."""

    id: str  # Segment identifier
    title: str  # Title or heading associated with the segment
    content: str  # Text of the segment
    content_type: str  # "introduction", "methodology", "algorithm", "results", etc.
    keywords: List[str]  # Keywords associated with the segment
    char_start: int  # Start position in the source document
    char_end: int  # End position in the source document
    char_count: int  # Segment size; NOTE(review): presumably len(content) — confirm
    relevance_scores: Dict[str, float]  # Scores for different query types
    section_path: str  # e.g., "3.2.1" for nested sections


@dataclass
class DocumentIndex:
    """Index of one segmented document: its segments plus document-level metadata."""

    document_path: str  # Path of the indexed document
    # Document type label, e.g. "academic_paper", "technical_doc", "code_doc", "general".
    # NOTE(review): DocumentAnalyzer.analyze_document_type returns "research_paper",
    # "algorithm_focused", "technical_doc", "implementation_guide" or
    # "general_document" — confirm which label set is actually stored here.
    document_type: str
    segmentation_strategy: str  # Name of the strategy used to segment the document
    total_segments: int  # Number of segments
    total_chars: int  # Total size of the document
    segments: List[DocumentSegment]  # The segments themselves
    created_at: str  # Creation timestamp, stored as a string


class DocumentAnalyzer:
    """Heuristic document analyzer driven by keyword and regex signals.

    It classifies a document's type and picks a segmentation strategy from
    weighted keyword occurrences and a handful of regex patterns. All keyword
    matching is plain substring matching on the text.
    """

    # Semantic indicators, grouped by importance tier
    ALGORITHM_INDICATORS = {
        "high": [
            "algorithm",
            "procedure",
            "method",
            "approach",
            "technique",
            "framework",
        ],
        "medium": ["step", "process", "implementation", "computation", "calculation"],
        "low": ["example", "illustration", "demonstration"],
    }

    TECHNICAL_CONCEPT_INDICATORS = {
        "high": ["formula", "equation", "theorem", "lemma", "proof", "definition"],
        "medium": ["parameter", "variable", "function", "model", "architecture"],
        "low": ["notation", "symbol", "term"],
    }

    IMPLEMENTATION_INDICATORS = {
        "high": ["code", "implementation", "programming", "software", "system"],
        "medium": ["design", "structure", "module", "component", "interface"],
        "low": ["tool", "library", "package"],
    }

    # Regex signatures of document types (searched with re.DOTALL)
    RESEARCH_PAPER_PATTERNS = [
        r"(?i)\babstract\b.*?\n.*?(introduction|motivation|background)",
        r"(?i)(methodology|method).*?(experiment|evaluation|result)",
        r"(?i)(conclusion|future work|limitation).*?(reference|bibliography)",
        r"(?i)(related work|literature review|prior art)",
    ]

    TECHNICAL_DOC_PATTERNS = [
        r"(?i)(getting started|installation|setup).*?(usage|example)",
        r"(?i)(api|interface|specification).*?(parameter|endpoint)",
        r"(?i)(tutorial|guide|walkthrough).*?(step|instruction)",
        r"(?i)(troubleshooting|faq|common issues)",
    ]

    # Multiplier applied to every term of an indicator tier
    _LEVEL_WEIGHTS = {"high": 3.0, "medium": 2.0, "low": 1.0}

    def analyze_document_type(self, content: str) -> Tuple[str, float]:
        """
        Classify a document from keyword scores and regex pattern hits.

        Args:
            content: Full document text.

        Returns:
            Tuple[str, float]: (document_type, confidence_score), where
            document_type is one of "research_paper", "algorithm_focused",
            "technical_doc", "implementation_guide" or "general_document".
        """
        content_lower = content.lower()

        # Weighted keyword scores (computed on the lower-cased text)
        algorithm_score = self._calculate_weighted_score(
            content_lower, self.ALGORITHM_INDICATORS
        )
        concept_score = self._calculate_weighted_score(
            content_lower, self.TECHNICAL_CONCEPT_INDICATORS
        )
        implementation_score = self._calculate_weighted_score(
            content_lower, self.IMPLEMENTATION_INDICATORS
        )

        # Fraction of each pattern family that matches (patterns are
        # case-insensitive themselves, so the original text is used)
        research_pattern_score = self._detect_pattern_score(
            content, self.RESEARCH_PAPER_PATTERNS
        )
        technical_pattern_score = self._detect_pattern_score(
            content, self.TECHNICAL_DOC_PATTERNS
        )

        # Pattern hits count double relative to keyword scores
        total_research_score = (
            algorithm_score + concept_score + research_pattern_score * 2
        )
        total_technical_score = implementation_score + technical_pattern_score * 2

        # First matching rule wins; order encodes priority
        if research_pattern_score > 0.5 and total_research_score > 3.0:
            return "research_paper", min(0.95, 0.6 + research_pattern_score * 0.35)
        if algorithm_score > 2.0 and concept_score > 1.5:
            return "algorithm_focused", 0.85
        if total_technical_score > 2.5:
            return "technical_doc", 0.8
        if implementation_score > 1.5:
            return "implementation_guide", 0.75
        return "general_document", 0.5

    def _calculate_weighted_score(
        self, content: str, indicators: Dict[str, List[str]]
    ) -> float:
        """Sum tier-weighted scores for every indicator term found in ``content``.

        A term that occurs ``k > 0`` times contributes
        ``weight * (k * 0.5 + 1)``; absent terms contribute nothing.

        Args:
            content: Text to scan (callers pass it lower-cased).
            indicators: Mapping of tier ("high"/"medium"/"low") to terms.

        Raises:
            KeyError: If ``indicators`` contains an unknown tier name.
        """
        score = 0.0
        for weight_level, terms in indicators.items():
            weight = self._LEVEL_WEIGHTS[weight_level]
            for term in terms:
                occurrences = content.count(term)
                if occurrences:
                    score += weight * (occurrences * 0.5 + 1)
        return score

    def _detect_pattern_score(self, content: str, patterns: List[str]) -> float:
        """Return the fraction of ``patterns`` found in ``content``.

        An empty pattern list scores 0.0 instead of dividing by zero.
        """
        if not patterns:
            return 0.0
        matches = sum(
            1 for pattern in patterns if re.search(pattern, content, re.DOTALL)
        )
        return matches / len(patterns)

    def detect_segmentation_strategy(self, content: str, doc_type: str) -> str:
        """
        Choose a segmentation strategy from the document type and content metrics.

        Args:
            content: Full document text.
            doc_type: Document type label, e.g. from ``analyze_document_type``.

        Returns:
            One of "semantic_research_focused", "algorithm_preserve_integrity",
            "concept_implementation_hybrid", "semantic_chunking_enhanced" or
            "content_aware_segmentation".
        """
        algorithm_density = self._calculate_algorithm_density(content)
        concept_complexity = self._calculate_concept_complexity(content)
        implementation_detail_level = self._calculate_implementation_detail_level(
            content
        )

        # First matching rule wins; order encodes priority
        if doc_type == "research_paper" and algorithm_density > 0.3:
            return "semantic_research_focused"
        if doc_type == "algorithm_focused" or algorithm_density > 0.5:
            return "algorithm_preserve_integrity"
        if concept_complexity > 0.4 and implementation_detail_level > 0.3:
            return "concept_implementation_hybrid"
        if len(content) > 15000:  # Long documents
            return "semantic_chunking_enhanced"
        return "content_aware_segmentation"

    def _calculate_algorithm_density(self, content: str) -> float:
        """Estimate the share of the text that belongs to algorithm blocks.

        Every pattern hit is widened by 200 characters before and 800 after
        (clipped to the document). Overlapping windows are counted more than
        once, so the ratio is an estimate capped at 1.0. Empty content yields
        0.0.
        """
        total_chars = len(content)
        if total_chars == 0:
            # Nothing to measure; avoids a division by zero below.
            return 0.0

        algorithm_patterns = [
            r"(?i)(algorithm\s+\d+|procedure\s+\d+)",
            r"(?i)(step\s+\d+|phase\s+\d+)",
            r"(?i)(input:|output:|return:|initialize:)",
            r"(?i)(for\s+each|while|if.*then|else)",
            r"(?i)(function|method|procedure).*\(",
        ]

        algorithm_chars = 0
        for pattern in algorithm_patterns:
            for match in re.finditer(pattern, content):
                # Estimated block extent around the match point
                start = max(0, match.start() - 200)
                end = min(total_chars, match.end() + 800)
                algorithm_chars += end - start

        return min(1.0, algorithm_chars / total_chars)

    def _calculate_concept_complexity(self, content: str) -> float:
        """Score technical-concept term frequency, normalized to the 0-1 range.

        Each occurrence of a TECHNICAL_CONCEPT_INDICATORS term adds its tier
        weight; the sum is divided by 100 and capped at 1.0.
        """
        lowered = content.lower()  # lower-case once, not once per term
        complexity_score = 0.0

        for level, terms in self.TECHNICAL_CONCEPT_INDICATORS.items():
            weight = self._LEVEL_WEIGHTS[level]
            for term in terms:
                complexity_score += lowered.count(term) * weight

        return min(1.0, complexity_score / 100)

    def _calculate_implementation_detail_level(self, content: str) -> float:
        """Score implementation-related vocabulary, normalized to the 0-1 range.

        Counts all case-insensitive hits of the implementation patterns,
        divides by 50 and caps the result at 1.0.
        """
        implementation_patterns = [
            r"(?i)(code|implementation|programming)",
            r"(?i)(class|function|method|variable)",
            r"(?i)(import|include|library)",
            r"(?i)(parameter|argument|return)",
            r"(?i)(example|demo|tutorial)",
        ]

        detail_score = sum(
            len(re.findall(pattern, content)) for pattern in implementation_patterns
        )
        return min(1.0, detail_score / 50)


class DocumentSegmenter:
    """Creates intelligent segments from documents"""

    def __init__(self):
        """Create the segmenter together with its own DocumentAnalyzer."""
        self.analyzer = DocumentAnalyzer()

    def segment_document(self, content: str, strategy: str) -> List[DocumentSegment]:
        """
        Perform intelligent segmentation using the specified strategy
        """
        if strategy == "semantic_research_focused":
            return self._segment_research_paper_semantically(content)
        elif strategy == "algorithm_preserve_integrity":
            return self._segment_preserve_algorithm_integrity(content)
        elif strategy == "concept_implementation_hybrid":
            return self._segment_concept_implementation_hybrid(content)
        elif strategy == "semantic_chunking_enhanced":
            return self._segment_by_enhanced_semantic_chunks(content)
        elif strategy == "content_aware_segmentation":
            return self._segment_content_aware(content)
        else:
            # Compatibility with legacy strategies
            return self._segment_by_enhanced_semantic_chunks(content)

    def _segment_by_headers(self, content: str) -> List[DocumentSegment]:
        """Segment document based on markdown headers"""
        segments = []
        lines = content.split("\n")
        current_segment = []
        current_header = None
        char_pos = 0

        for line in lines:
            line_with_newline = line + "\n"

            # Check if line is a header
            header_match = re.match(r"^(#{1,6})\s+(.+)$", line)

            if header_match:
                # Save previous segment if exists
                if current_segment and current_header:
                    segment_content = "\n".join(current_segment).strip()
                    if segment_content:
                        # Analyze content type and importance
                        content_type = self._classify_content_type(
                            current_header, segment_content
                        )
                        importance_score = (
                            0.8 if content_type in ["algorithm", "formula"] else 0.7
                        )

                        segment = self._create_enhanced_segment(
                            segment_content,
                            current_header,
                            char_pos - len(segment_content.encode("utf-8")),
                            char_pos,
                            importance_score,
                            content_type,
                        )
                        segments.append(segment)

                # Start new segment
                current_header = header_match.group(2).strip()
                current_segment = [line]
            else:
                if current_segment is not None:
                    current_segment.append(line)

            char_pos += len(line_with_newline.encode("utf-8"))

        # Add final segment
        if current_segment and current_header:
            segment_content = "\n".join(current_segment).strip()
            if segment_content:
                # Analyze content type and importance
                content_type = self._classify_content_type(
                    current_header, segment_content
                )
                importance_score = (
                    0.8 if content_type in ["algorithm", "formula"] else 0.7
                )

                segment = self._create_enhanced_segment(
                    segment_content,
                    current_header,
                    char_pos - len(segment_content.encode("utf-8")),
                    char_pos,
                    importance_score,
                    content_type,
                )
                segments.append(segment)

        return segments

    def _segment_preserve_algorithm_integrity(
        self, content: str
    ) -> List[DocumentSegment]:
        """Smart segmentation strategy that preserves algorithm integrity"""
        segments = []

        # 1. Identify algorithm blocks and related descriptions
        algorithm_blocks = self._identify_algorithm_blocks(content)

        # 2. Identify concept definition groups
        concept_groups = self._identify_concept_groups(content)

        # 3. Identify formula derivation chains
        formula_chains = self._identify_formula_chains(content)

        # 4. Merge related content blocks to ensure integrity
        content_blocks = self._merge_related_content_blocks(
            algorithm_blocks, concept_groups, formula_chains, content
        )

        # 5. Convert to DocumentSegment
        for i, block in enumerate(content_blocks):
            segment = self._create_enhanced_segment(
                block["content"],
                block["title"],
                block["start_pos"],
                block["end_pos"],
                block["importance_score"],
                block["content_type"],
            )
            segments.append(segment)

        return segments

    def _segment_research_paper_semantically(
        self, content: str
    ) -> List[DocumentSegment]:
        """Semantic segmentation specifically for research papers"""
        segments = []

        # Identify semantic structure of research papers
        paper_sections = self._identify_research_paper_sections(content)

        for section in paper_sections:
            # Ensure each section contains sufficient context
            enhanced_content = self._enhance_section_with_context(section, content)

            segment = self._create_enhanced_segment(
                enhanced_content["content"],
                enhanced_content["title"],
                enhanced_content["start_pos"],
                enhanced_content["end_pos"],
                enhanced_content["importance_score"],
                enhanced_content["content_type"],
            )
            segments.append(segment)

        return segments

    def _segment_concept_implementation_hybrid(
        self, content: str
    ) -> List[DocumentSegment]:
        """Intelligent segmentation combining concepts and implementation"""
        segments = []

        # Identify concept-implementation correspondence
        concept_impl_pairs = self._identify_concept_implementation_pairs(content)

        for pair in concept_impl_pairs:
            # Merge related concepts and implementations into one segment
            merged_content = self._merge_concept_with_implementation(pair, content)

            segment = self._create_enhanced_segment(
                merged_content["content"],
                merged_content["title"],
                merged_content["start_pos"],
                merged_content["end_pos"],
                merged_content["importance_score"],
                merged_content["content_type"],
            )
            segments.append(segment)

        return segments

    def _segment_by_enhanced_semantic_chunks(
        self, content: str
    ) -> List[DocumentSegment]:
        """Enhanced semantic chunk segmentation"""
        segments = []

        # Use improved semantic boundary detection
        semantic_boundaries = self._detect_semantic_boundaries(content)

        current_start = 0
        for i, boundary in enumerate(semantic_boundaries):
            chunk_content = content[current_start : boundary["position"]]

            if len(chunk_content.strip()) > 200:  # Minimum content threshold
                segment = self._create_enhanced_segment(
                    chunk_content,
                    boundary["suggested_title"],
                    current_start,
                    boundary["position"],
                    boundary["importance_score"],
                    boundary["content_type"],
                )
                segments.append(segment)

            current_start = boundary["position"]

        # Handle the final segment
        if current_start < len(content):
            final_content = content[current_start:]
            if len(final_content.strip()) > 200:
                segment = self._create_enhanced_segment(
                    final_content,
                    "Final Section",
                    current_start,
                    len(content),
                    0.7,
                    "general",
                )
                segments.append(segment)

        return segments

    def _segment_content_aware(self, content: str) -> List[DocumentSegment]:
        """Content-aware intelligent segmentation"""
        segments = []

        # Adaptive segmentation size
        optimal_chunk_size = self._calculate_optimal_chunk_size(content)

        # Segment based on content density
        content_chunks = self._create_content_aware_chunks(content, optimal_chunk_size)

        for chunk in content_chunks:
            segment = self._create_enhanced_segment(
                chunk["content"],
                chunk["title"],
                chunk["start_pos"],
                chunk["end_pos"],
                chunk["importance_score"],
                chunk["content_type"],
            )
            segments.append(segment)

        return segments

    def _segment_academic_paper(self, content: str) -> List[DocumentSegment]:
        """Segment academic paper using semantic understanding"""
        # First try header-based segmentation
        headers = re.findall(r"^(#{1,6})\s+(.+)$", content, re.MULTILINE)
        if len(headers) >= 2:
            return self._segment_by_headers(content)

        # Fallback to semantic detection of academic sections
        sections = self._detect_academic_sections(content)
        segments = []

        for section in sections:
            # Determine importance based on section type
            section_type = section.get("type", "general")
            content_type = (
                section_type
                if section_type
                in ["algorithm", "formula", "introduction", "conclusion"]
                else "general"
            )
            importance_score = {
                "algorithm": 0.95,
                "formula": 0.9,
                "introduction": 0.85,
                "conclusion": 0.8,
            }.get(content_type, 0.7)

            segment = self._create_enhanced_segment(
                section["content"],
                section["title"],
                section["start_pos"],
                section["end_pos"],
                importance_score,
                content_type,
            )
            segments.append(segment)

        return segments

    def _detect_academic_sections(self, content: str) -> List[Dict]:
        """Detect academic paper sections even without clear headers"""
        sections = []

        # Common academic section patterns
        section_patterns = [
            (r"(?i)(abstract|摘要)", "introduction"),
            (r"(?i)(introduction|引言|简介)", "introduction"),
            (r"(?i)(related work|相关工作|背景)", "background"),
            (r"(?i)(method|methodology|approach|方法)", "methodology"),
            (r"(?i)(algorithm|算法)", "algorithm"),
            (r"(?i)(experiment|实验|evaluation|评估)", "experiment"),
            (r"(?i)(result|结果|finding)", "results"),
            (r"(?i)(conclusion|结论|总结)", "conclusion"),
            (r"(?i)(reference|参考文献|bibliography)", "references"),
        ]

        current_pos = 0
        for i, (pattern, section_type) in enumerate(section_patterns):
            match = re.search(pattern, content[current_pos:], re.IGNORECASE)
            if match:
                start_pos = current_pos + match.start()

                # Find end position (next section or end of document)
                next_pos = len(content)
                for next_pattern, _ in section_patterns[i + 1 :]:
                    next_match = re.search(
                        next_pattern, content[start_pos + 100 :], re.IGNORECASE
                    )
                    if next_match:
                        next_pos = start_pos + 100 + next_match.start()
                        break

                section_content = content[start_pos:next_pos].strip()
                if len(section_content) > 50:  # Minimum content length
                    # Calculate importance score and content type
                    importance_score = self._calculate_paragraph_importance(
                        section_content, section_type
                    )
                    content_type = self._classify_content_type(
                        match.group(1), section_content
                    )

                    sections.append(
                        {
                            "title": match.group(1),
                            "content": section_content,
                            "start_pos": start_pos,
                            "end_pos": next_pos,
                            "type": section_type,
                            "importance_score": importance_score,
                            "content_type": content_type,
                        }
                    )

                current_pos = next_pos

        return sections

    def _segment_by_semantic_chunks(self, content: str) -> List[DocumentSegment]:
        """Segment long documents into semantic chunks"""
        # Split into paragraphs first
        paragraphs = [p.strip() for p in content.split("\n\n") if p.strip()]

        segments = []
        current_chunk = []
        current_chunk_size = 0
        chunk_size_limit = 3000  # characters
        overlap_size = 200

        char_pos = 0

        for para in paragraphs:
            para_size = len(para)

            # If adding this paragraph exceeds limit, create a segment
            if current_chunk_size + para_size > chunk_size_limit and current_chunk:
                chunk_content = "\n\n".join(current_chunk)
                # Analyze semantic chunk content type
                content_type = self._classify_paragraph_type(chunk_content)
                importance_score = self._calculate_paragraph_importance(
                    chunk_content, content_type
                )

                segment = self._create_enhanced_segment(
                    chunk_content,
                    f"Section {len(segments) + 1}",
                    char_pos - len(chunk_content.encode("utf-8")),
                    char_pos,
                    importance_score,
                    content_type,
                )
                segments.append(segment)

                # Keep last part for overlap
                overlap_content = (
                    chunk_content[-overlap_size:]
                    if len(chunk_content) > overlap_size
                    else ""
                )
                current_chunk = [overlap_content, para] if overlap_content else [para]
                current_chunk_size = len(overlap_content) + para_size
            else:
                current_chunk.append(para)
                current_chunk_size += para_size

            char_pos += para_size + 2  # +2 for \n\n

        # Add final chunk
        if current_chunk:
            chunk_content = "\n\n".join(current_chunk)
            # Analyze final chunk content type
            content_type = self._classify_paragraph_type(chunk_content)
            importance_score = self._calculate_paragraph_importance(
                chunk_content, content_type
            )

            segment = self._create_enhanced_segment(
                chunk_content,
                f"Section {len(segments) + 1}",
                char_pos - len(chunk_content.encode("utf-8")),
                char_pos,
                importance_score,
                content_type,
            )
            segments.append(segment)

        return segments

    def _segment_by_paragraphs(self, content: str) -> List[DocumentSegment]:
        """Simple paragraph-based segmentation for short documents"""
        paragraphs = [p.strip() for p in content.split("\n\n") if p.strip()]
        segments = []
        char_pos = 0

        for i, para in enumerate(paragraphs):
            if len(para) > 100:  # Only include substantial paragraphs
                # Analyze paragraph type and importance
                content_type = self._classify_paragraph_type(para)
                importance_score = self._calculate_paragraph_importance(
                    para, content_type
                )

                segment = self._create_enhanced_segment(
                    para,
                    f"Paragraph {i + 1}",
                    char_pos,
                    char_pos + len(para.encode("utf-8")),
                    importance_score,
                    content_type,
                )
                segments.append(segment)
            char_pos += len(para.encode("utf-8")) + 2

        return segments

    # =============== Enhanced intelligent segmentation helper methods ===============

    def _identify_algorithm_blocks(self, content: str) -> List[Dict]:
        """Identify algorithm blocks and related descriptions"""
        algorithm_blocks = []

        # Algorithm block identification patterns
        algorithm_patterns = [
            r"(?i)(algorithm\s+\d+|procedure\s+\d+|method\s+\d+).*?(?=algorithm\s+\d+|procedure\s+\d+|method\s+\d+|$)",
            r"(?i)(input:|output:|returns?:|require:|ensure:).*?(?=\n\s*\n|\n\s*(?:input:|output:|returns?:|require:|ensure:)|$)",
            r"(?i)(for\s+each|while|if.*then|repeat.*until).*?(?=\n\s*\n|$)",
            r"(?i)(step\s+\d+|phase\s+\d+).*?(?=step\s+\d+|phase\s+\d+|\n\s*\n|$)",
        ]

        for pattern in algorithm_patterns:
            matches = re.finditer(pattern, content, re.DOTALL)
            for match in matches:
                # Expand context to include complete descriptions
                start = max(0, match.start() - 300)
                end = min(len(content), match.end() + 500)

                # Find natural boundaries
                while start > 0 and content[start] not in "\n.!?":
                    start -= 1
                while end < len(content) and content[end] not in "\n.!?":
                    end += 1

                algorithm_blocks.append(
                    {
                        "start_pos": start,
                        "end_pos": end,
                        "content": content[start:end].strip(),
                        "title": self._extract_algorithm_title(
                            content[match.start() : match.end()]
                        ),
                        "importance_score": 0.95,  # High importance for algorithm blocks
                        "content_type": "algorithm",
                    }
                )

        return algorithm_blocks

    def _identify_concept_groups(self, content: str) -> List[Dict]:
        """Identify concept definition groups"""
        concept_groups = []

        # Concept definition patterns
        concept_patterns = [
            r"(?i)(definition|define|let|denote|given).*?(?=\n\s*\n|definition|define|let|denote|$)",
            r"(?i)(theorem|lemma|proposition|corollary).*?(?=\n\s*\n|theorem|lemma|proposition|corollary|$)",
            r"(?i)(notation|symbol|parameter).*?(?=\n\s*\n|notation|symbol|parameter|$)",
        ]

        for pattern in concept_patterns:
            matches = re.finditer(pattern, content, re.DOTALL)
            for match in matches:
                # Expand context
                start = max(0, match.start() - 200)
                end = min(len(content), match.end() + 300)

                concept_groups.append(
                    {
                        "start_pos": start,
                        "end_pos": end,
                        "content": content[start:end].strip(),
                        "title": self._extract_concept_title(
                            content[match.start() : match.end()]
                        ),
                        "importance_score": 0.85,
                        "content_type": "concept",
                    }
                )

        return concept_groups

    def _identify_formula_chains(self, content: str) -> List[Dict]:
        """Identify formula derivation chains"""
        formula_chains = []

        # Formula patterns
        formula_patterns = [
            r"\$\$.*?\$\$",  # Block-level mathematical formulas
            r"\$[^$]+\$",  # Inline mathematical formulas
            r"(?i)(equation|formula).*?(?=\n\s*\n|equation|formula|$)",
            r"(?i)(where|such that|given that).*?(?=\n\s*\n|where|such that|given that|$)",
        ]

        # Find dense formula regions
        formula_positions = []
        for pattern in formula_patterns:
            matches = re.finditer(pattern, content, re.DOTALL)
            for match in matches:
                formula_positions.append((match.start(), match.end()))

        # Merge nearby formulas into formula chains
        formula_positions.sort()
        if formula_positions:
            current_chain_start = formula_positions[0][0]
            current_chain_end = formula_positions[0][1]

            for start, end in formula_positions[1:]:
                if (
                    start - current_chain_end < 500
                ):  # Merge formulas within 500 characters
                    current_chain_end = end
                else:
                    # Save current chain
                    formula_chains.append(
                        {
                            "start_pos": max(0, current_chain_start - 200),
                            "end_pos": min(len(content), current_chain_end + 200),
                            "content": content[
                                max(0, current_chain_start - 200) : min(
                                    len(content), current_chain_end + 200
                                )
                            ].strip(),
                            "title": "Mathematical Formulation",
                            "importance_score": 0.9,
                            "content_type": "formula",
                        }
                    )
                    current_chain_start = start
                    current_chain_end = end

            # Add the last chain
            formula_chains.append(
                {
                    "start_pos": max(0, current_chain_start - 200),
                    "end_pos": min(len(content), current_chain_end + 200),
                    "content": content[
                        max(0, current_chain_start - 200) : min(
                            len(content), current_chain_end + 200
                        )
                    ].strip(),
                    "title": "Mathematical Formulation",
                    "importance_score": 0.9,
                    "content_type": "formula",
                }
            )

        return formula_chains

    def _merge_related_content_blocks(
        self,
        algorithm_blocks: List[Dict],
        concept_groups: List[Dict],
        formula_chains: List[Dict],
        content: str,
    ) -> List[Dict]:
        """Merge related content blocks to ensure integrity"""
        all_blocks = algorithm_blocks + concept_groups + formula_chains
        all_blocks.sort(key=lambda x: x["start_pos"])

        merged_blocks = []
        i = 0

        while i < len(all_blocks):
            current_block = all_blocks[i]

            # Check if can merge with the next block
            while i + 1 < len(all_blocks):
                next_block = all_blocks[i + 1]

                # If blocks are close or content related, merge them
                if next_block["start_pos"] - current_block[
                    "end_pos"
                ] < 300 or self._are_blocks_related(current_block, next_block):
                    # Merge blocks
                    merged_content = content[
                        current_block["start_pos"] : next_block["end_pos"]
                    ]
                    current_block = {
                        "start_pos": current_block["start_pos"],
                        "end_pos": next_block["end_pos"],
                        "content": merged_content.strip(),
                        "title": f"{current_block['title']} & {next_block['title']}",
                        "importance_score": max(
                            current_block["importance_score"],
                            next_block["importance_score"],
                        ),
                        "content_type": "merged",
                    }
                    i += 1
                else:
                    break

            merged_blocks.append(current_block)
            i += 1

        return merged_blocks

    def _are_blocks_related(self, block1: Dict, block2: Dict) -> bool:
        """Determine if two content blocks are related"""
        # Check content type associations
        related_types = [
            ("algorithm", "formula"),
            ("concept", "algorithm"),
            ("formula", "concept"),
        ]

        for type1, type2 in related_types:
            if (
                block1["content_type"] == type1 and block2["content_type"] == type2
            ) or (block1["content_type"] == type2 and block2["content_type"] == type1):
                return True

        return False

    def _extract_algorithm_title(self, text: str) -> str:
        """Extract title from algorithm text"""
        lines = text.split("\n")[:3]  # First 3 lines
        for line in lines:
            line = line.strip()
            if line and len(line) < 100:  # Reasonable title length
                # Clean title
                title = re.sub(r"[^\w\s-]", "", line)
                if title:
                    return title[:50]  # Limit title length
        return "Algorithm Block"

    def _extract_concept_title(self, text: str) -> str:
        """Extract title from concept text"""
        lines = text.split("\n")[:2]
        for line in lines:
            line = line.strip()
            if line and len(line) < 80:
                title = re.sub(r"[^\w\s-]", "", line)
                if title:
                    return title[:50]
        return "Concept Definition"

    def _create_enhanced_segment(
        self,
        content: str,
        title: str,
        start_pos: int,
        end_pos: int,
        importance_score: float,
        content_type: str,
    ) -> DocumentSegment:
        """Build a DocumentSegment from pre-classified content.

        The segment id is the first 8 hex digits of an MD5 over the title,
        both positions and the importance score (an identifier, not a
        security measure). Keywords and relevance scores are derived from the
        content using the supplied content type. The title is also used as
        the segment's section path.
        """
        # Identifier derived from the segment's metadata
        id_seed = f"{title}_{start_pos}_{end_pos}_{importance_score}"
        digest = hashlib.md5(id_seed.encode()).hexdigest()

        return DocumentSegment(
            id=digest[:8],
            title=title,
            content=content,
            content_type=content_type,
            keywords=self._extract_enhanced_keywords(content, content_type),
            char_start=start_pos,
            char_end=end_pos,
            char_count=len(content),
            relevance_scores=self._calculate_enhanced_relevance_scores(
                content, content_type, importance_score
            ),
            section_path=title,
        )

    def _extract_enhanced_keywords(self, content: str, content_type: str) -> List[str]:
        """Extract enhanced keywords based on content type"""
        words = re.findall(r"\b[a-zA-Z]{3,}\b", content.lower())

        # Adjust stopwords based on content type
        if content_type == "algorithm":
            algorithm_stopwords = {
                "step",
                "then",
                "else",
                "end",
                "begin",
                "start",
                "stop",
            }
            words = [w for w in words if w not in algorithm_stopwords]
        elif content_type == "formula":
            formula_keywords = ["equation", "formula", "where", "given", "such", "that"]
            words.extend(formula_keywords)

        # General stopwords
        general_stopwords = {
            "the",
            "and",
            "for",
            "are",
            "but",
            "not",
            "you",
            "all",
            "can",
            "her",
            "was",
            "one",
            "our",
            "had",
            "but",
            "have",
            "this",
            "that",
            "with",
            "from",
            "they",
            "she",
            "been",
            "were",
            "said",
            "each",
            "which",
            "their",
        }

        keywords = [w for w in set(words) if w not in general_stopwords and len(w) > 3]
        return keywords[:25]  # Increase keyword count

    def _calculate_enhanced_relevance_scores(
        self, content: str, content_type: str, importance_score: float
    ) -> Dict[str, float]:
        """Calculate enhanced relevance scores"""
        content_lower = content.lower()

        base_scores = {
            "concept_analysis": 0.5,
            "algorithm_extraction": 0.5,
            "code_planning": 0.5,
        }

        # Adjust base scores based on content type and importance
        if content_type == "algorithm":
            base_scores["algorithm_extraction"] = importance_score
            base_scores["code_planning"] = importance_score * 0.9
            base_scores["concept_analysis"] = importance_score * 0.7
        elif content_type == "concept":
            base_scores["concept_analysis"] = importance_score
            base_scores["algorithm_extraction"] = importance_score * 0.8
            base_scores["code_planning"] = importance_score * 0.6
        elif content_type == "formula":
            base_scores["algorithm_extraction"] = importance_score
            base_scores["concept_analysis"] = importance_score * 0.8
            base_scores["code_planning"] = importance_score * 0.9
        elif content_type == "merged":
            # Merged content is usually important
            base_scores = {k: importance_score * 0.95 for k in base_scores}

        # Additional bonus based on content density
        algorithm_indicators = ["algorithm", "method", "procedure", "step", "process"]
        concept_indicators = ["definition", "concept", "framework", "approach"]
        implementation_indicators = ["implementation", "code", "function", "design"]

        for query_type, indicators in [
            ("algorithm_extraction", algorithm_indicators),
            ("concept_analysis", concept_indicators),
            ("code_planning", implementation_indicators),
        ]:
            density_bonus = (
                sum(1 for indicator in indicators if indicator in content_lower) * 0.1
            )
            base_scores[query_type] = min(1.0, base_scores[query_type] + density_bonus)

        return base_scores

    # Placeholder methods - can be further implemented later
    def _identify_research_paper_sections(self, content: str) -> List[Dict]:
        """Identify research paper sections - simplified implementation

        Currently a thin alias: the work is delegated unchanged to
        ``self._detect_academic_sections`` and its result is returned as-is.
        """
        # Temporarily use improved semantic detection
        return self._detect_academic_sections(content)

    def _enhance_section_with_context(self, section: Dict, content: str) -> Dict:
        """Add context to sections - simplified implementation

        Placeholder: returns ``section`` unchanged (the same object);
        ``content`` is currently unused.
        """
        return section

    def _identify_concept_implementation_pairs(self, content: str) -> List[Dict]:
        """Identify concept-implementation pairs - simplified implementation

        Placeholder: always returns an empty list; ``content`` is currently
        unused.
        """
        return []

    def _merge_concept_with_implementation(self, pair: Dict, content: str) -> Dict:
        """Merge concepts with implementation - simplified implementation

        Placeholder: returns ``pair`` unchanged (the same object);
        ``content`` is currently unused.
        """
        return pair

    def _detect_semantic_boundaries(self, content: str) -> List[Dict]:
        """Detect semantic boundaries - based on paragraphs and logical separators"""
        boundaries = []

        # Split paragraphs by double line breaks
        paragraphs = content.split("\n\n")
        current_pos = 0

        for i, para in enumerate(paragraphs):
            if len(para.strip()) > 100:  # Valid paragraph
                # Analyze paragraph type
                content_type = self._classify_paragraph_type(para)
                importance_score = self._calculate_paragraph_importance(
                    para, content_type
                )

                boundaries.append(
                    {
                        "position": current_pos + len(para),
                        "suggested_title": self._extract_paragraph_title(para, i + 1),
                        "importance_score": importance_score,
                        "content_type": content_type,
                    }
                )

            current_pos += len(para) + 2  # +2 for \n\n

        return boundaries

    def _classify_paragraph_type(self, paragraph: str) -> str:
        """Classify paragraph type"""
        para_lower = paragraph.lower()

        if "algorithm" in para_lower or "procedure" in para_lower:
            return "algorithm"
        elif "formula" in para_lower or "$$" in paragraph:
            return "formula"
        elif any(
            word in para_lower for word in ["introduction", "overview", "abstract"]
        ):
            return "introduction"
        elif any(word in para_lower for word in ["conclusion", "summary", "result"]):
            return "conclusion"
        else:
            return "general"

    def _calculate_paragraph_importance(
        self, paragraph: str, content_type: str
    ) -> float:
        """Calculate paragraph importance"""
        if content_type == "algorithm":
            return 0.95
        elif content_type == "formula":
            return 0.9
        elif content_type == "introduction":
            return 0.85
        elif content_type == "conclusion":
            return 0.8
        else:
            return 0.7

    def _extract_paragraph_title(self, paragraph: str, index: int) -> str:
        """Extract paragraph title"""
        lines = paragraph.split("\n")
        for line in lines[:2]:
            if line.startswith("#"):
                return line.strip("# ")
            elif len(line) < 80 and line.strip():
                return line.strip()
        return f"Section {index}"

    def _calculate_optimal_chunk_size(self, content: str) -> int:
        """Calculate optimal chunk size"""
        # Dynamically adjust based on content complexity
        complexity = self.analyzer._calculate_concept_complexity(content)
        if complexity > 0.7:
            return 4000  # Complex content needs larger chunks
        elif complexity > 0.4:
            return 3000
        else:
            return 2000

    def _create_content_aware_chunks(self, content: str, chunk_size: int) -> List[Dict]:
        """Create content-aware chunks - simplified implementation"""
        chunks = []
        paragraphs = [p.strip() for p in content.split("\n\n") if p.strip()]

        current_chunk = []
        current_size = 0
        start_pos = 0

        for para in paragraphs:
            para_size = len(para)

            if current_size + para_size > chunk_size and current_chunk:
                chunk_content = "\n\n".join(current_chunk)
                chunks.append(
                    {
                        "content": chunk_content,
                        "title": f"Section {len(chunks) + 1}",
                        "start_pos": start_pos,
                        "end_pos": start_pos + len(chunk_content),
                        "importance_score": 0.7,
                        "content_type": "general",
                    }
                )

                current_chunk = [para]
                current_size = para_size
                start_pos += len(chunk_content) + 2
            else:
                current_chunk.append(para)
                current_size += para_size

        # Add the last chunk
        if current_chunk:
            chunk_content = "\n\n".join(current_chunk)
            chunks.append(
                {
                    "content": chunk_content,
                    "title": f"Section {len(chunks) + 1}",
                    "start_pos": start_pos,
                    "end_pos": start_pos + len(chunk_content),
                    "importance_score": 0.7,
                    "content_type": "general",
                }
            )

        return chunks

    def _create_segment(
        self, content: str, title: str, start_pos: int, end_pos: int
    ) -> DocumentSegment:
        """Build a DocumentSegment, deriving its metadata from title and content.

        The id is the first 8 hex digits of an MD5 over the title and both
        positions (an identifier, not a security measure). Keywords, content
        type and relevance scores are computed by the corresponding helpers.
        """
        # Identifier derived from title and position
        id_seed = f"{title}_{start_pos}_{end_pos}"
        short_hash = hashlib.md5(id_seed.encode()).hexdigest()[:8]

        extracted_keywords = self._extract_keywords(content)
        detected_type = self._classify_content_type(title, content)
        # Relevance per query type depends on the detected content type
        scores = self._calculate_relevance_scores(content, detected_type)

        return DocumentSegment(
            id=short_hash,
            title=title,
            content=content,
            content_type=detected_type,
            keywords=extracted_keywords,
            char_start=start_pos,
            char_end=end_pos,
            char_count=len(content),
            relevance_scores=scores,
            section_path=title,  # Simplified for now
        )

    def _extract_keywords(self, content: str) -> List[str]:
        """Extract relevant keywords from content"""
        # Simple keyword extraction - could be enhanced with NLP
        words = re.findall(r"\b[a-zA-Z]{3,}\b", content.lower())

        # Remove common words
        stopwords = {
            "the",
            "and",
            "for",
            "are",
            "but",
            "not",
            "you",
            "all",
            "can",
            "her",
            "was",
            "one",
            "our",
            "had",
            "but",
            "have",
            "this",
            "that",
            "with",
            "from",
            "they",
            "she",
            "been",
            "were",
            "said",
            "each",
            "which",
            "their",
        }

        keywords = [w for w in set(words) if w not in stopwords and len(w) > 3]
        return keywords[:20]  # Top 20 keywords

    def _classify_content_type(self, title: str, content: str) -> str:
        """Classify the type of content based on title and content"""
        title_lower = title.lower()
        content_lower = content.lower()

        if any(
            word in title_lower for word in ["introduction", "abstract", "overview"]
        ):
            return "introduction"
        elif any(word in title_lower for word in ["method", "approach", "algorithm"]):
            return "methodology"
        elif any(
            word in title_lower for word in ["experiment", "evaluation", "result"]
        ):
            return "experiment"
        elif any(
            word in title_lower for word in ["conclusion", "discussion", "summary"]
        ):
            return "conclusion"
        elif any(word in title_lower for word in ["reference", "bibliography"]):
            return "references"
        elif "algorithm" in content_lower or "procedure" in content_lower:
            return "algorithm"
        else:
            return "general"

    def _calculate_relevance_scores(
        self, content: str, content_type: str
    ) -> Dict[str, float]:
        """Calculate relevance scores for different query types"""
        content_lower = content.lower()

        scores = {
            "concept_analysis": 0.5,
            "algorithm_extraction": 0.5,
            "code_planning": 0.5,
        }

        # Concept analysis relevance
        concept_indicators = [
            "introduction",
            "overview",
            "architecture",
            "system",
            "framework",
            "concept",
            "approach",
        ]
        concept_score = sum(
            1 for indicator in concept_indicators if indicator in content_lower
        ) / len(concept_indicators)
        scores["concept_analysis"] = min(
            1.0, concept_score + (0.8 if content_type == "introduction" else 0)
        )

        # Algorithm extraction relevance
        algorithm_indicators = [
            "algorithm",
            "method",
            "procedure",
            "formula",
            "equation",
            "step",
            "process",
        ]
        algorithm_score = sum(
            1 for indicator in algorithm_indicators if indicator in content_lower
        ) / len(algorithm_indicators)
        scores["algorithm_extraction"] = min(
            1.0, algorithm_score + (0.9 if content_type == "methodology" else 0)
        )

        # Code planning relevance
        code_indicators = [
            "implementation",
            "code",
            "function",
            "class",
            "module",
            "structure",
            "design",
        ]
        code_score = sum(
            1 for indicator in code_indicators if indicator in content_lower
        ) / len(code_indicators)
        scores["code_planning"] = min(
            1.0,
            code_score + (0.7 if content_type in ["methodology", "algorithm"] else 0),
        )

        return scores


# Global variables
# In-memory cache of document indexes; the tools below key it by the
# `paper_dir` string they are called with.
DOCUMENT_INDEXES: Dict[str, DocumentIndex] = {}
# Module-wide segmenter instance, created once at import time and used by
# analyze_and_segment_document to split documents.
segmenter = DocumentSegmenter()


def get_segments_dir(paper_dir: str) -> str:
    """Get the segments directory path

    Returns ``<paper_dir>/document_segments``. The path is only computed;
    nothing is created on disk.
    """
    return os.path.join(paper_dir, "document_segments")


def ensure_segments_dir_exists(segments_dir: str) -> None:
    """Ensure segments directory exists

    Creates ``segments_dir`` (and any missing parents); does nothing if the
    directory is already there.
    """
    os.makedirs(segments_dir, exist_ok=True)


@mcp.tool()
async def analyze_and_segment_document(
    paper_dir: str, force_refresh: bool = False
) -> str:
    """
    Analyze document structure and create intelligent segments

    Args:
        paper_dir: Path to the paper directory
        force_refresh: Whether to force re-analysis even if segments exist

    Returns:
        JSON string with segmentation results
    """
    # NOTE: the docstring above is left untouched on purpose; the mcp.tool()
    # decorator may expose it as the tool description (confirm before editing).
    try:
        # Find markdown file in paper directory
        md_files = [f for f in os.listdir(paper_dir) if f.endswith(".md")]
        if not md_files:
            return json.dumps(
                {
                    "status": "error",
                    "message": f"No markdown file found in {paper_dir}",
                },
                ensure_ascii=False,
                indent=2,
            )

        md_file_path = os.path.join(paper_dir, md_files[0])
        segments_dir = get_segments_dir(paper_dir)
        index_file_path = os.path.join(segments_dir, "document_index.json")

        # Reuse a previously saved index unless a refresh was requested
        if not force_refresh and os.path.exists(index_file_path):
            try:
                with open(index_file_path, "r", encoding="utf-8") as f:
                    existing_index = json.load(f)

                # Compatibility handling: indexes written by older versions
                # may lack some segment fields, so fill in defaults.
                if "segments" in existing_index:
                    segments_data = []
                    for seg_data in existing_index["segments"]:
                        segment_dict = dict(seg_data)
                        segment_dict.setdefault("content_type", "general")
                        segment_dict.setdefault("keywords", [])
                        segment_dict.setdefault(
                            "relevance_scores",
                            {
                                "concept_analysis": 0.5,
                                "algorithm_extraction": 0.5,
                                "code_planning": 0.5,
                            },
                        )
                        segment_dict.setdefault(
                            "section_path", segment_dict.get("title", "Unknown")
                        )
                        segments_data.append(DocumentSegment(**segment_dict))

                    existing_index["segments"] = segments_data

                DOCUMENT_INDEXES[paper_dir] = DocumentIndex(**existing_index)
                return json.dumps(
                    {
                        "status": "success",
                        "message": "Using existing document analysis",
                        "segments_dir": segments_dir,
                        "total_segments": existing_index["total_segments"],
                    },
                    ensure_ascii=False,
                    indent=2,
                )

            except Exception as e:
                # Any failure while loading the cached index (bad JSON,
                # unexpected fields, missing keys) falls back to re-analysis.
                logger.error(f"Failed to load existing index: {e}")
                logger.info("Will perform fresh analysis instead")
                # Remove corrupted index file and continue with new analysis
                try:
                    os.remove(index_file_path)
                except OSError as remove_error:
                    # Best effort: the file is rewritten below anyway, but
                    # record the failure instead of hiding it.
                    logger.warning(
                        f"Could not remove corrupted index file {index_file_path}: {remove_error}"
                    )

        # Read document content
        with open(md_file_path, "r", encoding="utf-8") as f:
            content = f.read()

        # Analyze document
        analyzer = DocumentAnalyzer()
        # confidence is returned by the analyzer but not used here
        doc_type, confidence = analyzer.analyze_document_type(content)
        strategy = analyzer.detect_segmentation_strategy(content, doc_type)

        # Create segments
        segments = segmenter.segment_document(content, strategy)

        # Create document index
        document_index = DocumentIndex(
            document_path=md_file_path,
            document_type=doc_type,
            segmentation_strategy=strategy,
            total_segments=len(segments),
            total_chars=len(content),
            segments=segments,
            created_at=datetime.now().isoformat(),
        )

        # Save segments
        ensure_segments_dir_exists(segments_dir)

        # Save document index
        with open(index_file_path, "w", encoding="utf-8") as f:
            json.dump(
                asdict(document_index), f, ensure_ascii=False, indent=2, default=str
            )

        # Save individual segment files for fallback
        for segment in segments:
            segment_file_path = os.path.join(segments_dir, f"segment_{segment.id}.md")
            with open(segment_file_path, "w", encoding="utf-8") as f:
                f.write(f"# {segment.title}\n\n")
                f.write(f"**Content Type:** {segment.content_type}\n")
                f.write(f"**Keywords:** {', '.join(segment.keywords[:10])}\n\n")
                f.write(segment.content)

        # Store in memory
        DOCUMENT_INDEXES[paper_dir] = document_index

        logger.info(
            f"Document segmentation completed: {len(segments)} segments created"
        )

        return json.dumps(
            {
                "status": "success",
                "message": f"Document analysis completed with {strategy} strategy",
                "document_type": doc_type,
                "segmentation_strategy": strategy,
                "segments_dir": segments_dir,
                "total_segments": len(segments),
                "total_chars": len(content),
            },
            ensure_ascii=False,
            indent=2,
        )

    except Exception as e:
        # Tool boundary: report every failure as a JSON error payload
        logger.error(f"Error in analyze_and_segment_document: {e}")
        return json.dumps(
            {"status": "error", "message": f"Failed to analyze document: {str(e)}"},
            ensure_ascii=False,
            indent=2,
        )


@mcp.tool()
async def read_document_segments(
    paper_dir: str,
    query_type: str,
    keywords: List[str] = None,
    max_segments: int = 3,
    max_total_chars: int = None,
) -> str:
    """
    Intelligently retrieve relevant document segments based on query type

    The document index is looked up in the in-memory DOCUMENT_INDEXES cache.
    On a cache miss it is restored from ``document_index.json`` in the
    segments directory, or, when that file does not exist, built by calling
    ``analyze_and_segment_document``.

    Args:
        paper_dir: Path to the paper directory
        query_type: Type of query - "concept_analysis", "algorithm_extraction", or "code_planning"
        keywords: Optional list of keywords to search for
        max_segments: Maximum number of segments to return
        max_total_chars: Maximum total characters to return; when None the
            limit is computed by ``_calculate_adaptive_char_limit``

    Returns:
        JSON string with selected segments (``status`` is "success"), or a
        JSON object with ``status`` "error" and a ``message`` if anything fails
    """
    try:
        # Ensure document is analyzed
        if paper_dir not in DOCUMENT_INDEXES:
            segments_dir = get_segments_dir(paper_dir)
            index_file_path = os.path.join(segments_dir, "document_index.json")

            if os.path.exists(index_file_path):
                with open(index_file_path, "r", encoding="utf-8") as f:
                    index_data = json.load(f)

                # Convert dicts back to DocumentSegment objects, filling in
                # fields that may be missing from the stored index
                segments_data = []
                for seg_data in index_data.get("segments", []):
                    segment_dict = dict(seg_data)
                    segment_dict.setdefault("content_type", "general")
                    segment_dict.setdefault("keywords", [])
                    segment_dict.setdefault(
                        "relevance_scores",
                        {
                            "concept_analysis": 0.5,
                            "algorithm_extraction": 0.5,
                            "code_planning": 0.5,
                        },
                    )
                    segment_dict.setdefault(
                        "section_path", segment_dict.get("title", "Unknown")
                    )
                    segments_data.append(DocumentSegment(**segment_dict))

                index_data["segments"] = segments_data
                DOCUMENT_INDEXES[paper_dir] = DocumentIndex(**index_data)
            else:
                # Auto-analyze if not found
                await analyze_and_segment_document(paper_dir)

        # The analysis reports failures through its return value instead of
        # raising, so a missing index must be detected here; otherwise the
        # lookup below fails with an uninformative KeyError.
        if paper_dir not in DOCUMENT_INDEXES:
            raise RuntimeError(
                f"no document index is available for '{paper_dir}' "
                "(automatic analysis did not produce one)"
            )

        document_index = DOCUMENT_INDEXES[paper_dir]

        # Dynamically calculate character limit
        if max_total_chars is None:
            max_total_chars = _calculate_adaptive_char_limit(document_index, query_type)

        # Score every segment: stored relevance for this query type, plus an
        # optional keyword bonus, plus a completeness bonus
        scored_segments = []
        for segment in document_index.segments:
            relevance_score = segment.relevance_scores.get(query_type, 0.5)

            if keywords:
                relevance_score += _calculate_enhanced_keyword_score(
                    segment, keywords
                )

            relevance_score += _calculate_completeness_bonus(segment, document_index)

            scored_segments.append((segment, relevance_score))

        # Highest score first
        scored_segments.sort(key=lambda x: x[1], reverse=True)

        # Pick segments within the segment-count and character limits
        selected_segments = _select_segments_with_integrity(
            scored_segments, max_segments, max_total_chars, query_type
        )

        total_chars = sum(seg["char_count"] for seg in selected_segments)

        logger.info(
            f"Selected {len(selected_segments)} segments for {query_type} query"
        )

        return json.dumps(
            {
                "status": "success",
                "query_type": query_type,
                "keywords": keywords or [],
                "total_segments_available": len(document_index.segments),
                "segments_selected": len(selected_segments),
                "total_chars": total_chars,
                "max_chars_used": max_total_chars,
                "segments": selected_segments,
            },
            ensure_ascii=False,
            indent=2,
        )

    except Exception as e:
        logger.error(f"Error in read_document_segments: {e}")
        return json.dumps(
            {
                "status": "error",
                "message": f"Failed to read document segments: {str(e)}",
            },
            ensure_ascii=False,
            indent=2,
        )


@mcp.tool()
async def get_document_overview(paper_dir: str) -> str:
    """
    Get overview of document structure and available segments

    If no index for ``paper_dir`` is cached in DOCUMENT_INDEXES, the document
    is analyzed first via ``analyze_and_segment_document``.

    Args:
        paper_dir: Path to the paper directory

    Returns:
        JSON string with document overview (``status`` is "success"), or a
        JSON object with ``status`` "error" and a ``message`` if anything fails
    """
    try:
        # Ensure document is analyzed
        if paper_dir not in DOCUMENT_INDEXES:
            await analyze_and_segment_document(paper_dir)

        # The analysis reports failures through its return value instead of
        # raising, so a missing index must be detected here; otherwise the
        # lookup below fails with an uninformative KeyError.
        if paper_dir not in DOCUMENT_INDEXES:
            raise RuntimeError(
                f"no document index is available for '{paper_dir}' "
                "(automatic analysis did not produce one)"
            )

        document_index = DOCUMENT_INDEXES[paper_dir]

        # One compact summary per segment (content itself is left out)
        segment_summaries = [
            {
                "id": segment.id,
                "title": segment.title,
                "content_type": segment.content_type,
                "char_count": segment.char_count,
                "keywords": segment.keywords[:5],  # Top 5 keywords
                "relevance_scores": segment.relevance_scores,
            }
            for segment in document_index.segments
        ]

        return json.dumps(
            {
                "status": "success",
                "document_path": document_index.document_path,
                "document_type": document_index.document_type,
                "segmentation_strategy": document_index.segmentation_strategy,
                "total_segments": document_index.total_segments,
                "total_chars": document_index.total_chars,
                "created_at": document_index.created_at,
                "segments_overview": segment_summaries,
            },
            ensure_ascii=False,
            indent=2,
        )

    except Exception as e:
        logger.error(f"Error in get_document_overview: {e}")
        return json.dumps(
            {
                "status": "error",
                "message": f"Failed to get document overview: {str(e)}",
            },
            ensure_ascii=False,
            indent=2,
        )


# =============== Enhanced retrieval system helper methods ===============


def _calculate_adaptive_char_limit(
    document_index: DocumentIndex, query_type: str
) -> int:
    """
    Derive the character budget for a query from the document and query type.

    The base budget is chosen from the document type first; the segmentation
    strategy is only consulted when the document type has no dedicated budget.
    The base is then scaled by a per-query-type multiplier (1.0 for unknown
    query types) and truncated to an int.
    """
    doc_type = document_index.document_type
    if doc_type == "research_paper":
        char_budget = 10000
    elif doc_type == "algorithm_focused":
        char_budget = 12000
    elif document_index.segmentation_strategy == "algorithm_preserve_integrity":
        char_budget = 15000
    else:
        char_budget = 6000

    # Algorithm extraction gets the largest share because it needs more context
    scale_by_query = {
        "algorithm_extraction": 1.5,
        "concept_analysis": 1.2,
        "code_planning": 1.3,
    }
    scale = scale_by_query.get(query_type, 1.0)

    return int(char_budget * scale)


def _calculate_enhanced_keyword_score(
    segment: DocumentSegment, keywords: List[str]
) -> float:
    """
    Calculate enhanced keyword matching score

    Matching is case-insensitive substring matching. For each usable keyword:
    a title hit adds 0.3; content hits add 0.05 per occurrence (capped at
    0.2) plus 0.1 when the keyword appears in the first quarter of the
    content. The total bonus is capped at 0.6.

    Blank or non-string keywords are ignored: an empty string is a substring
    of every title and every content, so it would otherwise push every
    segment to the maximum bonus and erase the ranking signal.

    Args:
        segment: Segment providing ``content`` and ``title`` strings
        keywords: Keywords to look for

    Returns:
        Keyword bonus in the range [0.0, 0.6]
    """
    score = 0.0
    content_lower = segment.content.lower()
    title_lower = segment.title.lower()
    # "Important position" = first 25% of the content; same for every keyword
    early_content = content_lower[: len(content_lower) // 4]

    for keyword in keywords:
        if not isinstance(keyword, str) or not keyword.strip():
            continue
        keyword_lower = keyword.lower()

        # Title matching has higher weight
        if keyword_lower in title_lower:
            score += 0.3

        # Content matching
        content_matches = content_lower.count(keyword_lower)
        if content_matches > 0:
            # Term frequency, capped so repetition cannot dominate
            frequency_score = min(0.2, content_matches * 0.05)

            if keyword_lower in early_content:
                frequency_score += 0.1

            score += frequency_score

    return min(0.6, score)  # Limit maximum bonus


def _calculate_completeness_bonus(
    segment: DocumentSegment, document_index: DocumentIndex
) -> float:
    """
    Calculate content completeness bonus

    Adds 0.2 for algorithm/formula/merged content, a length bonus (0.15 above
    4000 characters, 0.1 above 2000), and 0.1 when the stored
    "algorithm_extraction" relevance exceeds 0.8. The result is capped at 0.3.

    Args:
        segment: Segment providing ``content_type``, ``char_count`` and
            ``relevance_scores``
        document_index: Index the segment belongs to (currently unused)

    Returns:
        Bonus in the range [0.0, 0.3]
    """
    bonus = 0.0

    # Completeness bonus for algorithm and formula content
    if segment.content_type in ["algorithm", "formula", "merged"]:
        bonus += 0.2

    # Long paragraphs usually contain more complete information.
    # The larger threshold must be tested first: with "> 2000" first, the
    # "> 4000" branch could never run.
    if segment.char_count > 4000:
        bonus += 0.15
    elif segment.char_count > 2000:
        bonus += 0.1

    # High importance paragraph bonus
    if segment.relevance_scores.get("algorithm_extraction", 0) > 0.8:
        bonus += 0.1

    return min(0.3, bonus)


def _select_segments_with_integrity(
    scored_segments: List[Tuple],
    max_segments: int,
    max_total_chars: int,
    query_type: str,
) -> List[Dict]:
    """
    Intelligently select segments while maintaining content integrity

    Candidates are visited in the given order (callers pass them sorted by
    descending score). A segment is taken whole when it fits in the remaining
    character budget; a segment that does not fit is skipped so that smaller,
    lower-ranked segments can still be used. If the very first candidate is
    too large, it is truncated and returned on its own so the caller never
    gets an empty result for a non-empty document.

    Because every candidate is already checked against the remaining budget
    in this single pass, no separate fill-up pass is needed: a segment
    rejected once cannot fit later, since the budget only shrinks.

    Args:
        scored_segments: ``(segment, score)`` pairs in priority order
        max_segments: Maximum number of segments to return
        max_total_chars: Character budget across all returned segments
        query_type: Query type (currently unused)

    Returns:
        List of dicts with ``id``, ``title``, ``content``, ``content_type``,
        ``relevance_score`` and ``char_count``; each segment appears at most
        once
    """
    truncation_notice = "\n\n[Content truncated for length...]"

    def as_result(segment, score, content=None):
        # ``content`` is only supplied for a truncated segment, in which case
        # the reported size is the size of what is actually returned.
        truncated = content is not None
        body = content if truncated else segment.content
        return {
            "id": segment.id,
            "title": segment.title,
            "content": body,
            "content_type": segment.content_type,
            "relevance_score": score,
            "char_count": len(body) if truncated else segment.char_count,
        }

    selected_segments = []
    total_chars = 0

    for segment, score in scored_segments:
        if len(selected_segments) >= max_segments:
            break

        if total_chars + segment.char_count <= max_total_chars:
            selected_segments.append(as_result(segment, score))
            total_chars += segment.char_count
        elif not selected_segments:
            # Top-ranked segment exceeds the whole budget: keep a prefix.
            # 200 characters are reserved for the notice; clamp at zero so a
            # tiny budget cannot turn into a negative (from-the-end) slice.
            keep_chars = max(0, max_total_chars - 200)
            selected_segments.append(
                as_result(
                    segment, score, segment.content[:keep_chars] + truncation_notice
                )
            )
            # The truncated segment consumes the budget
            break

    return selected_segments


if __name__ == "__main__":
    # Start the MCP server only when this file is executed as a script
    mcp.run()


================================================
FILE: tools/git_command.py
================================================
#!/usr/bin/env python3
"""
GitHub Repository Downloader MCP Tool using FastMCP
"""

import asyncio
import os
import re
from typing import Dict, List, Optional
from pathlib import Path

from mcp.server import FastMCP

# Create the FastMCP server instance that the tools below register with
mcp = FastMCP("github-downloader")


class GitHubURLExtractor:
    """Helpers for pulling GitHub repository URLs and target paths out of text."""

    @staticmethod
    def _strip_git_suffix(url: str) -> str:
        """
        Remove trailing slashes/dots and one literal ``.git`` suffix.

        ``str.rstrip(".git")`` must not be used for this: it strips any run of
        the characters ``.``, ``g``, ``i``, ``t`` and therefore mangles names
        such as ``digit`` or ``git``.
        """
        # Trailing dots usually come from sentence punctuation after a URL
        url = url.rstrip("/.")
        if url.endswith(".git"):
            url = url[: -len(".git")]
        return url.rstrip("/.")

    @staticmethod
    def extract_github_urls(text: str) -> List[str]:
        """
        Extract GitHub repository URLs from text.

        Recognizes HTTP(S) URLs, SSH URLs (``git@github.com:owner/repo``) and
        the standalone short form ``owner/repo``. Every hit is normalized to
        ``https://github.com/owner/repo`` style without a ``.git`` suffix.

        Args:
            text: Free text to scan

        Returns:
            Unique URLs in order of first appearance per pattern
        """
        patterns = [
            # Standard HTTP(S) URL
            r"https?://github\.com/[\w\-\.]+/[\w\-\.]+(?:\.git)?",
            # SSH URL
            r"git@github\.com:[\w\-\.]+/[\w\-\.]+(?:\.git)?",
            # Short owner/repo form - must be a whitespace-delimited token
            r"(?<!\S)(?<!/)(?<!\.)([\w\-\.]+/[\w\-\.]+)(?!/)(?!\S)",
        ]

        urls = []
        for pattern in patterns:
            for match in re.findall(pattern, text, re.IGNORECASE):
                # findall yields tuples only for multi-group patterns
                if isinstance(match, tuple):
                    match = match[0]

                if match.startswith("git@"):
                    url = match.replace("git@github.com:", "https://github.com/")
                elif match.startswith("http"):
                    url = match
                else:
                    # Short form: reject local-looking paths and anything
                    # that is not exactly two plain name components
                    if "/" not in match or any(
                        marker in match
                        for marker in ["./", "../", "deepcode_lab", "tools"]
                    ):
                        continue
                    parts = match.split("/")
                    if (
                        len(parts) != 2
                        or not all(
                            part.replace("-", "").replace("_", "").isalnum()
                            for part in parts
                        )
                        or any(part.startswith(".") for part in parts)
                    ):
                        continue
                    url = f"https://github.com/{match}"

                # Normalize the URL
                url = GitHubURLExtractor._strip_git_suffix(url)

                # Repair a duplicated github.com prefix
                if "github.com/github.com/" in url:
                    url = url.replace("github.com/github.com/", "github.com/")

                urls.append(url)

        # De-duplicate while keeping a deterministic order
        return list(dict.fromkeys(urls))

    @staticmethod
    def extract_target_path(text: str) -> Optional[str]:
        """
        Extract the destination path mentioned in the text, if any.

        Looks for a token following an indicator such as "to", "into", "in",
        "at" (optionally followed by "folder"/"directory"/"path"), or the
        Chinese equivalents. Generic words ("here", "local", ...) and tokens
        that are themselves URLs are not accepted as paths.

        Args:
            text: Free text to scan

        Returns:
            The first acceptable path, or None when none is found
        """
        patterns = [
            # \b keeps indicator words from matching inside other words
            # (e.g. the "at" in "that")
            r'\b(?:to|into|in|at)\s+(?:folder|directory|path)?\s*["\']?([^\s"\']+)["\']?',
            r'\b(?:save|download|clone)\s+(?:to|into|at)\s+["\']?([^\s"\']+)["\']?',
            # Chinese indicators
            r'(?:到|在|保存到|下载到|克隆到)\s*["\']?([^\s"\']+)["\']?',
        ]
        generic_words = [
            "here",
            "there",
            "current",
            "local",
            "这里",
            "当前",
            "本地",
        ]

        for pattern in patterns:
            for match in re.finditer(pattern, text, re.IGNORECASE):
                # Only trailing punctuation is removed; a leading "." is part
                # of relative paths such as "./repos"
                path = match.group(1).rstrip("。，,.")
                if not path or path.lower() in generic_words:
                    continue
                # "clone the repo at https://..." names the source, not a
                # destination
                if "://" in path or path.startswith("git@"):
                    continue
                return path

        return None

    @staticmethod
    def infer_repo_name(url: str) -> str:
        """
        Infer the repository name from a GitHub URL.

        Args:
            url: Repository URL, with or without a ``.git`` suffix

        Returns:
            The last path component for URLs containing "github.com",
            otherwise the fallback name "repository"
        """
        url = GitHubURLExtractor._strip_git_suffix(url)
        if "github.com" in url:
            parts = url.split("/")
            if len(parts) >= 2 and parts[-1]:
                return parts[-1]
        return "repository"


async def check_git_installed() -> bool:
    """
    Check whether Git is installed.

    Returns:
        True when ``git --version`` can be started and exits with status 0,
        False otherwise (including when the executable cannot be launched)
    """
    try:
        # The output is not needed. Discarding it (instead of opening pipes
        # that are never read) keeps wait() free of the pipe-buffer deadlock
        # the asyncio documentation warns about.
        proc = await asyncio.create_subprocess_exec(
            "git",
            "--version",
            stdout=asyncio.subprocess.DEVNULL,
            stderr=asyncio.subprocess.DEVNULL,
        )
        return (await proc.wait()) == 0
    except Exception:
        # Best-effort probe: any launch failure means "not usable"
        return False


async def clone_repository(repo_url: str, target_path: str) -> Dict[str, object]:
    """
    Run ``git clone`` for one repository.

    Args:
        repo_url: URL (or path) of the repository to clone
        target_path: Directory to clone into

    Returns:
        On completion: ``success`` (bool), ``stdout``, ``stderr`` (decoded
        text) and ``returncode``. If the process cannot be started or
        awaited: ``success`` False and ``error`` with the exception text.
    """
    try:
        proc = await asyncio.create_subprocess_exec(
            "git",
            "clone",
            # End of options: both values can come from free-form text, so a
            # value starting with "-" must not be parsed as a git option
            "--",
            repo_url,
            target_path,
            stdout=asyncio.subprocess.PIPE,
            stderr=asyncio.subprocess.PIPE,
        )

        stdout, stderr = await proc.communicate()

        return {
            "success": proc.returncode == 0,
            "stdout": stdout.decode("utf-8", errors="replace"),
            "stderr": stderr.decode("utf-8", errors="replace"),
            "returncode": proc.returncode,
        }
    except Exception as e:
        return {"success": False, "error": str(e)}


@mcp.tool()
async def download_github_repo(instruction: str) -> str:
    """
    Download GitHub repositories from natural language instructions.

    Args:
        instruction: Natural language text containing GitHub URLs and optional target paths

    Returns:
        Status message about the download operation (one entry per
        repository, separated by blank lines)

    Examples:
        - "Download https://github.com/openai/gpt-3"
        - "Clone microsoft/vscode to my-projects folder"
        - "Get https://github.com/facebook/react"
    """
    # Check that Git is available
    if not await check_git_installed():
        return "❌ Error: Git is not installed or not in system PATH"

    extractor = GitHubURLExtractor()

    # Extract GitHub URLs
    urls = extractor.extract_github_urls(instruction)
    if not urls:
        return "❌ No GitHub URLs found in the instruction"

    # Extract the target path
    target_path = extractor.extract_target_path(instruction)

    # The target is a parent directory when it is written as one (trailing
    # slash) or when several repositories share it; cloning them all into
    # the very same path would make every clone after the first fail with
    # "Target path already exists".
    target_is_parent_dir = bool(target_path) and (
        len(urls) > 1
        or os.path.basename(target_path) == ""
        or target_path.endswith("/")
    )

    # Download the repositories
    results = []
    for url in urls:
        try:
            # Work out where this repository goes
            repo_name = extractor.infer_repo_name(url)
            if not target_path:
                final_path = repo_name
            elif target_is_parent_dir:
                final_path = os.path.join(target_path, repo_name)
            else:
                final_path = target_path

            # Keep relative paths relative, in normalized form
            if not os.path.isabs(final_path):
                final_path = os.path.normpath(final_path)
                if final_path.startswith("/"):
                    final_path = final_path.lstrip("/")

            if os.path.exists(final_path):
                # Never clone over an existing path
                msg = f"❌ Failed to download {url}: Target path already exists: {final_path}"
            else:
                # Make sure the parent directory exists
                parent_dir = os.path.dirname(final_path)
                if parent_dir:
                    os.makedirs(parent_dir, exist_ok=True)

                # Run the clone
                result = await clone_repository(url, final_path)

                if result["success"]:
                    msg = f"✅ Successfully downloaded: {url}\n"
                    msg += f"   Location: {final_path}"
                    if result.get("stdout"):
                        msg += f"\n   {result['stdout'].strip()}"
                else:
                    msg = f"❌ Failed to download: {url}\n"
                    msg += f"   Error: {result.get('error', result.get('stderr', 'Unknown error'))}"

        except Exception as e:
            msg = f"❌ Failed to download: {url}\n"
            msg += f"   Error: {str(e)}"

        results.append(msg)

    return "\n\n".join(results)


@mcp.tool()
async def parse_github_urls(text: str) -> str:
    """
    Report the GitHub URLs and the target path found in a piece of text.

    Args:
        text: Text containing GitHub URLs

    Returns:
        Human-readable summary listing each URL found (or a note that none
        was found) followed by the target path, if one was specified
    """
    extractor = GitHubURLExtractor()

    found_urls = extractor.extract_github_urls(text)
    destination = extractor.extract_target_path(text)

    # Assemble the report piece by piece and join once at the end
    pieces = ["📝 Parsed information:\n\n"]

    if found_urls:
        pieces.append("GitHub URLs found:\n")
        pieces.extend(f"  • {url}\n" for url in found_urls)
    else:
        pieces.append("No GitHub URLs found\n")

    pieces.append(
        f"\nTarget path: {destination}"
        if destination
        else "\nTarget path: Not specified (will use repository name)"
    )

    return "".join(pieces)


@mcp.tool()
async def git_clone(
    repo_url: str, target_path: Optional[str] = None, branch: Optional[str] = None
) -> str:
    """
    Clone a specific GitHub repository.

    Args:
        repo_url: GitHub repository URL
        target_path: Optional target directory path; defaults to the
            repository name inferred from the URL. Relative paths are
            resolved against the current working directory.
        branch: Optional branch name to clone

    Returns:
        Status message about the clone operation
    """
    # Check that Git is available
    if not await check_git_installed():
        return "❌ Error: Git is not installed or not in system PATH"

    # Default the target to the repository name
    if not target_path:
        extractor = GitHubURLExtractor()
        target_path = extractor.infer_repo_name(repo_url)

    # Convert to an absolute path
    if not os.path.isabs(target_path):
        target_path = str(Path.cwd() / target_path)

    # Never clone over an existing path
    if os.path.exists(target_path):
        return f"❌ Error: Target path already exists: {target_path}"

    # Build the command
    cmd = ["git", "clone"]
    if branch:
        cmd.extend(["-b", branch])
    # "--" ends option parsing, so a caller-supplied URL or path that starts
    # with "-" cannot be interpreted as a git option
    cmd.extend(["--", repo_url, target_path])

    # Run the clone
    try:
        proc = await asyncio.create_subprocess_exec(
            *cmd, stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE
        )

        stdout, stderr = await proc.communicate()

        if proc.returncode == 0:
            result = "✅ Successfully cloned repository\n"
            result += f"Repository: {repo_url}\n"
            result += f"Location: {target_path}"
            if branch:
                result += f"\nBranch: {branch}"
            return result
        else:
            return f"❌ Clone failed\nError: {stderr.decode('utf-8', errors='replace')}"

    except Exception as e:
        return f"❌ Clone failed\nError: {str(e)}"


# Script entry point
if __name__ == "__main__":
    # Startup banner listing the tools this server exposes
    banner_lines = (
        "🚀 GitHub Repository Downloader MCP Tool",
        "📝 Starting server with FastMCP...",
        "\nAvailable tools:",
        "  • download_github_repo - Download repos from natural language",
        "  • parse_github_urls - Extract GitHub URLs from text",
        "  • git_clone - Clone a specific repository",
        "",
    )
    for banner_line in banner_lines:
        print(banner_line)

    # Run the server
    mcp.run()


================================================
FILE: tools/indexer_config.yaml
================================================
# Code Indexer Configuration File
# Configure various aspects of the code indexing process

# Paths Configuration
paths:
  code_base_path: "D:/Documents/GitHub/Code-Agent/examples/input/paper1/code_base"
  output_dir: "D:/Documents/GitHub/Code-Agent/examples/input/paper1/indexes"

# File Analysis Settings
file_analysis:
  # Supported file extensions for analysis
  supported_extensions:
    - ".py"      # Python
    - ".js"      # JavaScript
    - ".ts"      # TypeScript
    - ".java"    # Java
    - ".cpp"     # C++
    - ".c"       # C
    - ".h"       # C Header
    - ".hpp"     # C++ Header
    - ".cs"      # C#
    - ".php"     # PHP
    - ".rb"      # Ruby
    - ".go"      # Go
    - ".rs"      # Rust
    - ".scala"   # Scala
    - ".kt"      # Kotlin
    - ".swift"   # Swift
    - ".r"       # R
    - ".sql"     # SQL
    - ".sh"      # Shell Script
    - ".bat"     # Batch File
    - ".ps1"     # PowerShell
    - ".yaml"    # YAML
    - ".yml"     # YAML
    - ".json"    # JSON
    - ".xml"     # XML
    - ".toml"    # TOML

  # Directories to skip during traversal
  skip_directories:
    - "__pycache__"
    - "node_modules"
    - "target"
    - "build"
    - "dist"
    - "venv"
    - "env"
    - ".git"
    - ".svn"
    - ".hg"
    - "coverage"
    - ".pytest_cache"
    - ".mypy_cache"

  # Maximum file size to analyze (in bytes)
  max_file_size: 1048576  # 1MB

  # Maximum content length to send to LLM (in characters)
  max_content_length: 3000

# LLM Configuration
llm:
  # Model selection: "anthropic" or "openai"
  model_provider: "openai"

  # Request parameters
  max_tokens: 4000
  temperature: 0.3

  # System prompt for analysis
  system_prompt: "You are a code analysis expert. Provide precise, structured analysis of code relationships and similarities."

  # Rate limiting (seconds between requests)
  request_delay: 0.1

  # Retry configuration
  max_retries: 3
  retry_delay: 1.0

# Relationship Analysis Settings
relationships:
  # Minimum confidence score to include a relationship
  min_confidence_score: 0.3

  # High confidence threshold for reporting
  high_confidence_threshold: 0.7

  # Relationship types and their priorities
  relationship_types:
    direct_match: 1.0      # Direct implementation match
    partial_match: 0.8     # Partial functionality match
    reference: 0.6         # Reference or utility function
    utility: 0.4           # General utility or helper

# Output Configuration
output:
  # JSON formatting options
  json_indent: 2
  ensure_ascii: false

  # Generate additional report files
  generate_summary: true
  generate_statistics: true

  # Include metadata in output
  include_metadata: true

  # File naming pattern (use {repo_name} placeholder)
  index_filename_pattern: "{repo_name}_index.json"
  summary_filename: "indexing_summary.json"
  stats_filename: "indexing_statistics.json"

# Logging Configuration
logging:
  level: "INFO"  # DEBUG, INFO, WARNING, ERROR
  log_to_file: true
  log_file: "indexer.log"
  log_format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"

# Performance Settings
performance:
  # Enable concurrent processing of files within a repository
  enable_concurrent_analysis: true
  max_concurrent_files: 5

  # Memory optimization
  enable_content_caching: false
  max_cache_size: 100

# Debug and Development Settings
debug:
  # Save raw LLM responses for debugging
  save_raw_responses: false
  raw_responses_dir: "debug_responses"

  # Verbose output during processing
  verbose_output: false

  # Skip LLM calls for testing (uses mock responses)
  mock_llm_responses: false


================================================
FILE: tools/pdf_converter.py
================================================
#!/usr/bin/env python3
"""
PDF Converter Utility

This module provides functionality for converting various document formats to PDF,
including Office documents (.doc, .docx, .ppt, .pptx, .xls, .xlsx) and text files (.txt, .md).

Requirements:
- LibreOffice for Office document conversion
- ReportLab for text-to-PDF conversion
"""

from __future__ import annotations

import argparse
import logging
import subprocess
import tempfile
import shutil
import platform
import os
from pathlib import Path
from typing import Union, Optional, Dict, Any, List


class PDFConverter:
    """
    PDF conversion utility class.

    Provides methods to convert Office documents and text files to PDF format.
    """

    # Define supported file formats
    OFFICE_FORMATS = {".doc", ".docx", ".ppt", ".pptx", ".xls", ".xlsx"}
    TEXT_FORMATS = {".txt", ".md"}

    # Class-level logger
    logger = logging.getLogger(__name__)

    def __init__(self) -> None:
        """Initialize the PDF converter."""
        pass

    @staticmethod
    def find_libreoffice_windows() -> Optional[str]:
        """
        Find LibreOffice installation on Windows.
        
        Returns:
            Path to soffice.exe if found, None otherwise
        """
        if platform.system() != "Windows":
            return None
            
        # Common LibreOffice installation paths on Windows
        possible_paths = [
            r"C:\Program Files\LibreOffice\program\soffice.exe",
            r"C:\Program Files (x86)\LibreOffice\program\soffice.exe",
        ]
        
        # Also check PROGRAMFILES environment variables
        program_files = os.environ.get("PROGRAMFILES")
        program_files_x86 = os.environ.get("PROGRAMFILES(X86)")
        
        if program_files:
            possible_paths.append(os.path.join(program_files, "LibreOffice", "program", "soffice.exe"))
        if program_files_x86:
            possible_paths.append(os.path.join(program_files_x86, "LibreOffice", "program", "soffice.exe"))
        
        # Check each path
        for path in possible_paths:
            if os.path.exists(path):
                return path
                
        return None

    @staticmethod
    def convert_office_to_pdf(
        doc_path: Union[str, Path], output_dir: Optional[str] = None
    ) -> Path:
        """
        Convert Office document (.doc, .docx, .ppt, .pptx, .xls, .xlsx) to PDF.
        Requires LibreOffice to be installed.

        Args:
            doc_path: Path to the Office document file
            output_dir: Output directory for the PDF file

        Returns:
            Path to the generated PDF file
        """
        try:
            # Convert to Path object for easier handling
            doc_path = Path(doc_path)
            if not doc_path.exists():
                raise FileNotFoundError(f"Office document does not exist: {doc_path}")

            name_without_suff = doc_path.stem

            # Prepare output directory
            if output_dir:
                base_output_dir = Path(output_dir)
            else:
                # Generate unique folder name with timestamp to avoid conflicts
                import time
                timestamp = int(time.time())
                folder_name = f"paper_{timestamp}"
                
                # Save to workspace instead of temp directory
                workspace_base = Path(os.getcwd()) / "deepcode_lab" / "papers"
                workspace_base.mkdir(parents=True, exist_ok=True)
                base_output_dir = workspace_base / folder_name

            base_output_dir.mkdir(parents=True, exist_ok=True)

            # Check if LibreOffice is available
            libreoffice_available = False
            working_libreoffice_cmd: Optional[str] = None

            # Prepare subprocess parameters to hide console window on Windows
            subprocess_kwargs: Dict[str, Any] = {
                "capture_output": True,
                "check": True,
                "timeout": 10,
                "encoding": "utf-8",
                "errors": "ignore",
            }

            # Hide console window on Windows
            if platform.system() == "Windows":
                # Use CREATE_NO_WINDOW to prevent console window from appearing
                subprocess_kwargs["creationflags"] = 0x08000000
                # Also configure startupinfo to hide window
                startupinfo = subprocess.STARTUPINFO()
                startupinfo.dwFlags |= subprocess.STARTF_USESHOWWINDOW
                startupinfo.wShowWindow = subprocess.SW_HIDE
                subprocess_kwargs["startupinfo"] = startupinfo

            # On Windows, try to find LibreOffice in standard installation paths first
            # Don't run --version check on Windows as it can cause window/hanging issues
            if platform.system() == "Windows":
                windows_path = PDFConverter.find_libreoffice_windows()
                if windows_path:
                    libreoffice_available = True
                    working_libreoffice_cmd = windows_path
                    logging.info(f"LibreOffice detected at {windows_path}")

            # On non-Windows systems, try standard commands
            if not libreoffice_available and platform.system() != "Windows":
                try:
                    result = subprocess.run(
                        ["libreoffice", "--version"], **subprocess_kwargs
                    )
                    libreoffice_available = True
                    working_libreoffice_cmd = "libreoffice"
                    logging.info(f"LibreOffice detected: {result.stdout.strip()}")  # type: ignore
                except (
                    subprocess.CalledProcessError,
                    FileNotFoundError,
                    subprocess.TimeoutExpired,
                ):
                    pass

            # Try alternative commands for LibreOffice (non-Windows)
            if not libreoffice_available and platform.system() != "Windows":
                for cmd in ["soffice", "libreoffice"]:
                    try:
                        result = subprocess.run([cmd, "--version"], **subprocess_kwargs)
                        libreoffice_available = True
                        working_libreoffice_cmd = cmd
                        logging.info(
                            f"LibreOffice detected with command '{cmd}': {result.stdout.strip()}"  # type: ignore
                        )
                        break
                    except (
                        subprocess.CalledProcessError,
                        FileNotFoundError,
                        subprocess.TimeoutExpired,
                    ):
                        continue

            if not libreoffice_available:
                raise RuntimeError(
                    "LibreOffice is required for Office document conversion but was not found.\n"
                    "Please install LibreOffice:\n"
                    "- Windows: Download from https://www.libreoffice.org/download/download/\n"
                    "- macOS: brew install --cask libreoffice\n"
                    "- Ubuntu/Debian: sudo apt-get install libreoffice\n"
                    "- CentOS/RHEL: sudo yum install libreoffice\n"
                    "Alternatively, convert the document to PDF manually."
                )

            # Create temporary directory for PDF conversion
            with tempfile.TemporaryDirectory() as temp_dir:
                temp_path = Path(temp_dir)

                # Convert to PDF using LibreOffice
                logging.info(f"Converting {doc_path.name} to PDF using LibreOffice...")

                # Use the working LibreOffice command first, then try alternatives if it fails
                commands_to_try = [working_libreoffice_cmd]
                
                # Add alternative commands based on what was found
                if platform.system() == "Windows" and working_libreoffice_cmd:
                    # If we're using the full Windows path, also try standard commands
                    if "Program Files" in working_libreoffice_cmd:
                        commands_to_try.extend(["soffice", "libreoffice"])
                elif working_libreoffice_cmd == "libreoffice":
                    commands_to_try.append("soffice")
                else:
                    commands_to_try.append("libreoffice")

                conversion_successful = False
                for cmd in commands_to_try:
                    if cmd is None:
                        continue
                    try:
                        convert_cmd = [
                            cmd,
                            "--headless",
                            "--convert-to",
                            "pdf",
                            "--outdir",
                            str(temp_path),
                            str(doc_path),
                        ]

                        # Prepare conversion subprocess parameters
                        convert_subprocess_kwargs: Dict[str, Any] = {
                            "capture_output": True,
                            "text": True,
                            "timeout": 60,  # 60 second timeout
                            "encoding": "utf-8",
                            "errors": "ignore",
                        }

                        # Hide console window on Windows
                        if platform.system() == "Windows":
                            convert_subprocess_kwargs["creationflags"] = 0x08000000
                            # Also configure startupinfo to hide window
                            startupinfo = subprocess.STARTUPINFO()
                            startupinfo.dwFlags |= subprocess.STARTF_USESHOWWINDOW
                            startupinfo.wShowWindow = subprocess.SW_HIDE
                            convert_subprocess_kwargs["startupinfo"] = startupinfo

                        result = subprocess.run(
                            convert_cmd, **convert_subprocess_kwargs
                        )

                        if result.returncode == 0:  # type: ignore
                            conversion_successful = True
                            logging.info(
                                f"Successfully converted {doc_path.name} to PDF"
                            )
                            break
                        else:
                            logging.warning(
                                f"LibreOffice command '{cmd}' failed: {result.stderr}"  # type: ignore
                            )
                    except subprocess.TimeoutExpired:
                        logging.warning(f"LibreOffice command '{cmd}' timed out")
                    except Exception as e:
                        logging.error(
                            f"LibreOffice command '{cmd}' failed with exception: {e}"
                        )

                if not conversion_successful:
                    raise RuntimeError(
                        f"LibreOffice conversion failed for {doc_path.name}. "
                        f"Please check if the file is corrupted or try converting manually."
                    )

                # Find the generated PDF
                pdf_files = list(temp_path.glob("*.pdf"))
                if not pdf_files:
                    raise RuntimeError(
                        f"PDF conversion failed for {doc_path.name} - no PDF file generated. "
                        f"Please check LibreOffice installation or try manual conversion."
                    )

                pdf_path = pdf_files[0]
                logging.info(
                    f"Generated PDF: {pdf_path.name} ({pdf_path.stat().st_size} bytes)"
                )

                # Validate the generated PDF
                if pdf_path.stat().st_size < 100:  # Very small file, likely empty
                    raise RuntimeError(
                        "Generated PDF appears to be empty or corrupted. "
                        "Original file may have issues or LibreOffice conversion failed."
                    )

                # Copy PDF to final output directory
                final_pdf_path = base_output_dir / f"{name_without_suff}.pdf"
                shutil.copy2(pdf_path, final_pdf_path)
                
                print(f"✅ PDF saved to: {final_pdf_path}")
                print(f"   File size: {final_pdf_path.stat().st_size} bytes")
                print(f"   Parent folder: {base_output_dir}")

                return final_pdf_path

        except Exception as e:
            logging.error(f"Error in convert_office_to_pdf: {str(e)}")
            raise

    @staticmethod
    def convert_text_to_pdf(
        text_path: Union[str, Path], output_dir: Optional[str] = None
    ) -> Path:
        """
        Convert text file (.txt, .md) to PDF using ReportLab with full markdown support.

        Args:
            text_path: Path to the text file
            output_dir: Output directory for the PDF file

        Returns:
            Path to the generated PDF file
        """
        try:
            text_path = Path(text_path)
            if not text_path.exists():
                raise FileNotFoundError(f"Text file does not exist: {text_path}")

            # Supported text formats
            supported_text_formats = {".txt", ".md"}
            if text_path.suffix.lower() not in supported_text_formats:
                raise ValueError(f"Unsupported text format: {text_path.suffix}")

            # Read the text content
            try:
                with open(text_path, "r", encoding="utf-8") as f:
                    text_content = f.read()
            except UnicodeDecodeError:
                # Try with different encodings
                for encoding in ["gbk", "latin-1", "cp1252"]:
                    try:
                        with open(text_path, "r", encoding=encoding) as f:
                            text_content = f.read()
                        logging.info(f"Successfully read file with {encoding} encoding")
                        break
                    except UnicodeDecodeError:
                        continue
                else:
                    raise RuntimeError(
                        f"Could not decode text file {text_path.name} with any supported encoding"
                    )

            # Prepare output directory
            if output_dir:
                base_output_dir = Path(output_dir)
            else:
                # Generate unique folder name with timestamp to avoid conflicts
                import time
                timestamp = int(time.time())
                folder_name = f"paper_{timestamp}"
                
                # Save to workspace instead of temp directory
                workspace_base = Path(os.getcwd()) / "deepcode_lab" / "papers"
                workspace_base.mkdir(parents=True, exist_ok=True)
                base_output_dir = workspace_base / folder_name

            base_output_dir.mkdir(parents=True, exist_ok=True)
            pdf_path = base_output_dir / f"{text_path.stem}.pdf"

            # Convert text to PDF
            logging.info(f"Converting {text_path.name} to PDF...")

            try:
                from reportlab.lib.pagesizes import A4
                from reportlab.platypus import SimpleDocTemplate, Paragraph, Spacer
                from reportlab.lib.styles import getSampleStyleSheet, ParagraphStyle
                from reportlab.lib.units import inch
                from reportlab.pdfbase import pdfmetrics

                # Create PDF document
                doc = SimpleDocTemplate(
                    str(pdf_path),
                    pagesize=A4,
                    leftMargin=inch,
                    rightMargin=inch,
                    topMargin=inch,
                    bottomMargin=inch,
                )

                # Get styles
                styles = getSampleStyleSheet()
                normal_style = styles["Normal"]
                heading_style = styles["Heading1"]

                # Try to register a font that supports Chinese characters
                try:
                    # Try to use system fonts that support Chinese
                    system = platform.system()
                    if system == "Windows":
                        # Try common Windows fonts
                        for font_name in ["SimSun", "SimHei", "Microsoft YaHei"]:
                            try:
                                from reportlab.pdfbase.cidfonts import (
                                    UnicodeCIDFont,
                                )

                                pdfmetrics.registerFont(UnicodeCIDFont(font_name))  # type: ignore
                                normal_style.fontName = font_name
                                heading_style.fontName = font_name
                                break
                            except Exception:
                                continue
                    elif system == "Darwin":  # macOS
                        for font_name in ["STSong-Light", "STHeiti"]:
                            try:
                                from reportlab.pdfbase.cidfonts import (
                                    UnicodeCIDFont,
                                )

                                pdfmetrics.registerFont(UnicodeCIDFont(font_name))  # type: ignore
                                normal_style.fontName = font_name
                                heading_style.fontName = font_name
                                break
                            except Exception:
                                continue
                except Exception:
                    pass  # Use default fonts if Chinese font setup fails

                # Build content
                story = []

                # Handle markdown or plain text
                if text_path.suffix.lower() == ".md":
                    # Handle markdown content - simplified implementation
                    lines = text_content.split("\n")
                    for line in lines:
                        line = line.strip()
                        if not line:
                            story.append(Spacer(1, 12))
                            continue

                        # Headers
                        if line.startswith("#"):
                            level = len(line) - len(line.lstrip("#"))
                            header_text = line.lstrip("#").strip()
                            if header_text:
                                header_style = ParagraphStyle(
                                    name=f"Heading{level}",
                                    parent=heading_style,
                                    fontSize=max(16 - level, 10),
                                    spaceAfter=8,
                                    spaceBefore=16 if level <= 2 else 12,
                                )
                                story.append(Paragraph(header_text, header_style))
                        else:
                            # Regular text
                            processed_line = PDFConverter._process_inline_markdown(line)
                            story.append(Paragraph(processed_line, normal_style))
                            story.append(Spacer(1, 6))
                else:
                    # Handle plain text files (.txt)
                    logging.info(
                        f"Processing plain text file with {len(text_content)} characters..."
                    )

                    # Split text into lines and process each line
                    lines = text_content.split("\n")
                    line_count = 0

                    for line in lines:
                        line = line.rstrip()
                        line_count += 1

                        # Empty lines
                        if not line.strip():
                            story.append(Spacer(1, 6))
                            continue

                        # Regular text lines
                        # Escape special characters for ReportLab
                        safe_line = (
                            line.replace("&", "&amp;")
                            .replace("<", "&lt;")
                            .replace(">", "&gt;")
                        )

                        # Create paragraph
                        story.append(Paragraph(safe_line, normal_style))
                        story.append(Spacer(1, 3))

                    logging.info(f"Added {line_count} lines to PDF")

                    # If no content was added, add a placeholder
                    if not story:
                        story.append(Paragraph("(Empty text file)", normal_style))

                # Build PDF
                doc.build(story)
                logging.info(
                    f"Successfully converted {text_path.name} to PDF ({pdf_path.stat().st_size / 1024:.1f} KB)"
                )

            except ImportError:
                raise RuntimeError(
                    "reportlab is required for text-to-PDF conversion. "
                    "Please install it using: pip install reportlab"
                )
            except Exception as e:
                raise RuntimeError(
                    f"Failed to convert text file {text_path.name} to PDF: {str(e)}"
                )

            # Validate the generated PDF
            if not pdf_path.exists() or pdf_path.stat().st_size < 100:
                raise RuntimeError(
                    f"PDF conversion failed for {text_path.name} - generated PDF is empty or corrupted."
                )

            print(f"✅ PDF saved to: {pdf_path}")
            print(f"   File size: {pdf_path.stat().st_size} bytes")
            print(f"   Parent folder: {base_output_dir}")
            
            return pdf_path

        except Exception as e:
            logging.error(f"Error in convert_text_to_pdf: {str(e)}")
            raise

    @staticmethod
    def _process_inline_markdown(text: str) -> str:
        """
        Process inline markdown formatting (bold, italic, code, links)

        Args:
            text: Raw text with markdown formatting

        Returns:
            Text with ReportLab markup
        """
        import re

        # Escape special characters for ReportLab
        text = text.replace("&", "&amp;").replace("<", "&lt;").replace(">", "&gt;")

        # Bold text: **text** or __text__
        text = re.sub(r"\*\*(.*?)\*\*", r"<b>\1</b>", text)
        text = re.sub(r"__(.*?)__", r"<b>\1</b>", text)

        # Italic text: *text* or _text_ (but not in the middle of words)
        text = re.sub(r"(?<!\w)\*([^*\n]+?)\*(?!\w)", r"<i>\1</i>", text)
        text = re.sub(r"(?<!\w)_([^_\n]+?)_(?!\w)", r"<i>\1</i>", text)

        # Inline code: `code`
        text = re.sub(
            r"`([^`]+?)`",
            r'<font name="Courier" size="9" color="darkred">\1</font>',
            text,
        )

        # Links: [text](url) - convert to text with URL annotation
        def link_replacer(match):
            link_text = match.group(1)
            url = match.group(2)
            return f'<link href="{url}" color="blue"><u>{link_text}</u></link>'

        text = re.sub(r"\[([^\]]+?)\]\(([^)]+?)\)", link_replacer, text)

        # Strikethrough: ~~text~~
        text = re.sub(r"~~(.*?)~~", r"<strike>\1</strike>", text)

        return text

    def convert_to_pdf(
        self,
        file_path: Union[str, Path],
        output_dir: Optional[str] = None,
    ) -> Path:
        """
        Convert document to PDF based on file extension

        Args:
            file_path: Path to the file to be converted
            output_dir: Output directory path

        Returns:
            Path to the generated PDF file
        """
        # Convert to Path object
        file_path = Path(file_path)
        if not file_path.exists():
            raise FileNotFoundError(f"File does not exist: {file_path}")

        # Get file extension
        ext = file_path.suffix.lower()

        # Choose appropriate conversion method based on file type
        if ext in self.OFFICE_FORMATS:
            return self.convert_office_to_pdf(file_path, output_dir)
        elif ext in self.TEXT_FORMATS:
            return self.convert_text_to_pdf(file_path, output_dir)
        else:
            raise ValueError(
                f"Unsupported file format: {ext}. "
                f"Supported formats: {', '.join(self.OFFICE_FORMATS | self.TEXT_FORMATS)}"
            )

    def check_dependencies(self) -> dict:
        """
        Check if required dependencies are available

        Returns:
            dict: Dictionary with dependency check results
        """
        results = {
            "libreoffice": False,
            "reportlab": False,
        }

        # Check LibreOffice
        # On Windows, just check if the executable exists (don't run it to avoid window issues)
        if platform.system() == "Windows":
            windows_path = PDFConverter.find_libreoffice_windows()
            if windows_path:
                results["libreoffice"] = True
        else:
            # On non-Windows systems, try running the version command
            try:
                subprocess_kwargs: Dict[str, Any] = {
                    "capture_output": True,
                    "text": True,
                    "check": True,
                    "timeout": 5,
                    "encoding": "utf-8",
                    "errors": "ignore",
                }

                try:
                    subprocess.run(["libreoffice", "--version"], **subprocess_kwargs)
                    results["libreoffice"] = True
                except (subprocess.CalledProcessError, FileNotFoundError, subprocess.TimeoutExpired):
                    try:
                        subprocess.run(["soffice", "--version"], **subprocess_kwargs)
                        results["libreoffice"] = True
                    except (subprocess.CalledProcessError, FileNotFoundError, subprocess.TimeoutExpired):
                        pass
            except Exception:
                # If any unexpected error occurs during LibreOffice check, silently pass
                pass

        # Check ReportLab
        import importlib.util

        if importlib.util.find_spec("reportlab") is not None:
            results["reportlab"] = True

        return results


def main():
    """
    Command-line entry point for the PDF converter.

    With ``--check`` the dependency status is printed (plus install hints for
    whatever is missing). Otherwise the given file is converted and the
    location and size of the resulting PDF are printed.

    Returns:
        0 on success (including ``--check``), 1 when the conversion raised.
    """
    cli = argparse.ArgumentParser(description="Convert documents to PDF format")
    cli.add_argument("file_path", nargs="?", help="Path to the document to convert")
    cli.add_argument("--output", "-o", help="Output directory path")
    cli.add_argument(
        "--check", action="store_true", help="Check dependencies installation"
    )
    cli.add_argument(
        "--verbose", "-v", action="store_true", help="Enable verbose logging"
    )
    options = cli.parse_args()

    # Verbose mode lowers the threshold from WARNING to INFO
    logging.basicConfig(
        level=logging.INFO if options.verbose else logging.WARNING,
        format="%(asctime)s - %(levelname)s - %(message)s",
        datefmt="%Y-%m-%d %H:%M:%S",
    )

    converter = PDFConverter()

    if options.check:

        def availability(found):
            return "✅ Available" if found else "❌ Not found"

        print("🔍 Checking dependencies...")
        status = converter.check_dependencies()

        print(f"LibreOffice: {availability(status['libreoffice'])}")
        print(f"ReportLab: {availability(status['reportlab'])}")

        if not status["libreoffice"]:
            for hint in (
                "\n📋 To install LibreOffice:",
                "  - Windows: Download from https://www.libreoffice.org/",
                "  - macOS: brew install --cask libreoffice",
                "  - Ubuntu/Debian: sudo apt-get install libreoffice",
            ):
                print(hint)

        if not status["reportlab"]:
            for hint in ("\n📋 To install ReportLab:", "  pip install reportlab"):
                print(hint)

        return 0

    # A file is mandatory unless only the dependency check was requested
    if not options.file_path:
        cli.error("file_path is required when not using --check")

    try:
        output_pdf = converter.convert_to_pdf(
            file_path=options.file_path,
            output_dir=options.output,
        )
        print(f"✅ Successfully converted to PDF: {output_pdf}")
        print(f"📄 File size: {output_pdf.stat().st_size / 1024:.1f} KB")
    except Exception as exc:
        print(f"❌ Error: {exc}")
        return 1

    return 0


if __name__ == "__main__":
    # Propagate main()'s return value as the process exit status. SystemExit
    # is raised directly because the bare exit() helper is injected by the
    # `site` module and is not guaranteed to exist (e.g. under `python -S`).
    raise SystemExit(main())


================================================
FILE: tools/pdf_downloader.py
================================================
#!/usr/bin/env python3
"""
Smart PDF Downloader MCP Tool

A standardized MCP tool using FastMCP for intelligent file downloading and document conversion.
Supports natural language instructions for downloading files from URLs, moving local files,
and automatic conversion to Markdown format with image extraction.

Features:
- Natural language instruction parsing
- URL and local path extraction
- Automatic document conversion (PDF, DOCX, PPTX, HTML, etc.)
- Image extraction and preservation
- Multi-format support with fallback options
"""

import os
import re
import aiohttp
import aiofiles
import shutil
import sys
import io
from typing import List, Dict, Optional, Any
from urllib.parse import urlparse, unquote
from datetime import datetime

from mcp.server import FastMCP

# Docling imports for document conversion (optional dependency)
try:
    from docling.document_converter import DocumentConverter
    from docling.datamodel.base_models import InputFormat
    from docling.datamodel.pipeline_options import PdfPipelineOptions
    from docling.document_converter import PdfFormatOption

    DOCLING_AVAILABLE = True
except ImportError:
    DOCLING_AVAILABLE = False
    # Diagnostics go to stderr so they cannot mix with protocol traffic on
    # stdout. NOTE(review): assumes this server is run over the stdio
    # transport - confirm against how the tool is launched.
    print(
        "Warning: docling package not available. Document conversion will be disabled.",
        file=sys.stderr,
    )

# Fallback PDF text extraction (optional dependency)
try:
    import PyPDF2

    PYPDF2_AVAILABLE = True
except ImportError:
    PYPDF2_AVAILABLE = False
    print(
        "Warning: PyPDF2 package not available. Fallback PDF extraction will be disabled.",
        file=sys.stderr,
    )

# Set the standard output encoding to UTF-8
if sys.stdout.encoding != "utf-8":
    try:
        if hasattr(sys.stdout, "reconfigure"):
            sys.stdout.reconfigure(encoding="utf-8")
            sys.stderr.reconfigure(encoding="utf-8")
        else:
            # No reconfigure(): re-wrap the underlying binary streams instead
            sys.stdout = io.TextIOWrapper(sys.stdout.detach(), encoding="utf-8")
            sys.stderr = io.TextIOWrapper(sys.stderr.detach(), encoding="utf-8")
    except Exception as e:
        print(f"Warning: Could not set UTF-8 encoding: {e}", file=sys.stderr)

# Create the FastMCP instance
mcp = FastMCP("smart-pdf-downloader")


# Helper functions
def format_success_message(action: str, details: Dict[str, Any]) -> str:
    """Format a success message: a headline for ``action`` followed by one
    indented ``key: value`` line per entry of ``details``."""
    detail_lines = [f"   {key}: {value}" for key, value in details.items()]
    headline = f"✅ {action}\n"
    return headline + "\n".join(detail_lines)


def format_error_message(action: str, error: str) -> str:
    """Format an error message: a headline for ``action`` followed by an
    indented ``Error:`` line carrying ``error``."""
    return "❌ {}\n   Error: {}".format(action, error)


def format_warning_message(action: str, warning: str) -> str:
    """Format a warning message: a headline for ``action`` followed by an
    indented ``Warning:`` line carrying ``warning``."""
    return "⚠️ {}\n   Warning: {}".format(action, warning)


async def perform_document_conversion(
    file_path: str, extract_images: bool = True
) -> Optional[str]:
    """
    Shared post-processing step: try to convert a stored file to Markdown.

    Only PDF files are converted, using ``SimplePdfConverter`` (PyPDF2).
    A file counts as a PDF when its first bytes start with ``%PDF``; if the
    file cannot be read, the ``.pdf`` extension is used as a fallback.

    Args:
        file_path: Path of the file to convert.
        extract_images: Not used by the PyPDF2 path; kept in the signature
            for the (currently disabled) docling conversion.

    Returns:
        A message fragment describing the conversion outcome (it starts with
        a newline so it can be appended to a report), or None when no
        conversion was attempted.
    """
    if not file_path or not PYPDF2_AVAILABLE:
        return None

    # Sniff the magic bytes so PDFs are recognised regardless of extension.
    try:
        with open(file_path, "rb") as handle:
            looks_like_pdf = handle.read(8).startswith(b"%PDF")
    except Exception:
        looks_like_pdf = file_path.lower().endswith(".pdf")

    if not looks_like_pdf:
        return None

    # NOTE: a docling-based fallback (DoclingConverter.convert_to_markdown,
    # which can also extract images) used to follow the PyPDF2 attempt but is
    # currently disabled.
    try:
        outcome = SimplePdfConverter().convert_pdf_to_markdown(file_path)
        if not outcome["success"]:
            return f"\n   [WARNING] PDF conversion failed: {outcome['error']}"
        return "".join(
            (
                "\n   [INFO] PDF converted to Markdown (PyPDF2)",
                f"\n   Markdown file: {outcome['output_file']}",
                f"\n   Conversion time: {outcome['duration']:.2f} seconds",
                f"\n   Pages extracted: {outcome['pages_extracted']}",
            )
        )
    except Exception as conv_error:
        return f"\n   [WARNING] PDF conversion error: {str(conv_error)}"


def format_file_operation_result(
    operation: str,
    source: str,
    destination: str,
    result: Dict[str, Any],
    conversion_msg: Optional[str] = None,
) -> str:
    """
    Render the outcome of a download/copy/move as a human-readable report.

    Args:
        operation: Operation type ("download", "copy", or "move").
        source: Source file or URL.
        destination: Target path.
        result: Result dictionary; reads "success" and, on success, "size",
            "duration" and (for downloads) the optional "speed"; on failure
            the optional "error".
        conversion_msg: Optional conversion message appended verbatim to a
            successful report.

    Returns:
        The formatted result message.
    """
    if not result["success"]:
        return f"[ERROR] Failed to {operation}: {source}\n   Error: {result.get('error', 'Unknown error')}"

    size_mb = result["size"] / (1024 * 1024)

    # Any operation other than copy/download is reported as a move.
    past_tense = {"copy": "copied", "download": "downloaded"}.get(operation, "moved")
    lines = [f"[SUCCESS] Successfully {past_tense}: {source}"]

    if operation == "download":
        lines.append(f"   File: {destination}")
        lines.append(f"   Size: {size_mb:.2f} MB")
        lines.append(f"   Time: {result['duration']:.2f} seconds")
        speed_mb = result.get("speed", 0) / (1024 * 1024)
        lines.append(f"   Speed: {speed_mb:.2f} MB/s")
    else:
        lines.append(f"   To: {destination}")
        lines.append(f"   Size: {size_mb:.2f} MB")
        lines.append(f"   Time: {result['duration']:.2f} seconds")
        if operation == "copy":
            lines.append("   Note: Original file preserved")

    report = "\n".join(lines)
    if conversion_msg:
        report += conversion_msg
    return report


class LocalPathExtractor:
    """Find local filesystem paths mentioned in free-form text."""

    # Substrings whose presence makes a token look like a path. A file
    # extension always contains ".", so no separate extension test is needed.
    _PATH_INDICATORS = (os.path.sep, "/", "\\", "~", ".")

    # Candidate patterns: quoted strings, names with an extension, POSIX-style
    # paths, Windows drive paths and explicit relative paths.
    _CANDIDATE_PATTERNS = (
        r'"([^"]+)"',
        r"'([^']+)'",
        r"(?:^|\s)((?:[~./\\]|[A-Za-z]:)?(?:[^/\\\s]+[/\\])*[^/\\\s]+\.[A-Za-z0-9]+)(?:\s|$)",
        r"(?:^|\s)((?:~|\.{1,2})?/[^\s]+)(?:\s|$)",
        r"(?:^|\s)([A-Za-z]:[/\\][^\s]+)(?:\s|$)",
        r"(?:^|\s)(\.{1,2}[/\\][^\s]+)(?:\s|$)",
    )

    @staticmethod
    def is_local_path(path: str) -> bool:
        """Return True when *path* looks like a local path rather than a URL.

        Surrounding quotes are ignored. Strings with an http/https/ftp scheme
        are never local. Strings starting with ``www.`` are treated as web
        addresses unless something with that name actually exists on disk;
        otherwise they would be handled both as a URL and as a (missing)
        local file. Any other string counts as a path as soon as it contains
        a separator, ``~`` or a dot; the path does not have to exist.
        """
        path = path.strip("\"'")

        if re.match(r"^(?:https?|ftp)://", path, re.IGNORECASE):
            return False

        if re.match(r"^www\.", path, re.IGNORECASE):
            return os.path.exists(os.path.expanduser(path))

        return any(
            indicator in path for indicator in LocalPathExtractor._PATH_INDICATORS
        )

    @staticmethod
    def extract_local_paths(text: str) -> List[str]:
        """Extract local file paths from *text*.

        Returns:
            The user-expanded paths in order of first appearance, without
            duplicates.
        """
        candidates: List[str] = []
        for pattern in LocalPathExtractor._CANDIDATE_PATTERNS:
            candidates.extend(re.findall(pattern, text, re.MULTILINE))

        local_paths: List[str] = []
        seen = set()
        for candidate in candidates:
            candidate = candidate.strip()
            if not candidate or not LocalPathExtractor.is_local_path(candidate):
                continue
            expanded = os.path.expanduser(candidate)
            if expanded not in seen:
                seen.add(expanded)
                local_paths.append(expanded)

        return local_paths


class URLExtractor:
    """Extract downloadable URLs from free-form text and derive file names for them."""

    URL_PATTERNS = [
        r"https?://(?:[-\w.]|(?:%[\da-fA-F]{2}))+(?:/(?:[-\w._~!$&\'()*+,;=:@]|%[\da-fA-F]{2})*)*(?:\?(?:[-\w._~!$&\'()*+,;=:@/?]|%[\da-fA-F]{2})*)?(?:#(?:[-\w._~!$&\'()*+,;=:@/?]|%[\da-fA-F]{2})*)?",
        r"ftp://(?:[-\w.]|(?:%[\da-fA-F]{2}))+(?:/(?:[-\w._~!$&\'()*+,;=:@]|%[\da-fA-F]{2})*)*",
        r"(?<!\S)(?:www\.)?[-\w]+(?:\.[-\w]+)+/(?:[-\w._~!$&\'()*+,;=:@/]|%[\da-fA-F]{2})+",
    ]

    # Characters that end a sentence rather than a URL when they trail a match.
    _TRAILING_PUNCTUATION = ".,;:!?"

    @staticmethod
    def convert_arxiv_url(url: str) -> str:
        """Turn an arXiv abstract-page link into the matching PDF link.

        A version suffix (``v2``) is dropped. URLs that are not arXiv
        ``/abs/`` links are returned unchanged.
        """
        match = re.search(r"arxiv\.org/abs/(\d+\.\d+)(?:v\d+)?", url, re.IGNORECASE)
        if match:
            return f"https://arxiv.org/pdf/{match.group(1)}.pdf"
        return url

    @classmethod
    def _strip_trailing_punctuation(cls, url: str) -> str:
        """Remove sentence punctuation and unbalanced ')' that the regexes swallow.

        The URL patterns accept characters such as ``.``, ``,`` and ``)``
        inside a path, so "see https://host/a.pdf)." would otherwise yield a
        URL ending in ")." and fail to download.
        """
        while url:
            last = url[-1]
            if last in cls._TRAILING_PUNCTUATION:
                url = url[:-1]
            elif last == ")" and url.count(")") > url.count("("):
                url = url[:-1]
            else:
                break
        return url

    @classmethod
    def extract_urls(cls, text: str) -> List[str]:
        """Extract URLs from *text*.

        Handles ``@https://...`` mentions, http/https/ftp URLs and scheme-less
        ``host/path`` references (which get an ``https://`` prefix). arXiv
        abstract links are converted to PDF links.

        Returns:
            Unique URLs in order of first appearance.
        """
        # Special case first: URLs prefixed with "@".
        candidates = re.findall(r"@(https?://[^\s]+)", text, re.IGNORECASE)
        for pattern in cls.URL_PATTERNS:
            candidates.extend(re.findall(pattern, text, re.IGNORECASE))

        unique_urls: List[str] = []
        seen = set()
        for candidate in candidates:
            # The patterns match case-insensitively, so the scheme test must too;
            # otherwise "HTTPS://host" would be prefixed with a second scheme.
            if not candidate.lower().startswith(("http://", "https://", "ftp://")):
                candidate = "https://" + candidate

            candidate = cls._strip_trailing_punctuation(candidate).rstrip("/")
            url = cls.convert_arxiv_url(candidate)
            if url not in seen:
                seen.add(url)
                unique_urls.append(url)

        return unique_urls

    @staticmethod
    def infer_filename_from_url(url: str) -> str:
        """Derive a local file name from *url*.

        The last path component is used when it has an extension. arXiv PDF
        links get a ``.pdf`` suffix when missing. Otherwise a name is built
        from the last path component (or the domain) plus a timestamp, with an
        extension guessed from keywords in the path (defaulting to ``.html``).
        """
        parsed = urlparse(url)
        path = unquote(parsed.path)
        filename = os.path.basename(path)

        # Special case: arXiv PDF links usually carry no extension.
        if "arxiv.org" in parsed.netloc and "/pdf/" in path:
            if filename:
                if not filename.lower().endswith((".pdf", ".doc", ".docx", ".txt")):
                    filename = f"{filename}.pdf"
            else:
                path_parts = [p for p in path.split("/") if p]
                if path_parts and path_parts[-1]:
                    filename = f"{path_parts[-1]}.pdf"
                else:
                    timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
                    filename = f"arxiv_paper_{timestamp}.pdf"

        # No file name, or no extension: generate one.
        elif not filename or "." not in filename:
            domain = parsed.netloc.replace("www.", "").replace(".", "_")
            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")

            if not path or path == "/":
                filename = f"{domain}_{timestamp}.html"
            else:
                # Use the last non-empty path component as the stem.
                path_parts = [p for p in path.split("/") if p]
                if path_parts:
                    filename = f"{path_parts[-1]}_{timestamp}"
                else:
                    filename = f"{domain}_{timestamp}"

                # Still no extension: guess the file type from path keywords.
                if "." not in filename:
                    lowered = path.lower()
                    if "/pdf/" in lowered or lowered.endswith("pdf"):
                        filename += ".pdf"
                    elif any(key in lowered for key in ("/doc/", "/word/", ".docx")):
                        filename += ".docx"
                    elif any(
                        key in lowered for key in ("/ppt/", "/powerpoint/", ".pptx")
                    ):
                        filename += ".pptx"
                    elif any(key in lowered for key in ("/csv/", ".csv")):
                        filename += ".csv"
                    elif any(key in lowered for key in ("/zip/", ".zip")):
                        filename += ".zip"
                    else:
                        filename += ".html"

        return filename


class PathExtractor:
    """Extract the destination path from a natural-language instruction."""

    # ASCII-only word boundaries. ``\b`` is not used because CJK characters
    # count as word characters, which would stop "请save to x" from matching.
    _WORD_START = r"(?<![A-Za-z0-9_])"
    _WORD_END = r"(?![A-Za-z0-9_])"

    # Tried in order; group 1 is the path. English keywords are anchored on
    # word boundaries so they do not fire inside longer words ("replace in",
    # "format directory", "outputs").
    _TARGET_PATTERNS = (
        _WORD_START
        + r'(?:save|download|store|put|place|write|copy|move)\s+(?:to|into|in|at)\s+["\']?([^\s"\']+)["\']?',
        _WORD_START
        + r"(?:to|into|in|at)\s+(?:folder|directory|dir|path|location)"
        + _WORD_END
        + r'\s*["\']?([^\s"\']+)["\']?',
        _WORD_START
        + r"(?:destination|target|output)"
        + _WORD_END
        + r'\s*(?:is|:)?\s*["\']?([^\s"\']+)["\']?',
        r'(?:保存|下载|存储|放到|写入|复制|移动)(?:到|至|去)\s*["\']?([^\s"\']+)["\']?',
        r'(?:到|在|至)\s*["\']?([^\s"\']+)["\']?\s*(?:文件夹|目录|路径|位置)',
    )

    # Placeholder words that follow a preposition but do not name a path.
    _FILTER_WORDS = frozenset(
        {
            "here",
            "there",
            "current",
            "local",
            "this",
            "that",
            "这里",
            "那里",
            "当前",
            "本地",
            "这个",
            "那个",
        }
    )

    @staticmethod
    def extract_target_path(text: str) -> Optional[str]:
        """Extract the target path from *text*.

        Returns:
            The first captured path that is not a placeholder word, with
            surrounding sentence punctuation removed, or None when no pattern
            yields a usable path.
        """
        for pattern in PathExtractor._TARGET_PATTERNS:
            match = re.search(pattern, text, re.IGNORECASE)
            if not match:
                continue
            path = match.group(1).strip("。，,.、")
            if path and path.lower() not in PathExtractor._FILTER_WORDS:
                return path

        return None


class SimplePdfConverter:
    """Simple PDF converter that extracts plain text with PyPDF2."""

    def convert_pdf_to_markdown(
        self, input_file: str, output_file: Optional[str] = None
    ) -> Dict[str, Any]:
        """
        Convert a PDF to a Markdown file using PyPDF2 text extraction.

        Each page with non-empty text becomes a ``## Page N`` section.

        Args:
            input_file: Path of the input PDF.
            output_file: Path of the Markdown file to write (optional;
                defaults to the input path with a ``.md`` extension).

        Returns:
            A result dictionary. On success it holds "success", "input_file",
            "output_file", "input_size", "output_size", "duration",
            "markdown_content" and "pages_extracted" (the total page count of
            the PDF). On failure it holds "success" and "error" (plus
            "input_file" for conversion errors). Errors are reported through
            the dictionary rather than raised.
        """
        if not PYPDF2_AVAILABLE:
            return {"success": False, "error": "PyPDF2 package is not available"}

        try:
            if not os.path.exists(input_file):
                return {
                    "success": False,
                    "error": f"Input file not found: {input_file}",
                }

            # Derive the output name from the input when none was given.
            if not output_file:
                output_file = f"{os.path.splitext(input_file)[0]}.md"

            output_dir = os.path.dirname(output_file)
            if output_dir:
                os.makedirs(output_dir, exist_ok=True)

            start_time = datetime.now()

            page_sections = []
            with open(input_file, "rb") as file:
                pdf_reader = PyPDF2.PdfReader(file)
                # Read everything needed from the reader while the file is
                # still open; the reader parses lazily from this stream.
                total_pages = len(pdf_reader.pages)

                for page_num, page in enumerate(pdf_reader.pages, 1):
                    # extract_text() can yield None for pages without a text
                    # layer; treat that as an empty page instead of failing.
                    text = (page.extract_text() or "").strip()
                    if text:
                        page_sections.append(f"## Page {page_num}\n\n{text}\n\n")

            markdown_content = "".join(
                [
                    f"# Extracted from {os.path.basename(input_file)}\n\n",
                    f"*Total pages: {total_pages}*\n\n",
                    "---\n\n",
                    *page_sections,
                ]
            )

            with open(output_file, "w", encoding="utf-8") as f:
                f.write(markdown_content)

            duration = (datetime.now() - start_time).total_seconds()

            return {
                "success": True,
                "input_file": input_file,
                "output_file": output_file,
                "input_size": os.path.getsize(input_file),
                "output_size": os.path.getsize(output_file),
                "duration": duration,
                "markdown_content": markdown_content,
                "pages_extracted": total_pages,
            }

        except Exception as e:
            return {
                "success": False,
                "input_file": input_file,
                "error": f"Conversion failed: {str(e)}",
            }


class DoclingConverter:
    """Document converter that uses docling to produce Markdown, with optional image extraction."""

    # Extensions accepted for conversion, for local files and URLs alike.
    SUPPORTED_EXTENSIONS = (".pdf", ".docx", ".pptx", ".html", ".md", ".txt")

    # Image formats written as-is; anything else is saved with a .png suffix.
    _IMAGE_FORMATS = ("png", "jpg", "jpeg", "gif", "bmp", "webp")

    def __init__(self):
        """Create the underlying docling converter.

        Raises:
            ImportError: If the docling package is not installed.
        """
        if not DOCLING_AVAILABLE:
            raise ImportError(
                "docling package is not available. Please install it first."
            )

        # PDF pipeline options
        pdf_pipeline_options = PdfPipelineOptions()
        # OCR is disabled for now to avoid authentication problems.
        pdf_pipeline_options.do_ocr = False
        # Table-structure recognition is disabled for now.
        pdf_pipeline_options.do_table_structure = False

        try:
            self.converter = DocumentConverter(
                format_options={
                    InputFormat.PDF: PdfFormatOption(
                        pipeline_options=pdf_pipeline_options
                    )
                }
            )
        except Exception:
            # Fall back to the default configuration if the custom one is rejected.
            self.converter = DocumentConverter()

    def is_supported_format(self, file_path: str) -> bool:
        """Return True when docling is available and the file extension is supported."""
        if not DOCLING_AVAILABLE:
            return False

        file_extension = os.path.splitext(file_path)[1].lower()
        return file_extension in self.SUPPORTED_EXTENSIONS

    def is_url(self, path: str) -> bool:
        """Return True when *path* is an http(s) URL."""
        try:
            return urlparse(path).scheme in ("http", "https")
        except Exception:
            return False

    def _url_has_supported_extension(self, url: str) -> bool:
        """Return True when *url* points at a supported document type.

        The extension is looked up in the URL *path*, so a query string or
        fragment (``paper.pdf?download=1``) does not hide it. URLs whose full
        text ends with a supported extension are still accepted as before.
        """
        lowered = url.lower()
        if lowered.endswith(self.SUPPORTED_EXTENSIONS):
            return True
        try:
            url_path = urlparse(lowered).path
        except Exception:
            return False
        return url_path.endswith(self.SUPPORTED_EXTENSIONS)

    def extract_images(self, doc, output_dir: str) -> Dict[str, str]:
        """
        Save the images of a converted document below ``<output_dir>/images``.

        Args:
            doc: docling document object; its ``images`` attribute is read if
                present (each image's ``format``, ``data`` and ``id`` are
                looked up with defaults).
            output_dir: Directory that receives the ``images`` sub-directory.

        Returns:
            Mapping of image id to the saved file's path relative to
            *output_dir*. Images without data or that fail to save are skipped.
        """
        images_dir = os.path.join(output_dir, "images")
        os.makedirs(images_dir, exist_ok=True)
        image_map = {}  # docling image id -> path relative to output_dir

        try:
            images = getattr(doc, "images", [])

            for idx, img in enumerate(images):
                try:
                    # Image format, defaulting to png for missing/unknown formats.
                    ext = getattr(img, "format", None) or "png"
                    if ext.lower() not in self._IMAGE_FORMATS:
                        ext = "png"

                    filename = f"image_{idx+1}.{ext}"
                    filepath = os.path.join(images_dir, filename)

                    img_data = getattr(img, "data", None)
                    if img_data:
                        with open(filepath, "wb") as f:
                            f.write(img_data)

                        rel_path = os.path.relpath(filepath, output_dir)
                        img_id = getattr(img, "id", str(idx + 1))
                        image_map[img_id] = rel_path

                except Exception as img_error:
                    # One bad image must not abort the others.
                    print(f"Warning: Failed to extract image {idx+1}: {img_error}")
                    continue

        except Exception as e:
            print(f"Warning: Failed to extract images: {e}")

        return image_map

    def process_markdown_with_images(
        self, markdown_content: str, image_map: Dict[str, str]
    ) -> str:
        """
        Replace docling image placeholders with links to the extracted files.

        Args:
            markdown_content: Original Markdown content.
            image_map: Mapping of image id to local path.

        Returns:
            The Markdown with every ``![Image](docling://image/<id>)`` whose id
            is in *image_map* rewritten; unknown ids are left untouched.
        """

        def replace_img(match):
            img_id = match.group(1)
            if img_id in image_map:
                return f"![Image]({image_map[img_id]})"
            return match.group(0)

        return re.sub(
            r"!\[Image\]\(docling://image/([^)]+)\)", replace_img, markdown_content
        )

    def convert_to_markdown(
        self,
        input_file: str,
        output_file: Optional[str] = None,
        extract_images: bool = True,
    ) -> Dict[str, Any]:
        """
        Convert a document to Markdown, optionally extracting its images.

        Args:
            input_file: Input file path or http(s) URL.
            output_file: Output Markdown path (optional; derived from the
                input name when omitted).
            extract_images: Whether to extract images (default True).

        Returns:
            A result dictionary with "success" and, on success, "input_file",
            "output_file", "input_size" (0 for URLs), "output_size",
            "duration", "markdown_content", "images_extracted" and
            "image_map"; on failure an "error" message. Errors are reported
            through the dictionary rather than raised.
        """
        if not DOCLING_AVAILABLE:
            return {"success": False, "error": "docling package is not available"}

        try:
            source_is_url = self.is_url(input_file)

            if not source_is_url:
                if not os.path.exists(input_file):
                    return {
                        "success": False,
                        "error": f"Input file not found: {input_file}",
                    }

                if not self.is_supported_format(input_file):
                    return {
                        "success": False,
                        "error": f"Unsupported file format: {os.path.splitext(input_file)[1]}",
                    }
            elif not self._url_has_supported_extension(input_file):
                return {
                    "success": False,
                    "error": f"Unsupported URL format: {input_file}",
                }

            # Derive the output name when none was given.
            if not output_file:
                if source_is_url:
                    filename = URLExtractor.infer_filename_from_url(input_file)
                    base_name = os.path.splitext(filename)[0]
                else:
                    base_name = os.path.splitext(input_file)[0]
                output_file = f"{base_name}.md"

            output_dir = os.path.dirname(output_file) or "."
            os.makedirs(output_dir, exist_ok=True)

            start_time = datetime.now()
            result = self.converter.convert(input_file)
            doc = result.document

            image_map = {}
            images_extracted = 0
            if extract_images:
                image_map = self.extract_images(doc, output_dir)
                images_extracted = len(image_map)

            markdown_content = doc.export_to_markdown()

            # Point image placeholders at the extracted files.
            if extract_images and image_map:
                markdown_content = self.process_markdown_with_images(
                    markdown_content, image_map
                )

            with open(output_file, "w", encoding="utf-8") as f:
                f.write(markdown_content)

            duration = (datetime.now() - start_time).total_seconds()

            # The size of a remote input is not known here.
            input_size = 0 if source_is_url else os.path.getsize(input_file)
            output_size = os.path.getsize(output_file)

            return {
                "success": True,
                "input_file": input_file,
                "output_file": output_file,
                "input_size": input_size,
                "output_size": output_size,
                "duration": duration,
                "markdown_content": markdown_content,
                "images_extracted": images_extracted,
                "image_map": image_map,
            }

        except Exception as e:
            return {
                "success": False,
                "input_file": input_file,
                "error": f"Conversion failed: {str(e)}",
            }


async def check_url_accessible(url: str) -> Dict[str, Any]:
    """Probe *url* and report whether it can be fetched.

    A HEAD request is tried first. Some servers reject HEAD outright
    (403/405/501) even though GET works, so for those statuses the probe is
    repeated with GET; the body is not read.

    Returns:
        A dictionary with "accessible" (status below 400), "status",
        "content_type" and "content_length" (the raw header value, or 0 when
        absent). Any exception yields accessible=False with status 0.
    """
    # Statuses that commonly mean "HEAD is not supported here".
    head_rejected_statuses = (403, 405, 501)

    def describe(response) -> Dict[str, Any]:
        return {
            "accessible": response.status < 400,
            "status": response.status,
            "content_type": response.headers.get("Content-Type", ""),
            "content_length": response.headers.get("Content-Length", 0),
        }

    try:
        timeout = aiohttp.ClientTimeout(total=10)
        async with aiohttp.ClientSession(timeout=timeout) as session:
            async with session.head(url, allow_redirects=True) as response:
                if response.status not in head_rejected_statuses:
                    return describe(response)

            # Leaving the context without reading releases the connection.
            async with session.get(url, allow_redirects=True) as response:
                return describe(response)
    except Exception:
        return {
            "accessible": False,
            "status": 0,
            "content_type": "",
            "content_length": 0,
        }


async def download_file(url: str, destination: str) -> Dict[str, Any]:
    """Download a single file from *url* to *destination*.

    The data is streamed to ``<destination>.part`` and renamed onto
    *destination* only after the transfer completed. A failed or interrupted
    download therefore never leaves a truncated file at *destination* (which
    later runs would mistake for an already downloaded file) and never
    clobbers an existing one.

    Returns:
        On success: "success", "url", "destination", "size" (bytes),
        "content_type", "duration" (seconds) and "speed" (bytes/second).
        On failure: "success", "url", "destination" and "error". Errors are
        reported through the dictionary rather than raised.
    """
    start_time = datetime.now()
    chunk_size = 8192
    partial_path = f"{destination}.part"

    def failure(prefix: str, exc: Exception) -> Dict[str, Any]:
        # Best-effort cleanup: the partial file may not exist at all.
        try:
            os.remove(partial_path)
        except OSError:
            pass
        # Some exceptions (e.g. timeouts) have an empty message; fall back to
        # the type name so the report is never blank.
        detail = str(exc) or type(exc).__name__
        return {
            "success": False,
            "url": url,
            "destination": destination,
            "error": f"{prefix}: {detail}",
        }

    try:
        timeout = aiohttp.ClientTimeout(total=300)  # 5-minute limit
        async with aiohttp.ClientSession(timeout=timeout) as session:
            async with session.get(url) as response:
                response.raise_for_status()

                content_type = response.headers.get(
                    "Content-Type", "application/octet-stream"
                )

                # Make sure the target directory exists.
                parent_dir = os.path.dirname(destination)
                if parent_dir:
                    os.makedirs(parent_dir, exist_ok=True)

                downloaded = 0
                async with aiofiles.open(partial_path, "wb") as file:
                    async for chunk in response.content.iter_chunked(chunk_size):
                        await file.write(chunk)
                        downloaded += len(chunk)

                # Publish the finished file under its final name.
                os.replace(partial_path, destination)

                duration = (datetime.now() - start_time).total_seconds()

                return {
                    "success": True,
                    "url": url,
                    "destination": destination,
                    "size": downloaded,
                    "content_type": content_type,
                    "duration": duration,
                    "speed": downloaded / duration if duration > 0 else 0,
                }

    except aiohttp.ClientError as e:
        return failure("Network error", e)
    except Exception as e:
        return failure("Download error", e)


async def move_local_file(source_path: str, destination: str) -> Dict[str, Any]:
    """Copy a local file to *destination*, leaving the original in place.

    Despite the name, nothing is moved: the file is copied with
    ``shutil.copy2`` so the source cannot be lost.

    Returns:
        On success: "success", "source", "destination", "size" (bytes of the
        source), "duration" (seconds) and "operation" ("copy").
        On failure: "success", "source", "destination" and "error".
    """
    began = datetime.now()

    def failed(reason: str) -> Dict[str, Any]:
        return {
            "success": False,
            "source": source_path,
            "destination": destination,
            "error": reason,
        }

    try:
        if not os.path.exists(source_path):
            return failed(f"Source file not found: {source_path}")

        byte_count = os.path.getsize(source_path)

        # Create the target directory when the destination names one.
        target_dir = os.path.dirname(destination)
        if target_dir:
            os.makedirs(target_dir, exist_ok=True)

        # Copy (not move) so the original is preserved.
        shutil.copy2(source_path, destination)

        elapsed = (datetime.now() - began).total_seconds()
        return {
            "success": True,
            "source": source_path,
            "destination": destination,
            "size": byte_count,
            "duration": elapsed,
            "operation": "copy",
        }
    except Exception as e:
        return failed(f"Copy error: {str(e)}")


def _build_destination_path(target_path: Optional[str], filename: str) -> str:
    """Combine the requested target path with *filename*.

    Without a target the file goes to the current directory. A target with a
    file extension is taken as the full file path; any other target is taken
    as a directory. ``~`` is expanded and relative targets are normalised.
    """
    if not target_path:
        return filename

    if target_path.startswith("~"):
        target_path = os.path.expanduser(target_path)

    if not os.path.isabs(target_path):
        target_path = os.path.normpath(target_path)

    if os.path.splitext(target_path)[1]:  # has an extension: a file path
        return target_path
    return os.path.join(target_path, filename)  # otherwise a directory


def _is_same_location(first: str, second: str) -> bool:
    """Return True when both paths name the same filesystem location."""

    def canonical(path: str) -> str:
        return os.path.normcase(os.path.abspath(os.path.expanduser(path)))

    return canonical(first) == canonical(second)


@mcp.tool()
async def download_files(instruction: str) -> str:
    """
    Download files from URLs or move local files mentioned in natural language instructions.

    Args:
        instruction: Natural language instruction containing URLs/local paths and optional destination paths

    Returns:
        Status message about the download/move operations

    Examples:
        - "Download https://example.com/file.pdf to documents folder"
        - "Move /home/user/file.pdf to documents folder"
        - "Please get https://raw.githubusercontent.com/user/repo/main/data.csv and save it to ~/downloads"
        - "移动 ~/Desktop/report.docx 到 /tmp/documents/"
        - "Download www.example.com/report.xlsx"
    """
    urls = URLExtractor.extract_urls(instruction)
    target_path = PathExtractor.extract_target_path(instruction)

    # The path extractor also picks up the destination itself and scheme-less
    # URLs ("www.example.com/a.pdf"). Neither is a source file, and treating
    # them as one only produces spurious "not found"/"already exists" reports.
    known_urls = set(urls)
    local_paths = []
    for candidate in LocalPathExtractor.extract_local_paths(instruction):
        if target_path and _is_same_location(candidate, target_path):
            continue
        if (
            not os.path.exists(candidate)
            and f"https://{candidate.rstrip('/')}" in known_urls
        ):
            continue
        local_paths.append(candidate)

    if not urls and not local_paths:
        return format_error_message(
            "Failed to parse instruction",
            "No downloadable URLs or movable local files found",
        )

    results = []

    # URL downloads
    for url in urls:
        try:
            filename = URLExtractor.infer_filename_from_url(url)
            destination = _build_destination_path(target_path, filename)

            # Never overwrite an existing file.
            if os.path.exists(destination):
                results.append(
                    f"[WARNING] Skipped {url}: File already exists at {destination}"
                )
                continue

            # Probe the URL before starting the download.
            check_result = await check_url_accessible(url)
            if not check_result["accessible"]:
                results.append(
                    f"[ERROR] Failed to access {url}: HTTP {check_result['status'] or 'Connection failed'}"
                )
                continue

            result = await download_file(url, destination)

            # Convert the document when the download succeeded.
            conversion_msg = None
            if result["success"]:
                conversion_msg = await perform_document_conversion(
                    destination, extract_images=True
                )

            msg = format_file_operation_result(
                "download", url, destination, result, conversion_msg
            )

        except Exception as e:
            msg = f"[ERROR] Failed to download: {url}\n"
            msg += f"   Error: {str(e)}"

        results.append(msg)

    # Local files (copied, so the originals are preserved)
    for local_path in local_paths:
        try:
            filename = os.path.basename(local_path)
            destination = _build_destination_path(target_path, filename)

            # Never overwrite an existing file.
            if os.path.exists(destination):
                results.append(
                    f"[WARNING] Skipped {local_path}: File already exists at {destination}"
                )
                continue

            result = await move_local_file(local_path, destination)

            # Convert the document when the copy succeeded.
            conversion_msg = None
            if result["success"]:
                conversion_msg = await perform_document_conversion(
                    destination, extract_images=True
                )

            msg = format_file_operation_result(
                "copy", local_path, destination, result, conversion_msg
            )

        except Exception as e:
            msg = f"[ERROR] Failed to copy: {local_path}\n"
            msg += f"   Error: {str(e)}"

        results.append(msg)

    return "\n\n".join(results)


@mcp.tool()
async def parse_download_urls(text: str) -> str:
    """
    Extract URLs, local paths and target paths from text without downloading or moving.

    Args:
        text: Text containing URLs, local paths and optional destination paths

    Returns:
        Parsed URLs, local paths and target path information
    """
    found_urls = URLExtractor.extract_urls(text)
    found_files = LocalPathExtractor.extract_local_paths(text)
    target_path = PathExtractor.extract_target_path(text)

    # Collect the report piece by piece and join once at the end.
    pieces = ["📋 Parsed file operation information:\n\n"]

    # URLs, each with the file name it would be stored under.
    if not found_urls:
        pieces.append("🔗 No URLs found\n")
    else:
        pieces.append(f"🔗 URLs found ({len(found_urls)}):\n")
        for position, link in enumerate(found_urls, 1):
            inferred_name = URLExtractor.infer_filename_from_url(link)
            pieces.append(f"  {position}. {link}\n     📄 Filename: {inferred_name}\n")

    # Local files, with existence and size information.
    if not found_files:
        pieces.append("\n📁 No local files found\n")
    else:
        pieces.append(f"\n📁 Local files found ({len(found_files)}):\n")
        for position, file_path in enumerate(found_files, 1):
            present = os.path.exists(file_path)
            pieces.append(f"  {position}. {file_path}\n")
            pieces.append(f"     ✅ Exists: {'Yes' if present else 'No'}\n")
            if present:
                megabytes = os.path.getsize(file_path) / (1024 * 1024)
                pieces.append(f"     📊 Size: {megabytes:.2f} MB\n")

    # Destination, showing the expanded form of "~" paths.
    if not target_path:
        pieces.append("\n🎯 Target path: Not specified (will use current directory)")
    else:
        pieces.append(f"\n🎯 Target path: {target_path}")
        if target_path.startswith("~"):
            pieces.append(f"\n   (Expanded: {os.path.expanduser(target_path)})")

    return "".join(pieces)


@mcp.tool()
async def download_file_to(
    url: str, destination: Optional[str] = None, filename: Optional[str] = None
) -> str:
    """
    Download a specific file with detailed options.

    The ``url`` argument is passed through ``URLExtractor.extract_urls`` and the
    first extracted URL is used. When ``filename`` is given, its base name is
    kept but the extension inferred from the URL (if any) takes precedence over
    the extension of ``filename``.

    Args:
        url: URL to download from
        destination: Target directory or full file path (optional)
        filename: Specific filename to use (optional, ignored if destination is a full file path)

    Returns:
        Status message about the download operation. Problems (no URL found,
        existing target, inaccessible URL, failed download) are reported in the
        returned text rather than raised.
    """
    # Normalize the input through the shared extractor; bail out with a
    # readable message instead of an IndexError when nothing usable is found.
    extracted_urls = URLExtractor.extract_urls(url)
    if not extracted_urls:
        return format_error_message(
            "Download aborted", f"No valid URL found in: {url}"
        )
    url = extracted_urls[0]

    # Determine the file name.
    inferred_filename = URLExtractor.infer_filename_from_url(url)
    if not filename:
        filename = inferred_filename
    if filename:
        # Keep the requested base name, but prefer the extension implied by the
        # URL so the saved file matches the downloaded content type.
        _, extension_source = os.path.splitext(
            os.path.basename(inferred_filename or "")
        )
        name_destination, extension_destination = os.path.splitext(
            os.path.basename(filename)
        )
        filename = name_destination + (extension_source or extension_destination)

    # Determine the full target path.
    if destination:
        # Expand the user's home directory.
        if destination.startswith("~"):
            destination = os.path.expanduser(destination)

        if os.path.splitext(destination)[1]:
            # An extension means the destination is already a full file path.
            target_path = destination
        else:
            # Otherwise it is treated as a directory and needs a file name.
            target_path = os.path.join(destination, filename) if filename else None
    else:
        target_path = filename

    if not target_path:
        return format_error_message(
            "Download aborted", f"Could not determine a filename for {url}"
        )

    # Normalize relative paths (absolute paths are left untouched).
    if not os.path.isabs(target_path):
        target_path = os.path.normpath(target_path)

    # Never overwrite an existing file.
    if os.path.exists(target_path):
        return format_error_message(
            "Download aborted", f"File already exists at {target_path}"
        )

    # Probe the URL before downloading.
    check_result = await check_url_accessible(url)
    if not check_result["accessible"]:
        return format_error_message(
            "Cannot access URL",
            f"{url} (HTTP {check_result['status'] or 'Connection failed'})",
        )

    # Build the informational header; a missing or malformed content length
    # simply omits the expected-size line.
    try:
        size_mb = (
            int(check_result["content_length"]) / (1024 * 1024)
            if check_result["content_length"]
            else 0
        )
    except (TypeError, ValueError):
        size_mb = 0
    msg = "[INFO] Downloading file:\n"
    msg += f"   URL: {url}\n"
    msg += f"   Target: {target_path}\n"
    if size_mb > 0:
        msg += f"   Expected size: {size_mb:.2f} MB\n"
    msg += "\n"

    # Perform the download.
    result = await download_file(url, target_path)
    if not result["success"]:
        return msg + f"[ERROR] Download failed!\n   Error: {result['error']}"

    # Convert the downloaded document after a successful download.
    conversion_msg = await perform_document_conversion(
        target_path, extract_images=True
    )

    actual_size_mb = result["size"] / (1024 * 1024)
    speed_mb = result["speed"] / (1024 * 1024)
    info_msg = "[SUCCESS] Download completed!\n"
    info_msg += f"   Saved to: {target_path}\n"
    info_msg += f"   Size: {actual_size_mb:.2f} MB\n"
    info_msg += f"   Duration: {result['duration']:.2f} seconds\n"
    info_msg += f"   Speed: {speed_mb:.2f} MB/s\n"
    info_msg += f"   Type: {result['content_type']}"

    if conversion_msg:
        info_msg += conversion_msg

    return msg + info_msg


@mcp.tool()
async def move_file_to(
    source: str, destination: Optional[str] = None, filename: Optional[str] = None
) -> str:
    """
    Copy a local file to a new location (preserves original file).

    Note: Despite the name "move_file_to", this tool COPIES the file to preserve the original.
    This prevents data loss during file processing workflows.

    Args:
        source: Source file path to copy
        destination: Target directory or full file path (optional)
        filename: Specific filename to use (optional, ignored if destination is a full file path)

    Returns:
        Status message about the copy operation
    """
    # Resolve "~" in the source path, then make sure the source is there.
    src_path = os.path.expanduser(source) if source.startswith("~") else source
    if not os.path.exists(src_path):
        return format_error_message(
            "Copy aborted", f"Source file not found: {src_path}"
        )

    # Pick the file name: the source's own name by default; otherwise the
    # requested base name, with the source extension winning when it exists.
    source_ext = os.path.splitext(os.path.basename(src_path))[1]
    if filename:
        stem, requested_ext = os.path.splitext(os.path.basename(filename))
        final_name = stem + (source_ext if source_ext else requested_ext)
    else:
        final_name = os.path.basename(src_path)

    # Work out the full target path.
    if not destination:
        copy_target = final_name
    else:
        dest_root = (
            os.path.expanduser(destination)
            if destination.startswith("~")
            else destination
        )
        # A destination with an extension is a complete file path; anything
        # else is treated as a directory.
        if os.path.splitext(dest_root)[1]:
            copy_target = dest_root
        else:
            copy_target = os.path.join(dest_root, final_name)

    # Normalize relative paths (absolute paths are left untouched).
    if not os.path.isabs(copy_target):
        copy_target = os.path.normpath(copy_target)

    # Refuse to overwrite an existing target.
    if os.path.exists(copy_target):
        return f"[ERROR] Target file already exists: {copy_target}"

    # Informational header shown before the outcome.
    size_in_mb = os.path.getsize(src_path) / (1024 * 1024)
    header = "".join(
        [
            "[INFO] Copying file (original preserved):\n",
            f"   Source: {src_path}\n",
            f"   Target: {copy_target}\n",
            f"   Size: {size_in_mb:.2f} MB\n",
            "\n",
        ]
    )

    # Perform the copy (the original file is kept).
    outcome = await move_local_file(src_path, copy_target)
    if not outcome["success"]:
        return header + f"[ERROR] Copy failed!\n   Error: {outcome['error']}"

    # Convert the copied document after a successful copy.
    conversion_note = await perform_document_conversion(
        copy_target, extract_images=True
    )

    summary = "[SUCCESS] File copied successfully (original preserved)!\n"
    summary += f"   From: {src_path}\n"
    summary += f"   To: {copy_target}\n"
    summary += f"   Duration: {outcome['duration']:.2f} seconds"
    if conversion_note:
        summary += conversion_note

    return header + summary


# @mcp.tool()
# async def convert_document_to_markdown(
#     file_path: str, output_path: Optional[str] = None, extract_images: bool = True
# ) -> str:
#     """
#     Convert a document to Markdown format with image extraction support.

#     Supports both local files and URLs. Uses docling for advanced conversion with image extraction,
#     or falls back to PyPDF2 for simple PDF text extraction.

#     Args:
#         file_path: Path to the input document file or URL (supports PDF, DOCX, PPTX, HTML, TXT, MD)
#         output_path: Path for the output Markdown file (optional, auto-generated if not provided)
#         extract_images: Whether to extract images from the document (default: True)

#     Returns:
#         Status message about the conversion operation with preview of converted content

#     Examples:
#         - "convert_document_to_markdown('paper.pdf')"
#         - "convert_document_to_markdown('https://example.com/doc.pdf', 'output.md')"
#         - "convert_document_to_markdown('presentation.pptx', extract_images=False)"
#     """
#     # 检查是否为URL
#     is_url_input = False
#     try:
#         parsed = urlparse(file_path)
#         is_url_input = parsed.scheme in ("http", "https")
#     except Exception:
#         is_url_input = False

#     # 检查文件是否存在（如果不是URL）
#     if not is_url_input and not os.path.exists(file_path):
#         return f"[ERROR] Input file not found: {file_path}"

#     # 检查是否是PDF文件，优先使用简单转换器（仅对本地文件）
#     if (
#         not is_url_input
#         and file_path.lower().endswith(".pdf")
#         and PYPDF2_AVAILABLE
#         and not extract_images
#     ):
#         try:
#             simple_converter = SimplePdfConverter()
#             result = simple_converter.convert_pdf_to_markdown(file_path, output_path)
#         except Exception as e:
#             return f"[ERROR] PDF conversion error: {str(e)}"
#     elif DOCLING_AVAILABLE:
#         try:
#             converter = DoclingConverter()

#             # 检查文件格式是否支持
#             if not is_url_input and not converter.is_supported_format(file_path):
#                 supported_formats = [".pdf", ".docx", ".pptx", ".html", ".md", ".txt"]
#                 return f"[ERROR] Unsupported file format. Supported formats: {', '.join(supported_formats)}"
#             elif is_url_input and not file_path.lower().endswith(
#                 (".pdf", ".docx", ".pptx", ".html", ".md", ".txt")
#             ):
#                 return f"[ERROR] Unsupported URL format: {file_path}"

#             # 执行转换（支持图片提取）
#             result = converter.convert_to_markdown(
#                 file_path, output_path, extract_images
#             )
#         except Exception as e:
#             return f"[ERROR] Docling conversion error: {str(e)}"
#     else:
#         return (
#             "[ERROR] No conversion tools available. Please install docling or PyPDF2."
#         )

#     if result["success"]:
#         msg = "[SUCCESS] Document converted successfully!\n"
#         msg += f"   Input: {result['input_file']}\n"
#         msg += f"   Output file: {result['output_file']}\n"
#         msg += f"   Conversion time: {result['duration']:.2f} seconds\n"

#         if result["input_size"] > 0:
#             msg += f"   Original size: {result['input_size'] / 1024:.1f} KB\n"
#         msg += f"   Markdown size: {result['output_size'] / 1024:.1f} KB\n"

#         # 显示图片提取信息
#         if extract_images and "images_extracted" in result:
#             images_count = result["images_extracted"]
#             if images_count > 0:
#                 msg += f"   Images extracted: {images_count}\n"
#                 msg += f"   Images saved to: {os.path.join(os.path.dirname(result['output_file']), 'images')}\n"
#             else:
#                 msg += "   No images found in document\n"

#         # 显示Markdown内容的前几行作为预览
#         content_lines = result["markdown_content"].split("\n")
#         preview_lines = content_lines[:5]
#         if len(content_lines) > 5:
#             preview_lines.append("...")

#         msg += "\n[PREVIEW] First few lines of converted Markdown:\n"
#         for line in preview_lines:
#             msg += f"   {line}\n"
#     else:
#         msg = "[ERROR] Conversion failed!\n"
#         msg += f"   Error: {result['error']}"

#     return msg


if __name__ == "__main__":
    # Startup banner.
    for banner_line in (
        "📄 Smart PDF Downloader MCP Tool",
        "📝 Starting server with FastMCP...",
    ):
        print(banner_line)

    # Report whether document conversion is available in this environment.
    if not DOCLING_AVAILABLE:
        print("❌ Document conversion to Markdown is DISABLED (docling not available)")
        print("   Install docling to enable: pip install docling")
    else:
        print("✅ Document conversion to Markdown is ENABLED (docling available)")

    # One summary line per advertised tool.
    tool_summaries = (
        "  • download_files - Download files or move local files from natural language",
        "  • parse_download_urls - Extract URLs, local paths and destination paths",
        "  • download_file_to - Download a specific file with options",
        "  • move_file_to - Move a specific local file with options",
        "  • convert_document_to_markdown - Convert documents to Markdown format",
    )
    print("\nAvailable tools:")
    for summary in tool_summaries:
        print(summary)

    if DOCLING_AVAILABLE:
        print("\nSupported formats: PDF, DOCX, PPTX, HTML, TXT, MD")
        print("Features: Image extraction, Layout preservation, Automatic conversion")

    print("")

    # Run the server.
    mcp.run()


================================================
FILE: tools/pdf_utils.py
================================================
"""
PDF utility functions for the DeepCode agent system.
"""

from pathlib import Path
import PyPDF2


def _clean_pdf_text(value) -> str:
    """Return a metadata value as stripped text with NUL characters removed."""
    # Metadata values may be missing (None) or non-str objects; normalize first.
    return str(value or "").strip().replace("\x00", "")


def _extract_pdf_year(raw_date) -> str:
    """Return the 4-digit year of a PDF date string, or "Unknown Year"."""
    text = _clean_pdf_text(raw_date)
    # PDF date strings are conventionally written as "D:YYYYMMDDHHmmSS...";
    # drop the "D:" prefix so the slice below lands on the year digits.
    if text.startswith("D:"):
        text = text[2:]
    year = text[:4]
    return year if len(year) == 4 and year.isdigit() else "Unknown Year"


def read_pdf_metadata(file_path: Path) -> dict:
    """Read basic metadata (title, authors, year) from a PDF file.

    The document information dictionary is consulted first. When it has no
    title, the first line of the first page is used instead; when it has no
    author, the second and third lines of the first page are scanned for the
    substrings "author" or "by".

    Args:
        file_path: Path of the PDF file to inspect.

    Returns:
        A dict with the keys ``title`` (str), ``authors`` (list of str),
        ``year`` (str) and ``first_lines`` (up to the first 10 lines of text on
        the first page). If anything goes wrong while reading, a placeholder
        dict with ``title == "Error reading PDF"`` is returned; no exception
        propagates to the caller.
    """
    try:
        print(f"\nAttempting to read PDF metadata from: {file_path}")
        with open(file_path, "rb") as file:
            pdf_reader = PyPDF2.PdfReader(file)
            info = pdf_reader.metadata
            first_page = pdf_reader.pages[0]
            # Guard against a page with no extractable text.
            text = first_page.extract_text() or ""
            lines = text.split("\n")[:10]

            title = ""
            authors = []
            year = "Unknown Year"

            if info:
                title = _clean_pdf_text(info.get("/Title"))
                author = _clean_pdf_text(info.get("/Author"))
                if author:
                    authors = [author]
                year = _extract_pdf_year(info.get("/CreationDate"))

            # Fall back to the page text when the metadata is incomplete.
            if not title and lines:
                title = lines[0].strip()

            if not authors and len(lines) > 1:
                for line in lines[1:3]:
                    lowered = line.lower()
                    if "author" in lowered or "by" in lowered:
                        authors = [line.strip()]
                        break

            return {
                "title": title if title else "Unknown Title",
                "authors": authors if authors else ["Unknown Author"],
                "year": year,
                "first_lines": lines,
            }

    except Exception as e:
        # Deliberately best-effort: callers always get a dict back.
        print(f"\nError reading PDF: {str(e)}")
        return {
            "title": "Error reading PDF",
            "authors": ["Unknown"],
            "year": "Unknown",
            "first_lines": [],
        }


================================================
FILE: ui/__init__.py
================================================
"""
UI Module

Streamlit application user interface components module

Contains the following submodules:
- styles: CSS styles
- components: UI components
- layout: Page layout
- handlers: Event handlers
- streamlit_app: Main application
- app: Application entry
"""

# Package metadata.
__version__ = "1.0.0"
__author__ = "DeepCode Team"

# Re-export the main UI building blocks so callers can import them directly
# from the package.
from .layout import main_layout
from .components import display_header, display_features, display_status
from .handlers import initialize_session_state
from .styles import get_main_styles

# Import the application entry point, exposed here as ``streamlit_main``.
try:
    from .streamlit_app import main as streamlit_main
except ImportError:
    # Fallback: put this package's directory on sys.path and import the module
    # by its top-level name when the relative import fails.
    import sys
    import os

    sys.path.insert(0, os.path.dirname(__file__))
    from streamlit_app import main as streamlit_main

# Public API of the package.
__all__ = [
    "main_layout",
    "display_header",
    "display_features",
    "display_status",
    "initialize_session_state",
    "get_main_styles",
    "streamlit_main",
]


================================================
FILE: ui/app.py
================================================
"""
DeepCode UI Application Entry Point

This file serves as the unified entry point for the UI module
"""

from .streamlit_app import main

# Re-export ``main`` so external callers can import it from this module.
__all__ = ["main"]

# Run the application when this module is executed as a script.
if __name__ == "__main__":
    main()


================================================
FILE: ui/components.py
================================================
# -*- coding: utf-8 -*-
"""
Streamlit UI Components - Cyber Edition
Contains all reusable UI components with new styling plus
the operational widgets required by the handlers.
"""

from __future__ import annotations

import html
import base64
import sys
from datetime import datetime
from functools import lru_cache
from pathlib import Path
from typing import Dict, Any, Optional, List, Tuple

import streamlit as st

from utils.cross_platform_file_handler import get_file_handler

# Directory two levels above this file (the parent of the directory that
# contains this module) -- presumably the project root; verify if relocated.
BASE_DIR = Path(__file__).resolve().parents[1]
# Location of the icon images, looked up as "<name>.png" by _icon_data_uri.
ICON_DIR = BASE_DIR / "assets" / "icons"


@lru_cache(maxsize=64)
def _icon_data_uri(name: str) -> str:
    """Return ``<name>.png`` from ICON_DIR as a base64 PNG data URI.

    An empty string is returned when the file does not exist or cannot be
    read. Results (including empty ones) are memoized per icon name.
    """
    icon_file = ICON_DIR / f"{name}.png"
    if icon_file.exists():
        try:
            raw_bytes = icon_file.read_bytes()
        except OSError:
            return ""
        return "data:image/png;base64," + base64.b64encode(raw_bytes).decode("utf-8")
    return ""


def icon_img(name: str, size: int = 32, extra_style: str = "") -> str:
    """
    Build an inline ``<img>`` tag for an icon, embedding it as a data URI.

    The tag is square (``size`` pixels wide and high) and ``extra_style`` is
    appended to its inline style. Returns an empty string when no data URI is
    available for ``name``.
    """
    uri = _icon_data_uri(name)
    if uri:
        inline_css = f"width:{size}px;height:{size}px;{extra_style}"
        return f'<img src="{uri}" alt="{name}" style="{inline_css}"/>'
    return ""


def clear_guided_answer_inputs():
    """Delete every session-state entry whose key starts with "guided_answer_"."""
    # Snapshot the matching keys first so the state is not mutated while it is
    # being iterated.
    stale_keys = []
    for state_key in st.session_state.keys():
        if state_key.startswith("guided_answer_"):
            stale_keys.append(state_key)

    for state_key in stale_keys:
        del st.session_state[state_key]


def display_header():
    """Render the page header: brand title, subtitle and the status indicator."""
    header_markup = """
        <div class="cyber-header">
            <div class="brand-container">
                <div class="brand-title">DEEPCODE</div>
                <div class="brand-subtitle">Autonomous Research & Engineering Matrix</div>
                    </div>
            <div class="status-indicator">
                <div class="status-dot"></div>
                <span>SYSTEM ONLINE</span>
        </div>
    </div>
    """
    # Raw HTML is required because the header relies on custom CSS classes.
    st.markdown(header_markup, unsafe_allow_html=True)


def display_features():
    """Render the grid of feature cards (icon, title and description each)."""
    # (icon name, emoji fallback, title, description) for every card, in order.
    catalog = (
        (
            "feature_synthesis",
            "🧬",
            "Neural Synthesis",
            "Transform research papers directly into executable repositories via multi-agent LLM pipelines.",
        ),
        (
            "feature_hyper",
            "⚡",
            "Hyper-Speed Mode",
            "Acceleration layer that parallelizes retrieval, planning, and implementation for fastest delivery.",
        ),
        (
            "feature_cognition",
            "🧠",
            "Cognitive Context",
            "Semantic memory graphs retain methodology, datasets, and evaluation strategy during reasoning.",
        ),
        (
            "feature_secure",
            "🛡️",
            "Secure Sandbox(Coming Soon)",
            "Isolated execution & validation environment keeps experiments safe and reproducible.",
        ),
    )
    glow_style = "filter:drop-shadow(0 0 10px rgba(0,242,255,0.4));"

    rendered_cards = []
    for icon_name, fallback_glyph, heading, blurb in catalog:
        # Use the PNG icon when available, otherwise fall back to the emoji.
        icon_markup = icon_img(icon_name, 48, glow_style) or (
            f'<span style="font-size:2rem;">{fallback_glyph}</span>'
        )
        card_markup = f"""
        <div class="cyber-card">
            <div class="card-icon">
                {icon_markup}
                </div>
            <div class="card-title">{heading}</div>
            <div class="card-desc">{blurb}</div>
                </div>
        """
        rendered_cards.append(card_markup)

    cards_html = "".join(rendered_cards)
    grid_markup = f"""
        <div class="feature-grid">
            {cards_html}
        </div>
    """
    st.markdown(grid_markup, unsafe_allow_html=True)


def display_status(message: str, status_type: str = "info"):
    """Render a status banner whose accent color depends on ``status_type``.

    Known types are "success", "error", "warning" and "info"; any other value
    uses the primary color. ``message`` is inserted into the HTML as given.
    """
    palette = {
        "success": "var(--success)",
        "error": "var(--error)",
        "warning": "var(--warning)",
        "info": "var(--primary)",
    }
    accent = palette.get(status_type, "var(--primary)")
    badge = status_type.upper()

    banner_markup = f"""
        <div style="padding: 1rem; border-left: 3px solid {accent}; background: rgba(255,255,255,0.03); margin: 1rem 0; border-radius: 0 4px 4px 0;">
            <span style="color: {accent}; font-weight: bold; margin-right: 0.5rem;">[{badge}]</span>
            <span style="font-family: var(--font-code);">{message}</span>
    </div>
    """
    st.markdown(banner_markup, unsafe_allow_html=True)


def _render_step_card(title: str, subtitle: str, state: str) -> str:
    """Build the HTML badge for one workflow step.

    ``state`` selects the glyph and its color ("completed", "active",
    "pending" or "error"); unrecognized states look like "pending".
    """
    # state -> (glyph, glyph color)
    appearance = {
        "completed": ("✔", "var(--success)"),
        "active": ("➤", "var(--primary)"),
        "pending": ("•", "rgba(255,255,255,0.3)"),
        "error": ("!", "var(--error)"),
    }
    glyph, tint = appearance.get(state, appearance["pending"])

    card_markup = f"""
        <div style="
            border:1px solid rgba(255,255,255,0.08);
            padding:0.75rem;
            border-radius:4px;
            min-height:110px;
            background:rgba(0,0,0,0.15);
        ">
            <div style="font-size:1.2rem;color:{tint};">{glyph}</div>
            <div style="font-family:var(--font-display);color:white;">{title}</div>
            <div style="font-size:0.8rem;color:rgba(255,255,255,0.5);">{subtitle}</div>
        </div>
    """
    return card_markup


def enhanced_progress_display_component(
    enable_indexing: bool, chat_mode: bool
) -> Tuple[Any, Any, List[Any], List[Dict[str, str]]]:
    """
    Render the workflow progress panel and return its widgets.

    The step list depends on the mode: chat mode has its own five steps;
    otherwise five steps are shown without indexing and eight with indexing.

    Returns:
        ``(progress_bar, status_text, step_indicators, workflow_steps)`` where
        ``step_indicators`` holds one placeholder per step, each initially
        rendered in the "pending" state.
    """
    # (title, subtitle) pairs for the selected mode.
    if chat_mode:
        outline = (
            ("INIT", "Boot agents"),
            ("PLAN", "Analyze intent"),
            ("SETUP", "Workspace"),
            ("DRAFT", "Generate plan"),
            ("CODE", "Implement"),
        )
    elif enable_indexing:
        outline = (
            ("INIT", "Load systems"),
            ("ANALYZE", "Paper scan"),
            ("DOWNLOAD", "Docs & data"),
            ("PLAN", "Architect"),
            ("REF", "Key refs"),
            ("REPO", "GitHub sync"),
            ("INDEX", "Vectorize"),
            ("CODE", "Implementation"),
        )
    else:
        outline = (
            ("INIT", "Load systems"),
            ("ANALYZE", "Parse paper"),
            ("DOWNLOAD", "Collect refs"),
            ("PLAN", "Blueprint"),
            ("CODE", "Implement"),
        )
    workflow_steps = [
        {"title": heading, "subtitle": caption} for heading, caption in outline
    ]

    st.markdown("### 🛰️ Workflow Monitor")
    progress_bar = st.progress(0)
    status_text = st.empty()

    # One column and one replaceable placeholder per step.
    step_indicators: List[Any] = []
    for column, step in zip(st.columns(len(workflow_steps)), workflow_steps):
        with column:
            slot = st.empty()
            slot.markdown(
                _render_step_card(step["title"], step["subtitle"], "pending"),
                unsafe_allow_html=True,
            )
        step_indicators.append(slot)

    return progress_bar, status_text, step_indicators, workflow_steps


def update_step_indicator(
    step_indicators: List[Any],
    workflow_steps: List[Dict[str, str]],
    current_step: int,
    status: str,
):
    """
    Re-render every step placeholder to reflect the current progress.

    Steps before ``current_step`` are shown as completed, the current one as
    active (or as error when ``status == "error"``) and later ones as pending.
    When ``current_step`` is at or past the number of steps, all steps are
    shown as completed.
    """
    has_failed = status == "error"
    all_done = current_step >= len(workflow_steps)

    for position, slot in enumerate(step_indicators):
        if has_failed and position == current_step:
            phase = "error"
        elif all_done or position < current_step:
            phase = "completed"
        elif position == current_step:
            phase = "active"
        else:
            phase = "pending"

        step_info = workflow_steps[position]
        slot.markdown(
            _render_step_card(step_info["title"], step_info["subtitle"], phase),
            unsafe_allow_html=True,
        )


def chat_input_component(task_counter: int = 0) -> Optional[str]:
    """Render the chat input box and return whatever ``st.chat_input`` yields.

    ``task_counter`` is embedded in the widget key.
    """
    st.markdown("### 💬 Neural Link Interface")
    widget_key = f"chat_input_{task_counter}"
    return st.chat_input(
        placeholder="Input research directive or query...",
        key=widget_key,
    )


def _save_uploaded_pdf(uploaded_file) -> Optional[str]:
    """Write the uploaded file to a temp file and return that file's path.

    The temp file keeps the upload's extension (".pdf" when it has none). On
    any failure the error is shown via ``st.error`` and ``None`` is returned.
    """
    try:
        payload = uploaded_file.read()
        extension = Path(uploaded_file.name).suffix
        if not extension:
            extension = ".pdf"
        stored_file = get_file_handler().create_safe_temp_file(
            suffix=extension, prefix="deepcode_upload_", content=payload
        )
        return str(stored_file)
    except Exception as exc:
        st.error(f"Failed to save uploaded file: {exc}")
        return None


def input_method_selector(task_counter: int) -> Tuple[Optional[str], Optional[str]]:
    """Render the three input tabs and return ``(input_source, input_type)``.

    ``input_type`` is "file" (saved PDF path), "url" or "chat" (free text).
    When several tabs hold a value, the later tab wins. ``(None, None)`` is
    returned when nothing has been provided.
    """
    pdf_tab, url_tab, command_tab = st.tabs(
        ["📄 PDF UPLOAD", "🔗 URL LINK", "⚡ QUICK COMMAND"]
    )
    spacer_markup = '<div style="padding:1rem;"></div>'

    chosen: Tuple[Optional[str], Optional[str]] = (None, None)

    with pdf_tab:
        st.markdown(spacer_markup, unsafe_allow_html=True)
        upload = st.file_uploader(
            "Upload Research Paper (PDF)",
            type="pdf",
            key=f"file_uploader_{task_counter}",
        )
        if upload:
            stored_path = _save_uploaded_pdf(upload)
            if stored_path:
                # Remember the original name; the stored path is a temp file.
                st.session_state["uploaded_filename"] = upload.name
                chosen = (stored_path, "file")

    with url_tab:
        st.markdown(spacer_markup, unsafe_allow_html=True)
        link = st.text_input(
            "ArXiv / GitHub Resource URL",
            placeholder="https://arxiv.org/abs/...",
            key=f"url_input_{task_counter}",
        )
        if link:
            chosen = (link.strip(), "url")

    with command_tab:
        st.markdown(spacer_markup, unsafe_allow_html=True)
        description = st.text_area(
            "Code Specifications / Abstract",
            placeholder="Describe the algorithm or system requirements...",
            height=150,
            key=f"text_input_{task_counter}",
        )
        if description:
            chosen = (description.strip(), "chat")

    return chosen


def results_display_component(result: Any, task_counter: int):
    """Display a workflow result: banner, raw data, status card and download.

    Args:
        result: Mapping describing the outcome. ``result["status"]`` equal to
            "success" marks a successful run; ``result["error"]`` (if present)
            is shown as the failure message.
        task_counter: Number embedded in the downloaded file's name.
    """
    # Local import: this block needs the standard-library json module to
    # produce the download payload.
    import json

    status = result.get("status", "unknown")
    is_success = status == "success"
    status_label = "Mission Complete" if is_success else "Execution Failed"
    status_color = "var(--success)" if is_success else "var(--error)"
    status_icon = icon_img("status_success" if is_success else "status_error", 56)
    if not status_icon:
        status_icon = "✅" if is_success else "⚠️"
    status_message = (
        "Computation sequence completed successfully."
        if is_success
        else result.get("error") or "Unknown error occurred during processing."
    )
    # The message is interpolated into raw HTML below; escape it so error text
    # containing "<", ">" or "&" is displayed literally instead of as markup.
    status_message = html.escape(str(status_message))

    # The download is advertised as application/json, so serialize as real
    # JSON (str(result) would produce a Python repr). Values that JSON cannot
    # represent are stringified; if serialization still fails, fall back to
    # the plain text form rather than breaking the page.
    try:
        download_payload = json.dumps(
            result, indent=2, ensure_ascii=False, default=str
        )
    except (TypeError, ValueError):
        download_payload = str(result)

    st.markdown('<div style="height: 2rem;"></div>', unsafe_allow_html=True)
    st.markdown("### 🚀 Operation Result")

    with st.container():
        if is_success:
            st.success("Workflow completed across all stages ✅")
        else:
            st.error("Workflow interrupted. Check the logs below ⚠️")

        col1, col2 = st.columns([2, 1])
        with col1:
            with st.expander("📜 Execution Logs & Metadata", expanded=True):
                st.json(result)

        with col2:
            st.markdown(
                f"""
                <div style="padding: 1.5rem; border: 1px solid rgba(255,255,255,0.1); border-radius: 6px; background: rgba(255,255,255,0.02); text-align: center; margin-bottom: 1rem;">
                    <div style="margin-bottom:0.5rem;">{status_icon}</div>
                    <div style="font-family: var(--font-display); font-size: 1.3rem; color: {status_color};">{status_label}</div>
                    <div style="font-size: 0.85rem; color: rgba(255,255,255,0.6); margin-top: 0.3rem;">{status_message}</div>
                </div>
                """,
                unsafe_allow_html=True,
            )
            st.download_button(
                label="📥 DOWNLOAD ARTIFACTS" if is_success else "📥 DOWNLOAD LOGS",
                data=download_payload,
                file_name=f"deepcode_result_{task_counter}.json",
                mime="application/json",
                use_container_width=True,
            )


def system_status_component():
    """Show interpreter/platform details and the asyncio event loop state."""
    st.markdown("### 🔧 System Diagnostics")

    metrics_col, runtime_col = st.columns(2)

    with metrics_col:
        st.markdown("#### 📊 Core Metrics")
        python_version = sys.version.split()[0]
        st.info(f"**Python:** {python_version}")
        st.info(f"**Platform:** {sys.platform}")

    with runtime_col:
        st.markdown("#### ⚙️ Runtime Status")
        try:
            import asyncio

            if asyncio.get_event_loop().is_running():
                st.success("Event Loop: ACTIVE")
            else:
                st.warning("Event Loop: STANDBY")
        except Exception:
            # Any failure while probing the loop is reported as "managed".
            st.info("Event Loop: MANAGED")


def error_troubleshooting_component():
    """Render a collapsed troubleshooting expander with an API-key hint."""
    hint = "If you encounter issues, please check your API keys in the sidebar."
    with st.expander("🛠️ Diagnostics & Troubleshooting", expanded=False):
        st.warning(hint)


def footer_component():
    """Render the page footer with the system label and version string."""
    footer_markup = """
        <div style="text-align: center; margin-top: 6rem; padding: 2rem; color: rgba(255,255,255,0.2); font-family: var(--font-code); font-size: 0.7rem; border-top: 1px solid rgba(255,255,255,0.05);">
            DEEPCODE_SYSTEMS // <span style="color: var(--primary);">OPERATIONAL</span> // VERSION 3.0.1
    </div>
    """
    st.markdown(footer_markup, unsafe_allow_html=True)


def render_sidebar_feed(max_items: int = 12):
    """
    Render live mission feed inside sidebar.

    Reads the event list from ``st.session_state["sidebar_events"]`` and shows
    the newest ``max_items`` entries, most recent first, as HTML cards.

    Args:
        max_items: Maximum number of events to display. Values <= 0 display
            no event cards.
    """
    st.markdown("#### 📡 Mission Feed")
    # `or []` also covers the key being present but set to None.
    events = list(st.session_state.get("sidebar_events") or [])

    col1, col2 = st.columns([1, 1])
    with col1:
        st.caption("Real-time agent telemetry")
    with col2:
        if st.button("Clear Feed", key="sidebar_clear_feed"):
            st.session_state.sidebar_events = []
            events = []
            st.session_state.sidebar_feed_last_cleared = datetime.utcnow().strftime(
                "%H:%M:%S"
            )

    if not events:
        st.caption("Awaiting activity...")
        return

    # events[-0:] would return the *whole* list, so treat non-positive limits explicitly.
    recent_events = reversed(events[-max_items:]) if max_items > 0 else ()
    for event in recent_events:
        if not isinstance(event, dict):
            continue  # ignore malformed feed entries instead of crashing the sidebar

        # Every value is interpolated into raw HTML (unsafe_allow_html=True),
        # so all of them are escaped, not only the message.
        stage = html.escape(str(event.get("stage", "STAGE")))
        message = html.escape(str(event.get("message", "")))
        timestamp = html.escape(str(event.get("timestamp", "--:--:--")))
        level = html.escape(str(event.get("level", "info")), quote=True)
        extra = event.get("extra")

        st.markdown(
            f"""
            <div class="sidebar-feed-card level-{level}">
                <div class="stage-line">
                    <span class="stage">{stage}</span>
                    <span class="time">{timestamp}</span>
                </div>
                <div class="message">{message}</div>
            </div>
            """,
            unsafe_allow_html=True,
        )

        if isinstance(extra, dict) and extra:
            with st.expander("Details", expanded=False):
                st.json(extra)


def render_system_monitor():
    """
    Display current backend + command telemetry.

    Builds a status card from ``st.session_state`` (processing flag, intake
    mode, indexing toggle, task counter) and from the most recent entry of
    ``sidebar_events``. A stored ``last_error`` is shown as a warning below.
    """
    st.markdown("#### 🧬 System Monitor")
    state = st.session_state
    processing = state.get("processing", False)
    mode = html.escape(str(state.get("requirement_analysis_mode", "direct")).upper())
    indexing_enabled = state.get("enable_indexing", True)
    task_counter = html.escape(str(state.get("task_counter", 0)))
    last_error = state.get("last_error")

    events = state.get("sidebar_events") or []
    latest_event = events[-1] if events else None
    if not isinstance(latest_event, dict):
        latest_event = None  # tolerate a malformed feed entry

    last_stage = ""
    last_message = ""
    last_progress = None
    if latest_event:
        last_stage = html.escape(str(latest_event.get("stage") or ""))
        last_message = html.escape(str(latest_event.get("message", "")))
        # "extra" may be present but None (the feed renderer allows that),
        # so `.get("extra", {})` alone is not enough.
        extra = latest_event.get("extra")
        if isinstance(extra, dict):
            last_progress = extra.get("progress")

    state_label = "ACTIVE" if processing else "IDLE"
    indexing_label = "ON" if indexing_enabled else "OFF"
    progress_suffix = (
        "· " + html.escape(str(last_progress)) + "%"
        if last_progress is not None
        else ""
    )

    st.markdown(
        f"""
        <div class="system-monitor-card">
            <div class="status-grid">
                <div class="status-chip"><span>STATE</span><span>{state_label}</span></div>
                <div class="status-chip"><span>MODE</span><span>{mode}</span></div>
                <div class="status-chip"><span>INDEXING</span><span>{indexing_label}</span></div>
                <div class="status-chip"><span>TASKS</span><span>{task_counter}</span></div>
            </div>
            <div class="latest-stage">
                <strong>{last_stage if last_stage else "--"}</strong>
                {progress_suffix}
                <br/>{last_message or "Awaiting telemetry..."}
            </div>
        </div>
        """,
        unsafe_allow_html=True,
    )

    if last_error:
        st.warning(f"Last error: {last_error}")


def _format_log_line_html(line: str) -> str:
    """Return one HTML ``<div>`` for a raw log line, with all dynamic text escaped."""
    import json

    try:
        event = json.loads(line)
    except ValueError:  # json.JSONDecodeError is a ValueError subclass
        event = None

    if not isinstance(event, dict):
        # Plain text, or valid JSON that is not an object: show the raw line.
        return (
            f'<div style="font-family: var(--font-code); font-size: 0.75rem; padding: 0.2rem; '
            f'color: rgba(255,255,255,0.6);">{html.escape(line[:200])}</div>'
        )

    def _text(key: str, default: str = "") -> str:
        # Fields are not guaranteed to be strings (None, numbers, nested objects).
        value = event.get(key, default)
        return default if value is None else str(value)

    timestamp = _text("timestamp")
    level = _text("level", "INFO")
    message = _text("message")
    namespace = _text("namespace")

    # Color code by level
    if level == "ERROR":
        level_color = "#ff4444"
    elif level == "WARNING":
        level_color = "#ffaa00"
    elif "SUCCESS" in level.upper():
        level_color = "#00ff88"
    else:
        level_color = "#00d4ff"

    # Keep only the time-of-day portion of an ISO timestamp.
    time_str = timestamp.split("T")[-1][:12] if "T" in timestamp else timestamp[-12:]
    namespace_short = namespace.split(".")[-1] if namespace else ""

    # Truncate before escaping so an HTML entity is never cut in half.
    return (
        f'<div style="font-family: var(--font-code); font-size: 0.8rem; padding: 0.25rem 0.4rem; '
        f"border-left: 2px solid {level_color}; margin-bottom: 0.2rem; background: rgba(255,255,255,0.02); "
        f'border-radius: 2px;">'
        f'<span style="color: rgba(255,255,255,0.4); font-size: 0.75rem;">{html.escape(time_str)}</span> '
        f'<span style="color: {level_color}; font-weight: 600; font-size: 0.75rem;">[{html.escape(level)}]</span> '
        f'<span style="color: var(--primary); font-size: 0.75rem;">{html.escape(namespace_short)}</span><br/>'
        f'<span style="color: rgba(255,255,255,0.85); margin-left: 0.5rem;">{html.escape(message[:200])}</span>'
        f"</div>"
    )


def render_log_viewer(max_lines: int = 50):
    """
    Display live log stream for current mission in a scrollable container.

    Picks a ``*.jsonl`` file from ``BASE_DIR / "logs"``: while a workflow is
    running (``workflow_start_time`` set) the newest file modified no earlier
    than 10 seconds before the start; otherwise the previously shown file if it
    still exists, else the newest file. The last ``max_lines`` lines are
    rendered as HTML.

    Args:
        max_lines: Number of trailing log lines to show (clamped to at least 1).
    """
    from collections import deque

    st.markdown("#### 📁 Live Log Stream")
    logs_dir = BASE_DIR / "logs"
    if not logs_dir.exists():
        st.info("Logs directory not found.")
        return

    # Collect (mtime, path) once; a file may vanish between listing and stat.
    candidates = []
    for path in logs_dir.glob("*.jsonl"):
        try:
            if path.is_file():
                candidates.append((path.stat().st_mtime, path))
        except OSError:
            continue
    if not candidates:
        st.info("No log files available yet.")
        return
    candidates.sort(key=lambda item: item[0], reverse=True)
    newest_mtime, newest_path = candidates[0]

    start_ts = st.session_state.get("workflow_start_time")
    selected_path = None

    if start_ts:
        # Use a tolerance window: accept logs created within 10 seconds before workflow_start_time.
        # Candidates are sorted newest-first, so only the newest can satisfy the threshold first.
        tolerance = 10.0
        if newest_mtime >= (start_ts - tolerance):
            selected_path = newest_path
        else:
            st.caption("Waiting for current task log to be created...")
            return
    else:
        prev = st.session_state.get("active_log_file")
        if prev and Path(prev).exists():
            selected_path = Path(prev)
        else:
            selected_path = newest_path

    st.session_state.active_log_file = str(selected_path)

    try:
        # Stream the file and keep only the tail instead of loading it whole.
        with selected_path.open(encoding="utf-8", errors="ignore") as handle:
            tail_lines = list(deque(handle, maxlen=max(int(max_lines), 1)))
    except Exception as exc:
        st.error(f"Failed to read {selected_path.name}: {exc}")
        return

    # Show file info
    processing = st.session_state.get("processing", False)
    status_icon = "🔄" if processing else "✅"
    st.caption(f"{status_icon} {selected_path.name} | Last {len(tail_lines)} lines")

    if not tail_lines:
        st.info("Log file is empty.")
        return

    log_html_parts = [
        _format_log_line_html(stripped)
        for stripped in (raw.strip() for raw in tail_lines)
        if stripped
    ]

    # Render in scrollable container
    full_log_html = f"""
    <div style="max-height: 600px; overflow-y: auto; overflow-x: hidden;
                padding: 0.5rem; background: rgba(0,0,0,0.2); border-radius: 4px;
                border: 1px solid rgba(255,255,255,0.1);">
        {''.join(log_html_parts)}
    </div>
    """

    st.markdown(full_log_html, unsafe_allow_html=True)


def reset_guided_workflow_state(preserve_initial: bool = False):
    """
    Return the guided requirement workflow to its first step.

    Args:
        preserve_initial: When True, keep the requirement text already typed
            by the user; when False, blank it (and ``initial_requirement``).
    """
    state = st.session_state

    if not preserve_initial:
        kept_text = ""
        state.initial_requirement = ""
    else:
        kept_text = state.get(
            "guided_initial_requirement",
            state.get("initial_requirement", ""),
        )

    # Fresh values for every guided-workflow key, applied in a fixed order.
    fresh_values = {
        "guided_initial_requirement": kept_text,
        "guided_edit_feedback": "",
        "requirement_analysis_step": "input",
        "generated_questions": [],
        "user_answers": {},
        "detailed_requirements": "",
        "questions_generating": False,
        "requirements_generating": False,
        "requirements_confirmed": False,
        "requirements_editing": False,
        "edit_feedback": "",
        "confirmed_requirement_text": None,
    }
    for field_name, field_value in fresh_values.items():
        setattr(state, field_name, field_value)

    clear_guided_answer_inputs()


def requirement_mode_selector() -> str:
    """
    Draw the Direct/Guided intake-mode radio and sync the choice to session state.

    Returns:
        The mode key selected in the radio ("direct" or "guided").
    """
    labels_by_mode = {"direct": "🚀 Direct Mode", "guided": "🧭 Guided Mode"}
    state = st.session_state
    active_mode = state.get("requirement_analysis_mode", "direct")
    preselected = 1 if active_mode == "guided" else 0

    chosen = st.radio(
        "Requirement Intake Mode",
        options=list(labels_by_mode),
        index=preselected,
        horizontal=True,
        format_func=labels_by_mode.__getitem__,
        key="requirement_mode_selector_radio",
    )

    if chosen == active_mode:
        return chosen

    # The mode changed: record it and bring the guided workflow to a known state.
    state.requirement_analysis_mode = chosen
    if chosen != "direct":
        state.requirement_analysis_step = "input"
    else:
        reset_guided_workflow_state(preserve_initial=False)

    return chosen


def guided_requirement_workflow() -> Tuple[Optional[str], bool]:
    """
    Render the guided requirement analysis workflow.

    The UI is a small state machine driven by
    ``st.session_state["requirement_analysis_step"]`` with four steps:
    "input", "questions", "summary" and "editing". Button handlers only set
    session-state flags (e.g. ``questions_generating``,
    ``requirements_generating``, ``requirements_editing``); nothing in this
    function calls an LLM itself.

    Returns:
        A ``(confirmed_text, is_confirmed)`` tuple. Both values come from
        ``confirmed_requirement_text`` as it was when this call started, so a
        confirmation made by a button press during this run is only reflected
        in the return value of a later run.
    """

    st.markdown("### 🧭 Guided Requirement Workflow")

    step = st.session_state.get("requirement_analysis_step", "input")
    # Seed the widget-bound keys so the text areas below start with any
    # previously stored values.
    st.session_state.setdefault(
        "guided_initial_requirement", st.session_state.get("initial_requirement", "")
    )
    st.session_state.setdefault(
        "guided_edit_feedback", st.session_state.get("edit_feedback", "")
    )

    step_titles = {
        "input": "Step 1 · Describe Requirements",
        "questions": "Step 2 · Answer Guiding Questions",
        "summary": "Step 3 · Review Requirement Document",
        "editing": "Step 4 · Request Changes",
    }
    # Unknown step values fall back to the Step 1 caption.
    st.caption(
        f"Current Stage: {step_titles.get(step, 'Step 1 · Describe Requirements')}"
    )

    # Snapshot taken before any button handler runs; this is what gets returned.
    confirmed_doc = st.session_state.get("confirmed_requirement_text")

    # ---- Step 1: free-text requirement input ----
    if step == "input":
        st.markdown("#### 1 · Describe your project")
        st.text_area(
            "Describe the product scope, tech stack, performance targets, and constraints:",
            key="guided_initial_requirement",
            height=180,
        )
        initial_text = st.session_state.get("guided_initial_requirement", "")

        col1, col2 = st.columns(2)
        with col1:
            if st.button("Generate guiding questions", type="primary"):
                if not initial_text.strip():
                    st.warning("Please enter your project requirements first.")
                else:
                    # Store the text, clear all downstream results, flag question
                    # generation and move to step 2.
                    st.session_state.initial_requirement = initial_text.strip()
                    st.session_state.questions_generating = True
                    st.session_state.requirement_analysis_step = "questions"
                    st.session_state.generated_questions = []
                    st.session_state.user_answers = {}
                    st.session_state.detailed_requirements = ""
                    st.session_state.confirmed_requirement_text = None
                    st.session_state.requirements_generating = False
                    st.session_state.requirements_confirmed = False
                    st.session_state.requirements_editing = False
                    st.session_state.edit_feedback = ""
                    clear_guided_answer_inputs()
                    st.rerun()

        with col2:
            if st.button("Skip Q&A and use current spec", type="secondary"):
                if not initial_text.strip():
                    st.warning("Please enter your project requirements first.")
                else:
                    # Use the raw description as the confirmed document.
                    # NOTE(review): no st.rerun() here, so `confirmed_doc` above
                    # is stale for the rest of this run — confirm callers rely on
                    # session state rather than the return value.
                    final_doc = initial_text.strip()
                    st.session_state.initial_requirement = final_doc
                    st.session_state.confirmed_requirement_text = final_doc
                    st.session_state.requirements_confirmed = True
                    st.success(
                        "Current description locked as the requirement document. Implementation will proceed next."
                    )

    # ---- Step 2: answer the generated questions ----
    elif step == "questions":
        st.markdown("#### 2 · Answer guiding questions")
        if st.session_state.get("questions_generating"):
            st.info("LLM is crafting guiding questions. Please wait...")

        questions = st.session_state.get("generated_questions", [])
        question_ids: List[str] = []

        if not questions:
            st.caption("Guiding questions will appear once generation is complete.")
        else:
            for idx, question in enumerate(questions):
                # A question is either a dict (id/text/metadata under several
                # possible key names) or any other value, shown via str().
                if isinstance(question, dict):
                    q_id = str(
                        question.get("id")
                        or question.get("question_id")
                        or question.get("qid")
                        or idx
                    )
                    q_text = question.get("question") or question.get("content") or ""
                    category = question.get("category")
                    importance = question.get("importance")
                    hint = question.get("hint")
                else:
                    q_id = str(idx)
                    q_text = str(question)
                    category = importance = hint = None

                question_ids.append(q_id)

                st.markdown(
                    f"**Q{idx + 1}. {q_text or 'Please answer this question'}**"
                )
                # NOTE(review): str.join below assumes category/importance are
                # strings; a non-string value would raise TypeError.
                meta_parts = [part for part in [category, importance] if part]
                if meta_parts:
                    st.caption(" / ".join(meta_parts))
                if hint:
                    st.caption(f"Hint: {hint}")

                # Widget keys are positional (index-based); stored answers are
                # keyed by question id.
                answer_key = f"guided_answer_{idx}"
                if answer_key not in st.session_state:
                    default_answer = st.session_state.user_answers.get(q_id, "")
                    st.session_state[answer_key] = default_answer

                st.text_area("Your answer", key=answer_key, height=100)

        col1, col2, col3 = st.columns(3)
        with col1:
            if st.button(
                "Generate requirement document", type="primary", disabled=not questions
            ):
                # Collect only non-empty answers, keyed by question id.
                answers_payload = {}
                for idx, q_id in enumerate(question_ids):
                    answer_value = st.session_state.get(
                        f"guided_answer_{idx}", ""
                    ).strip()
                    if answer_value:
                        answers_payload[q_id] = answer_value

                st.session_state.user_answers = answers_payload
                st.session_state.requirements_generating = True
                st.session_state.requirement_analysis_step = "summary"
                st.session_state.detailed_requirements = ""
                st.session_state.confirmed_requirement_text = None
                st.session_state.requirements_confirmed = False
                st.rerun()

        with col2:
            if st.button(
                "Generate without answers", type="secondary", disabled=not questions
            ):
                # Same transition as above but with an empty answer set.
                st.session_state.user_answers = {}
                st.session_state.requirements_generating = True
                st.session_state.requirement_analysis_step = "summary"
                st.session_state.detailed_requirements = ""
                st.session_state.confirmed_requirement_text = None
                st.session_state.requirements_confirmed = False
                st.rerun()

        with col3:
            if st.button("Back to Step 1"):
                reset_guided_workflow_state(preserve_initial=True)
                st.rerun()

    # ---- Step 3: review the generated requirement document ----
    elif step == "summary":
        st.markdown("#### 3 · AI-generated requirement document")
        if st.session_state.get("requirements_generating"):
            st.info("Generating requirement document. Please wait...")

        summary = (st.session_state.get("detailed_requirements") or "").strip()

        if summary:
            st.markdown(summary)
            st.download_button(
                "Download requirement document",
                summary,
                file_name="deepcode_requirements.md",
                mime="text/markdown",
                use_container_width=True,
            )
        else:
            st.caption("Waiting for requirement document to be generated...")

        col1, col2, col3 = st.columns(3)
        with col1:
            if st.button(
                "Confirm and start implementation ✅",
                type="primary",
                disabled=not summary,
            ):
                # The button is disabled without a summary, so the fallback to
                # initial_requirement is a defensive path.
                final_doc = summary or st.session_state.get("initial_requirement", "")
                if final_doc.strip():
                    st.session_state.confirmed_requirement_text = final_doc.strip()
                    st.session_state.requirements_confirmed = True
                    st.success(
                        "Requirement document confirmed. Implementation pipeline will start next."
                    )
                else:
                    st.warning("No requirement document available yet.")

        with col2:
            if st.button("Request edits", type="secondary", disabled=not summary):
                # NOTE(review): the step changes without st.rerun(); the editing
                # view is only drawn on the next script run.
                st.session_state.requirement_analysis_step = "editing"
                st.session_state.guided_edit_feedback = ""

        with col3:
            if st.button("Restart Q&A", type="secondary"):
                reset_guided_workflow_state(preserve_initial=True)
                st.rerun()

    # ---- Step 4: collect change requests for the document ----
    elif step == "editing":
        st.markdown("#### 4 · Modify requirement document")
        st.text_area(
            "Describe the changes or clarifications you need:",
            key="guided_edit_feedback",
            height=160,
        )
        feedback_value = st.session_state.get("guided_edit_feedback", "")

        col1, col2 = st.columns(2)
        with col1:
            if st.button("Submit change request", type="primary"):
                if not feedback_value.strip():
                    st.warning("Please describe the requested changes.")
                else:
                    # Only records the feedback and raises the editing flag.
                    st.session_state.edit_feedback = feedback_value.strip()
                    st.session_state.requirements_editing = True
                    st.info("Updating requirement document based on your feedback...")

        with col2:
            if st.button("Back to requirement document"):
                # NOTE(review): this writes a widget-bound key
                # ("guided_edit_feedback") after the widget was created in this
                # run — confirm Streamlit accepts that here.
                st.session_state.requirement_analysis_step = "summary"
                st.session_state.guided_edit_feedback = ""

        if st.session_state.get("requirements_editing"):
            st.info("Requirement document is updating...")

    # Based on the snapshot taken at the top of this run.
    if confirmed_doc:
        st.success("Requirement document locked. You can start implementation anytime.")

    return (confirmed_doc if confirmed_doc else None, bool(confirmed_doc))


def sidebar_control_panel():
    """
    Sidebar configuration.

    Renders the "CONTROL DECK" header, the live log viewer (only once a
    workflow start time has been recorded in session state) and the copyright
    footer — all inside the Streamlit sidebar.

    Returns:
        An empty dict.
    """
    with st.sidebar:
        st.markdown(
            """
            <div style="margin-bottom: 2rem; padding-bottom: 1rem; border-bottom: 1px solid rgba(255,255,255,0.1);">
                <h2 style="margin:0; color:white;">CONTROL DECK</h2>
                <div style="font-family:var(--font-code); color:var(--primary); font-size:0.8rem;">// MISSION CONTROL</div>
        </div>
        """,
            unsafe_allow_html=True,
        )

        workflow_start = st.session_state.get("workflow_start_time")

        if workflow_start:
            render_log_viewer()
        else:
            st.info("Awaiting next mission run to stream logs.")

        # The footer belongs to the sidebar; outside the `with` block it was
        # emitted into the main page area instead.
        st.markdown(
            """
            <div style="font-size: 0.7rem; color: rgba(255,255,255,0.3); text-align: center; margin-top: 1rem;">
                © 2024 DeepCode Research
    </div>
    """,
            unsafe_allow_html=True,
        )

    return {}


================================================
FILE: ui/handlers.py
================================================
"""
Streamlit Event Handlers Module

Contains all event handling and business logic
"""

import asyncio
import time
import os
import traceback
import atexit
import signal
from datetime import datetime
from typing import Dict, Any

import streamlit as st
import nest_asyncio
import concurrent.futures

# Module-wide abort flag, written by the setters below and read by is_abort_requested()
_abort_requested = False


def set_abort_requested(value: bool = True):
    """Store ``value`` in the module-wide abort flag; announce it when truthy."""
    global _abort_requested
    _abort_requested = value
    if not value:
        return
    print("🛑 Abort requested by user")


def is_abort_requested() -> bool:
    """Return the current value of the module-wide abort flag."""
    return _abort_requested


def reset_abort_flag():
    """Clear the module-wide abort flag."""
    global _abort_requested
    _abort_requested = False

# Import necessary modules
from mcp_agent.app import MCPApp
from workflows.agent_orchestration_engine import (
    execute_multi_agent_research_pipeline,
    execute_chat_based_planning_pipeline,
)
from .sidebar_feed import log_sidebar_event, ensure_sidebar_logging


def _emergency_cleanup():
    """
    Emergency resource cleanup function
    Called when program exits abnormally
    """
    try:
        cleanup_resources()
    except Exception:
        pass  # Silent handling to avoid new exceptions during exit


def _signal_handler(signum, frame):
    """
    Handle a termination signal: clean up, then let the default action run.

    Args:
        signum: Number of the signal being handled.
        frame: Current stack frame (unused).
    """
    try:
        try:
            cleanup_resources()
        except Exception:
            # Cleanup is best effort; the signal must still be delivered.
            pass
    finally:
        # Put the default disposition back and re-send the signal to this process.
        signal.signal(signum, signal.SIG_DFL)
        own_pid = os.getpid()
        os.kill(own_pid, signum)


# Run the best-effort cleanup hook when the interpreter exits.
# This registration happens as a side effect of importing this module.
atexit.register(_emergency_cleanup)


def _safe_register_signal_handlers():
    """Safely register signal handlers"""
    try:
        # Check if running in main thread
        import threading

        if threading.current_thread() is not threading.main_thread():
            return  # Signal handlers can only be registered in main thread

        # Try to register signal handlers
        signal.signal(signal.SIGTERM, _signal_handler)
        signal.signal(signal.SIGINT, _signal_handler)
        if hasattr(signal, "SIGBREAK"):  # Windows
            signal.signal(signal.SIGBREAK, _signal_handler)
    except (AttributeError, OSError, ValueError):
        # Some signals are not available on certain platforms or disabled in some environments
        # This is common in web frameworks like Streamlit
        pass


# Register signal handlers when this module is imported. The helper already
# tolerates unsupported platforms and non-main threads; this outer guard
# swallows anything else so that importing the module never fails.
try:
    _safe_register_signal_handlers()
except Exception:
    # If registration fails, silently ignore and don't affect app startup
    pass


async def process_input_async(
    input_source: str,
    input_type: str,
    enable_indexing: bool = True,
    progress_callback=None,
) -> Dict[str, Any]:
    """
    Process input asynchronously

    Starts an ``MCPApp`` and, inside its run context, dispatches to the
    chat-based planning pipeline (``input_type == "chat"``) or to the
    multi-agent research pipeline (any other type).

    Args:
        input_source: Input source (requirement text for chat mode, otherwise
            whatever the research pipeline accepts)
        input_type: Input type; "chat" selects the planning pipeline
        enable_indexing: Whether to enable indexing functionality
        progress_callback: Optional callable invoked as
            ``progress_callback(percent, message)``

    Returns:
        Processing result: a dict whose "status" is "success" (with
        "repo_result"), "aborted" (abort flag set before the pipeline
        started) or "error" (with "error" and "traceback"). Exceptions are
        reported through the dict rather than raised.
    """
    try:
        # Create and use MCP app in the same async context
        app = MCPApp(name="paper_to_code")

        async with app.run() as agent_app:
            logger = agent_app.logger
            context = agent_app.context

            # Expose the working directory to the filesystem server. Append it
            # only when missing so repeated runs do not pile up duplicate
            # entries if the configuration object is reused between runs.
            filesystem_args = context.config.mcp.servers["filesystem"].args
            working_dir = os.getcwd()
            if working_dir not in filesystem_args:
                filesystem_args.append(working_dir)

            # Initialize progress
            if progress_callback:
                if input_type == "chat":
                    progress_callback(
                        5, "🚀 Initializing chat-based planning pipeline..."
                    )
                else:
                    progress_callback(5, "🚀 Initializing AI research engine...")

            # Check for abort before starting
            if is_abort_requested():
                return {"status": "aborted", "message": "Process aborted by user"}

            # Choose pipeline based on input type
            if input_type == "chat":
                # Use chat-based planning pipeline for user requirements
                repo_result = await execute_chat_based_planning_pipeline(
                    input_source,  # User's coding requirements
                    logger,
                    progress_callback,
                    enable_indexing=enable_indexing,  # Pass indexing control parameter
                )
            else:
                # Use traditional multi-agent research pipeline for files/URLs
                repo_result = await execute_multi_agent_research_pipeline(
                    input_source,
                    logger,
                    progress_callback,
                    enable_indexing=enable_indexing,  # Pass indexing control parameter
                )

            return {
                "analysis_result": "Integrated into complete workflow",
                "download_result": "Integrated into complete workflow",
                "repo_result": repo_result,
                "status": "success",
            }

    except Exception as e:
        # Report failures to the caller as data; the UI renders them.
        error_msg = str(e)
        traceback_msg = traceback.format_exc()

        return {"error": error_msg, "traceback": traceback_msg, "status": "error"}


def run_async_task(coro):
    """
    Helper function to run async tasks

    The coroutine is executed on a fresh event loop in a single worker thread
    (with the Streamlit script context attached when it can be obtained), and
    this call blocks for up to five minutes waiting for it.

    If the worker could not even start the coroutine, it is run directly in
    the calling thread instead. A coroutine that started and then failed is
    NOT retried: a coroutine object can only be awaited once, so retrying
    would replace the real error with ``RuntimeError: cannot reuse already
    awaited coroutine``.

    Args:
        coro: Coroutine object

    Returns:
        Task result

    Raises:
        TimeoutError: The task did not finish within five minutes.
        Exception: Whatever the coroutine itself raised.
    """
    import gc
    import inspect
    import threading

    # Apply nest_asyncio to support nested event loops
    nest_asyncio.apply()

    # Save current Streamlit context
    try:
        from streamlit.runtime.scriptrunner import get_script_run_ctx
        from streamlit.runtime.scriptrunner.script_run_context import (
            SCRIPT_RUN_CONTEXT_ATTR_NAME,
        )

        current_ctx = get_script_run_ctx()
        context_available = True
    except ImportError:
        # If Streamlit context modules can't be imported, use fallback method
        current_ctx = None
        context_available = False

    def run_in_new_loop():
        """Run coroutine in new event loop"""
        worker = threading.current_thread()

        # Set Streamlit context in new thread (if available)
        if context_available and current_ctx:
            try:
                setattr(worker, SCRIPT_RUN_CONTEXT_ATTR_NAME, current_ctx)
            except Exception:
                pass  # Ignore context setting errors

        loop = None
        try:
            loop = asyncio.new_event_loop()
            asyncio.set_event_loop(loop)
            return loop.run_until_complete(coro)
        finally:
            # Clean up resources
            if loop is not None:
                try:
                    loop.close()
                except Exception:
                    pass
            asyncio.set_event_loop(None)

            # Clean up thread context (if available)
            if context_available:
                try:
                    if hasattr(worker, SCRIPT_RUN_CONTEXT_ATTR_NAME):
                        delattr(worker, SCRIPT_RUN_CONTEXT_ATTR_NAME)
                except Exception:
                    pass  # Ignore cleanup errors

            gc.collect()

    def coroutine_not_started() -> bool:
        """True only when `coro` is a coroutine object that has never been run."""
        return (
            inspect.iscoroutine(coro)
            and inspect.getcoroutinestate(coro) == inspect.CORO_CREATED
        )

    # Use thread pool to run async task, avoiding event loop conflicts
    executor = None
    wait_for_worker = True
    try:
        executor = concurrent.futures.ThreadPoolExecutor(
            max_workers=1, thread_name_prefix="deepcode_ctx_async"
        )
        future = executor.submit(run_in_new_loop)
        return future.result(timeout=300)  # 5 minute timeout
    except concurrent.futures.TimeoutError:
        # The worker is still busy; waiting for it during shutdown would
        # block this call for as long as the task keeps running.
        wait_for_worker = False
        st.error("Processing timeout after 5 minutes. Please try again.")
        raise TimeoutError("Processing timeout")
    except Exception as e:
        if not coroutine_not_started():
            # The task itself failed (or cannot be restarted): surface the real error.
            raise

        # Thread pool execution failed before the coroutine ran: try direct execution
        st.warning(f"Threaded async execution failed: {e}, trying direct execution...")
        loop = None
        try:
            loop = asyncio.new_event_loop()
            asyncio.set_event_loop(loop)
            return loop.run_until_complete(coro)
        except Exception as backup_error:
            st.error(f"All execution methods failed: {backup_error}")
            raise
        finally:
            if loop is not None:
                try:
                    loop.close()
                except Exception:
                    pass
            asyncio.set_event_loop(None)
    finally:
        # Ensure thread pool is properly closed
        if executor:
            try:
                executor.shutdown(wait=wait_for_worker, cancel_futures=True)
            except Exception:
                pass
        # Force garbage collection
        gc.collect()


def run_async_task_simple(coro):
    """
    Simple async task runner, avoiding threading issues

    Strategy:
      1. If the current event loop is idle, run the coroutine on it.
      2. If the current loop is already running, run the coroutine on a new
         loop in a single worker thread (five minute timeout).
      3. If neither could start the coroutine (for example no event loop can
         be obtained in this thread), run it on a newly created loop.

    A coroutine that already started is never run a second time: coroutine
    objects are single-use, so a retry would mask the real failure with
    ``RuntimeError: cannot reuse already awaited coroutine``.

    Args:
        coro: Coroutine object

    Returns:
        Task result

    Raises:
        TimeoutError: The threaded run did not finish within five minutes.
        Exception: Whatever the coroutine itself raised.
    """
    import concurrent.futures
    import gc
    import inspect

    # Apply nest_asyncio to support nested event loops
    nest_asyncio.apply()

    def run_on_fresh_loop():
        """Create a loop for the current thread, run `coro` on it, then tear it down."""
        new_loop = asyncio.new_event_loop()
        asyncio.set_event_loop(new_loop)
        try:
            return new_loop.run_until_complete(coro)
        finally:
            try:
                new_loop.close()
            except Exception:
                pass
            # Clear current thread's event loop reference
            asyncio.set_event_loop(None)
            gc.collect()

    def run_in_worker_thread():
        """Run `coro` on a fresh loop in a worker thread, waiting at most five minutes."""
        executor = None
        wait_for_worker = True
        try:
            executor = concurrent.futures.ThreadPoolExecutor(
                max_workers=1, thread_name_prefix="deepcode_async"
            )
            future = executor.submit(run_on_fresh_loop)
            return future.result(timeout=300)  # 5 minute timeout
        except concurrent.futures.TimeoutError:
            # Do not wait for the still-running worker during shutdown.
            wait_for_worker = False
            st.error(
                "Processing timeout after 5 minutes. Please try again with a smaller file."
            )
            raise TimeoutError("Processing timeout")
        except Exception as e:
            st.error(f"Async processing error: {e}")
            raise
        finally:
            # Ensure thread pool is properly closed
            if executor:
                try:
                    executor.shutdown(wait=wait_for_worker, cancel_futures=True)
                except Exception:
                    pass
            gc.collect()

    try:
        # Try to run in current event loop
        loop = asyncio.get_event_loop()
        if loop.is_running():
            return run_in_worker_thread()
        # Run directly in current loop
        return loop.run_until_complete(coro)
    except Exception:
        never_started = (
            inspect.iscoroutine(coro)
            and inspect.getcoroutinestate(coro) == inspect.CORO_CREATED
        )
        if not never_started:
            # The task itself failed or timed out: propagate the real error.
            raise

        # Final fallback method: create new event loop
        try:
            return run_on_fresh_loop()
        except Exception as backup_error:
            st.error(f"All async methods failed: {backup_error}")
            raise


def handle_processing_workflow(
    input_source: str, input_type: str, enable_indexing: bool = True
) -> Dict[str, Any]:
    """
    Run the processing workflow synchronously while rendering Streamlit progress.

    Renders the progress widgets, maps reported progress percentages onto the
    step indicators, runs ``process_input_async`` through
    ``run_async_task_simple`` (retrying once through ``run_async_task`` if the
    first attempt raises) and finally renders the success or failure state.

    Args:
        input_source: Input source, forwarded unchanged to ``process_input_async``
        input_type: Input type; ``"chat"`` selects the chat-mode step layout
        enable_indexing: Whether to enable indexing functionality; when False
            (and not in chat mode) the shorter fast-mode step mapping is used

    Returns:
        Processing result dict produced by the async workflow. Two results are
        built here instead: ``{"status": "aborted", ...}`` when an abort was
        already requested before the run started, and
        ``{"status": "error", "error": ..., "traceback": ...}`` when both async
        runners raised.
    """
    # Imported lazily inside the function rather than at module level
    from .components import (
        enhanced_progress_display_component,
        update_step_indicator,
        display_status,
    )

    # Display enhanced progress components
    chat_mode = input_type == "chat"
    progress_bar, status_text, step_indicators, workflow_steps = (
        enhanced_progress_display_component(enable_indexing, chat_mode)
    )
    log_sidebar_event(
        "SYSTEM",
        f"Workflow started ({'guided/chat' if chat_mode else 'research'} mode)",
        extra={"input_type": input_type, "indexing": enable_indexing},
    )

    # Step mapping: map progress percentages to step indices - adjust based on mode and indexing toggle.
    # Only these exact percentages move the step indicator (see the lookup in update_progress).
    if chat_mode:
        # Chat mode step mapping: Initialize -> Planning -> Setup -> Save Plan -> Implement
        step_mapping = {
            5: 0,  # Initialize
            30: 1,  # Planning (analyzing requirements)
            50: 2,  # Setup (creating workspace)
            70: 3,  # Save Plan (saving implementation plan)
            85: 4,  # Implement (generating code)
            100: 4,  # Complete
        }
    elif not enable_indexing:
        # Skip indexing-related steps progress mapping - fast mode order: Initialize -> Analyze -> Download -> Plan -> Implement
        step_mapping = {
            5: 0,  # Initialize
            10: 1,  # Analyze
            25: 2,  # Download
            40: 3,  # Plan (now prioritized over References, 40%)
            85: 4,  # Implement (skip References, Repos and Index)
            100: 4,  # Complete
        }
    else:
        # Full workflow step mapping - new order: Initialize -> Analyze -> Download -> Plan -> References -> Repos -> Index -> Implement
        step_mapping = {
            5: 0,  # Initialize
            10: 1,  # Analyze
            25: 2,  # Download
            40: 3,  # Plan (now 4th position, 40%)
            50: 4,  # References (now 5th position, conditional, 50%)
            60: 5,  # Repos (GitHub download)
            70: 6,  # Index (code indexing)
            85: 7,  # Implement (code implementation)
            100: 7,  # Complete
        }

    # Index of the step currently shown as active; updated by update_progress
    current_step = 0

    # Define enhanced progress callback function
    def update_progress(progress: int, message: str, error: str = None):
        """Render one progress update (bar, status line, step indicator, sidebar log)."""
        nonlocal current_step

        # Check for abort request: show the abort notice and skip every other update
        if is_abort_requested():
            st.error("🛑 Process aborted by user")
            return

        # Update progress bar
        progress_bar.progress(progress)

        # Display error if present (both in the UI and on stdout)
        if error:
            st.error(f"❌ Error: {error}")
            print(f"❌ Error: {error}")

        # Update status with timestamp
        timestamp = datetime.now().strftime("%H:%M:%S")
        status_text.markdown(f"**[{timestamp}]** {message}")
        print(f"[{timestamp}] {message}")

        # Determine current step: percentages not listed in step_mapping keep the current step
        new_step = step_mapping.get(progress, current_step)
        if new_step != current_step:
            current_step = new_step
            update_step_indicator(
                step_indicators, workflow_steps, current_step, "active"
            )

        # Clamp the index so the sidebar label lookup stays within workflow_steps
        stage_index = (
            min(current_step, len(workflow_steps) - 1) if workflow_steps else 0
        )
        stage_label = (
            workflow_steps[stage_index]["title"] if workflow_steps else "STAGE"
        )
        log_sidebar_event(
            stage_label,
            message,
            extra={"progress": progress},
        )
        time.sleep(0.3)  # Brief pause for users to see progress changes

    # Step 1: Initialization
    if chat_mode:
        update_progress(5, "🚀 Initializing chat-based planning engine...")
    elif enable_indexing:
        update_progress(5, "🚀 Initializing AI research engine and loading models...")
    else:
        update_progress(
            5, "🚀 Initializing AI research engine (Fast mode - indexing disabled)..."
        )
    # Step 0 is marked active explicitly: 5% maps to step 0, which equals the
    # initial current_step, so update_progress itself does not touch the indicator
    update_step_indicator(step_indicators, workflow_steps, 0, "active")

    # Start async processing with progress callback
    with st.spinner("🔄 Processing workflow stages..."):
        # Check for abort before starting
        if is_abort_requested():
            return {"status": "aborted", "message": "Process aborted by user"}

        try:
            # First try using simple async processing method
            result = run_async_task_simple(
                process_input_async(
                    input_source, input_type, enable_indexing, update_progress
                )
            )
        except Exception as e:
            error_msg = f"Primary async method failed: {e}"
            st.warning(error_msg)
            print(f"⚠️ {error_msg}")
            update_progress(0, "Retrying with fallback method...", error_msg)

            # Fallback method: use original thread pool method.
            # A new coroutine object is created for the retry.
            try:
                result = run_async_task(
                    process_input_async(
                        input_source, input_type, enable_indexing, update_progress
                    )
                )
            except Exception as backup_error:
                error_msg = f"Both async methods failed. Error: {backup_error}"
                st.error(error_msg)
                print(f"❌ {error_msg}")
                update_progress(0, "Processing failed", error_msg)
                # Early return: the final-status rendering below is skipped
                return {
                    "status": "error",
                    "error": str(backup_error),
                    "traceback": traceback.format_exc(),
                }

    # Update final status based on results
    if result["status"] == "success":
        # Complete all steps
        update_progress(100, "✅ All processing stages completed successfully!")
        # NOTE(review): the index passed here is len(workflow_steps), one past the
        # last step - presumably this marks every step completed; confirm against
        # update_step_indicator
        update_step_indicator(
            step_indicators, workflow_steps, len(workflow_steps), "completed"
        )

        # Display success information
        st.balloons()  # Add celebration animation
        if chat_mode:
            display_status(
                "🎉 Chat workflow completed! Your requirements have been analyzed and code has been generated.",
                "success",
            )
        elif enable_indexing:
            display_status(
                "🎉 Workflow completed! Your research paper has been successfully processed and code has been generated.",
                "success",
            )
        else:
            display_status(
                "🎉 Fast workflow completed! Your research paper has been processed (indexing skipped for faster processing).",
                "success",
            )
        log_sidebar_event(
            "COMPLETE",
            "All stages completed successfully.",
            level="success",
            extra={
                "input_type": input_type,
                "indexing": enable_indexing,
                "timestamp": datetime.utcnow().isoformat(),
            },
        )

    else:
        # Processing failed (any status other than "success"); the progress bar is reset to 0
        update_progress(0, "❌ Processing failed - see error details below")
        update_step_indicator(step_indicators, workflow_steps, current_step, "error")
        display_status(
            f"❌ Processing encountered an error: {result.get('error', 'Unknown error')}",
            "error",
        )
        # Label the sidebar entry with the step that was active when the failure happened
        failure_stage = (
            workflow_steps[current_step]["title"]
            if workflow_steps and current_step < len(workflow_steps)
            else "ERROR"
        )
        log_sidebar_event(
            failure_stage,
            f"Processing failed: {result.get('error', 'Unknown error')}",
            level="error",
        )

    # Wait a moment for users to see completion status
    time.sleep(2.5)

    return result


def update_session_state_with_result(result: Dict[str, Any], input_type: str):
    """
    Record a workflow result in the Streamlit session state and history.

    On success the result is stored as ``last_result``, ``show_results`` is
    switched on and any ``last_error`` left over from an earlier failed run is
    cleared, so a stale error is not rendered next to the fresh results. For
    every other status (including a missing ``"status"`` key) the error text
    is stored as ``last_error``. In both cases an entry is appended to
    ``st.session_state.results``, which is capped at the 50 newest records.

    Args:
        result: Processing result; ``"status"`` selects the branch and the
            optional ``"error"`` entry supplies the failure text
        input_type: Input type recorded with the history entry
    """
    session = st.session_state
    history_entry = {
        "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
        "input_type": input_type,
    }

    if result.get("status") == "success":
        # Save result to session state
        session.last_result = result
        session.show_results = True
        # Drop the error of a previous run; otherwise it stays visible
        # alongside the new results until the user dismisses it
        session.last_error = None
        history_entry.update(status="success", result=result)
    else:
        # Save error information to session state for display
        error_text = result.get("error", "Unknown error")
        session.last_error = error_text
        history_entry.update(status="error", error=error_text)

    # Save to history
    session.results.append(history_entry)

    # Limit history to maximum 50 records
    if len(session.results) > 50:
        session.results = session.results[-50:]


def cleanup_temp_file(input_source: str, input_type: str):
    """
    Best-effort removal of a temporary input file.

    Nothing happens unless ``input_type`` is ``"file"`` and ``input_source``
    is non-empty. Any failure while importing the file handler or removing
    the file is logged as a warning and never propagated.

    Args:
        input_source: Input source (path of the temporary file)
        input_type: Input type
    """
    # Guard: only "file" inputs with a source have something to remove
    if input_type != "file" or not input_source:
        return

    try:
        from utils.cross_platform_file_handler import get_file_handler

        get_file_handler().safe_remove_file(input_source)
    except Exception as e:
        # Cleanup must never break the caller, so report and move on
        import logging

        module_logger = logging.getLogger(__name__)
        module_logger.warning(f"Failed to cleanup temp file {input_source}: {e}")


async def handle_requirement_analysis_workflow(
    user_input: str, analysis_mode: str, user_answers: Dict[str, str] = None
) -> Dict[str, Any]:
    """
    Run the requirement analysis workflow and return its result.

    Progress reported by the workflow is mirrored into
    ``st.session_state.current_progress`` / ``current_message``. Any exception
    (including a failed import of the workflow module) is converted into an
    error dictionary instead of being raised.

    Args:
        user_input: User initial requirements
        analysis_mode: Analysis mode ("generate_questions" or "summarize_requirements")
        user_answers: User answer dictionary

    Returns:
        The workflow's result dictionary, or
        ``{"status": "error", "error": ..., "message": ...}`` on failure
    """

    def publish_progress(progress: int, message: str):
        # Keep the latest progress values in session state
        st.session_state.current_progress = progress
        st.session_state.current_message = message

    try:
        # Imported lazily; an import failure is reported like any other error
        from workflows.agent_orchestration_engine import (
            execute_requirement_analysis_workflow,
        )

        return await execute_requirement_analysis_workflow(
            user_input=user_input,
            analysis_mode=analysis_mode,
            user_answers=user_answers,
            logger=None,  # No logger is supplied
            progress_callback=publish_progress,
        )
    except Exception as e:
        failure = {"status": "error"}
        failure["error"] = str(e)
        failure["message"] = (
            f"Requirement analysis workflow execution failed: {str(e)}"
        )
        return failure


async def handle_requirement_modification_workflow(
    current_requirements: str, modification_feedback: str
) -> Dict[str, Any]:
    """
    Handle requirement modification workflow

    Creates a ``RequirementAnalysisAgent``, initializes it, asks it to modify
    the requirements and always cleans the agent up again once it was
    initialized - also when the modification call fails. Progress is mirrored
    into ``st.session_state.current_progress`` / ``current_message``.

    Args:
        current_requirements: Current requirement document content
        modification_feedback: User's modification requests and feedback

    Returns:
        ``{"status": "success", "result": ..., "message": ...}`` on success,
        otherwise ``{"status": "error", "error": ..., "message": ...}``.
        Exceptions are never propagated to the caller.
    """
    try:
        # Import required modules
        from workflows.agents.requirement_analysis_agent import RequirementAnalysisAgent

        # Create progress callback function
        def update_progress(progress: int, message: str):
            # Keep the latest progress values in session state
            st.session_state.current_progress = progress
            st.session_state.current_message = message

        update_progress(10, "🔧 Initializing requirement modification agent...")

        # Initialize RequirementAnalysisAgent
        agent = RequirementAnalysisAgent()

        # Initialize agent (LLM is initialized internally)
        await agent.initialize()

        try:
            update_progress(50, "✏️ Modifying requirements based on your feedback...")

            # Modify requirements
            result = await agent.modify_requirements(
                current_requirements=current_requirements,
                modification_feedback=modification_feedback,
            )
        finally:
            # Release the agent even when the modification raised, so a failed
            # request does not leave an initialized agent behind
            await agent.cleanup()

        update_progress(100, "✅ Requirements modification completed!")

        return {
            "status": "success",
            "result": result,
            "message": "Requirements modification completed successfully",
        }

    except Exception as e:
        return {
            "status": "error",
            "error": str(e),
            "message": f"Requirements modification workflow execution failed: {str(e)}",
        }


def handle_guided_mode_processing():
    """
    Run whichever guided-mode jobs are flagged in the session state.

    Three one-shot flags are checked in order: ``questions_generating``,
    ``requirements_generating`` and ``requirements_editing``. Each flag is
    reset before its job runs; the job is executed through
    ``run_async_task_simple`` and its outcome is written back to the session
    state or reported with ``st.error``.
    """
    import json

    state = st.session_state

    # --- 1. Generate clarifying questions -------------------------------
    if state.get("questions_generating", False):
        state.questions_generating = False

        initial_req = state.get("initial_requirement", "")
        if initial_req:
            try:
                result = run_async_task_simple(
                    handle_requirement_analysis_workflow(
                        user_input=initial_req, analysis_mode="generate_questions"
                    )
                )

                if result["status"] != "success":
                    st.error(
                        f"Question generation failed: {result.get('error', 'Unknown error')}"
                    )
                else:
                    # The workflow returns the questions as a JSON string
                    state.generated_questions = json.loads(result["result"])

            except Exception as e:
                st.error(f"Question generation exception: {str(e)}")

    # --- 2. Summarize detailed requirements ------------------------------
    if state.get("requirements_generating", False):
        state.requirements_generating = False

        initial_req = state.get("initial_requirement", "")
        user_answers = state.get("user_answers", {})

        if initial_req:
            try:
                result = run_async_task_simple(
                    handle_requirement_analysis_workflow(
                        user_input=initial_req,
                        analysis_mode="summarize_requirements",
                        user_answers=user_answers,
                    )
                )

                if result["status"] != "success":
                    st.error(
                        f"Requirement summary generation failed: {result.get('error', 'Unknown error')}"
                    )
                else:
                    state.detailed_requirements = result["result"]

            except Exception as e:
                st.error(f"Requirement summary generation exception: {str(e)}")

    # --- 3. Apply user feedback to the requirements ----------------------
    if state.get("requirements_editing", False):
        state.requirements_editing = False
        st.info("🔧 Starting requirement modification process...")

        current_requirements = state.get("detailed_requirements", "")
        edit_feedback = state.get("edit_feedback", "")

        # Both the existing document and the feedback are required
        if current_requirements and edit_feedback:
            try:
                result = run_async_task_simple(
                    handle_requirement_modification_workflow(
                        current_requirements=current_requirements,
                        modification_feedback=edit_feedback,
                    )
                )

                if result["status"] != "success":
                    st.error(
                        f"Requirements modification failed: {result.get('error', 'Unknown error')}"
                    )
                else:
                    state.detailed_requirements = result["result"]
                    state.requirement_analysis_step = "summary"
                    state.edit_feedback = ""
                    st.success("✅ Requirements updated successfully!")
                    st.rerun()

            except Exception as e:
                st.error(f"Requirements modification exception: {str(e)}")


def _background_workflow_runner(
    input_source: str, input_type: str, enable_indexing: bool, session_id: str
):
    """
    Background thread function to run the workflow WITHOUT any Streamlit UI calls
    This runs in a separate thread to avoid blocking Streamlit's main thread
    """
    import logging

    # Store results in a thread-safe way using a simple dict
    if not hasattr(_background_workflow_runner, "results"):
        _background_workflow_runner.results = {}

    # Create a simple progress callback that only logs (no Streamlit UI calls)
    def background_progress_callback(progress: int, message: str):
        # Just log to Python logger, which will be captured by our logging handler
        logging.info(f"Progress: {progress}% - {message}")

    try:
        # Call the core async workflow directly without UI components
        import asyncio
        import nest_asyncio

        nest_asyncio.apply()

        loop = asyncio.new_event_loop()
        asyncio.set_event_loop(loop)
        try:
            result = loop.run_until_complete(
                process_input_async(
                    input_source,
                    input_type,
                    enable_indexing,
                    background_progress_callback,
                )
            )
            _background_workflow_runner.results[session_id] = {
                "status": "completed",
                "result": result,
            }
        finally:
            loop.close()
            asyncio.set_event_loop(None)

    except Exception as e:
        logging.error(f"Background workflow error: {e}", exc_info=True)
        _background_workflow_runner.results[session_id] = {
            "status": "error",
            "error": str(e),
            "traceback": traceback.format_exc(),
        }


def handle_start_processing_button(input_source: str, input_type: str):
    """
    Run the workflow synchronously in response to the start button.

    Marks the session as processing, runs ``handle_processing_workflow``,
    stores the outcome through ``update_session_state_with_result`` and then,
    regardless of success or failure, resets the processing flag, cleans up
    the temporary file and system resources, resets the abort flag and calls
    ``st.rerun()``.

    Args:
        input_source: Input source
        input_type: Input type
    """
    from .components import display_status

    session = st.session_state
    session.processing = True
    session.workflow_start_time = time.time()
    session.active_log_file = None

    # Indexing toggle as currently stored in the session (True when absent)
    enable_indexing = session.get("enable_indexing", True)
    pipeline_details = {
        "input_type": input_type,
        "indexing": enable_indexing,
    }
    log_sidebar_event(
        "SYSTEM",
        "Engaging DeepCode pipeline...",
        extra=pipeline_details,
    )

    try:
        result = handle_processing_workflow(input_source, input_type, enable_indexing)

        # Report the overall outcome
        if result["status"] != "success":
            display_status("Error during processing", "error")
        else:
            display_status("All operations completed successfully! 🎉", "success")

        update_session_state_with_result(result, input_type)

    except Exception as e:
        # Unexpected failure: surface it and record it as an error result
        st.error(f"Unexpected error during processing: {e}")
        update_session_state_with_result(
            {"status": "error", "error": str(e)}, input_type
        )

    finally:
        # Always leave the session in a clean, non-processing state
        session.processing = False
        cleanup_temp_file(input_source, input_type)
        cleanup_resources()
        reset_abort_flag()

        # Rerun to display results or errors
        st.rerun()


def check_background_workflow_status():
    """
    Pick up the result of a finished background workflow, if there is one.

    Does nothing unless the session is marked as processing, has a
    ``workflow_session_id`` and ``_background_workflow_runner.results`` holds
    an entry for that id. Otherwise the entry is removed from the store, the
    outcome is recorded in the session state, resources are cleaned up, the
    workflow tracking values are cleared and ``st.rerun()`` is called.
    """
    from .components import display_status

    session = st.session_state

    if not session.get("processing"):
        return

    session_id = session.get("workflow_session_id")
    if not session_id:
        return

    # The background thread publishes its outcome here once it has finished
    if not hasattr(_background_workflow_runner, "results"):
        return
    if session_id not in _background_workflow_runner.results:
        return

    # Take the entry out of the store so it is handled only once
    workflow_result = _background_workflow_runner.results.pop(session_id)
    outcome = workflow_result["status"]

    if outcome == "completed":
        result = workflow_result["result"]

        if result["status"] != "success":
            display_status("Error during processing", "error")
        else:
            display_status("All operations completed successfully! 🎉", "success")

        update_session_state_with_result(
            result, session.get("workflow_input_type", "")
        )

    elif outcome == "error":
        st.error(f"Unexpected error during processing: {workflow_result['error']}")
        update_session_state_with_result(
            {"status": "error", "error": workflow_result["error"]},
            session.get("workflow_input_type", ""),
        )

    # Clean up
    session.processing = False
    cleanup_temp_file(
        session.get("workflow_input_source"),
        session.get("workflow_input_type"),
    )
    cleanup_resources()

    # Clear workflow tracking variables
    session.workflow_session_id = None
    session.workflow_thread = None
    session.workflow_input_source = None
    session.workflow_input_type = None

    # Rerun to show results
    st.rerun()


def handle_error_display():
    """
    Show the last recorded error together with a "Try Again" button.

    Renders nothing when ``last_error`` is missing or empty. Clicking the
    button clears the error, increments ``task_counter`` and reruns the app.
    """
    if not getattr(st.session_state, "last_error", None):
        return

    st.error(f"❌ Error: {st.session_state.last_error}")

    retry_clicked = st.button(
        "🔄 Try Again", type="secondary", use_container_width=True
    )
    if retry_clicked:
        st.session_state.last_error = None
        st.session_state.task_counter += 1
        st.rerun()


def initialize_session_state():
    """
    Seed every session-state key this UI relies on with its default value.

    Keys that already exist are left untouched. ``ensure_sidebar_logging()``
    is called after ``sidebar_events`` has been seeded and before the
    workflow tracking keys are seeded.
    """
    state = st.session_state

    def seed(defaults):
        # Only fill in keys that are not present yet
        for key, default_value in defaults.items():
            if key not in state:
                state[key] = default_value

    seed(
        {
            # Core processing state
            "processing": False,
            "results": [],
            "current_step": 0,
            "task_counter": 0,
            "show_results": False,
            "last_result": None,
            "last_error": None,
            "enable_indexing": False,  # Indexing is switched off by default
            # Requirement analysis related states
            "requirement_analysis_mode": "direct",  # direct/guided
            "requirement_analysis_step": "input",  # input/questions/summary
            "generated_questions": [],
            "user_answers": {},
            "detailed_requirements": "",
            "initial_requirement": "",
            "questions_generating": False,
            "requirements_generating": False,
            "requirements_confirmed": False,
            "edit_feedback": "",
            "requirements_editing": False,
            "guided_initial_requirement": "",
            "guided_edit_feedback": "",
            "confirmed_requirement_text": None,
            "sidebar_events": [],
        }
    )

    ensure_sidebar_logging()

    seed(
        {
            # Workflow tracking
            "workflow_start_time": None,
            "active_log_file": None,
            "workflow_session_id": None,
            "workflow_thread": None,
            "workflow_input_source": None,
            "workflow_input_type": None,
            "guided_payload": None,
        }
    )


def cleanup_resources():
    """
    Clean up system resources to prevent memory leaks

    Best effort only: every step is isolated so that one failure does not
    stop the remaining steps, and nothing is ever raised to the caller.
    Failures are reported on the module logger at debug level.

    Steps:
        1. Cancel unfinished asyncio tasks when an event loop is running in
           the calling thread.
        2. Run garbage collection.
        3. Pause briefly while other threads are alive so they can finish.
        4. Terminate (and, if needed, kill) child processes that are still
           alive, then stop the multiprocessing resource tracker.
        5. Clear the interpreter's internal caches.
        6. Run garbage collection once more.
    """
    import logging

    log = logging.getLogger(__name__)

    try:
        import asyncio
        import gc
        import multiprocessing
        import sys
        import threading
        import time

        # 1. Clean up asyncio-related resources
        try:
            try:
                loop = asyncio.get_running_loop()
            except RuntimeError:
                # No running event loop in this thread, nothing to cancel
                loop = None

            if loop is not None and not loop.is_closed():
                pending_tasks = [
                    task for task in asyncio.all_tasks(loop) if not task.done()
                ]
                for task in pending_tasks:
                    if not task.cancelled():
                        task.cancel()
                if pending_tasks:
                    # Short pause after requesting cancellation
                    time.sleep(0.1)
        except Exception as e:
            log.debug(f"Asyncio cleanup warning: {e}")

        # 2. Force garbage collection
        gc.collect()

        # 3. Give other threads (anything besides the caller) time to finish
        if threading.active_count() > 1:
            time.sleep(0.5)

        # 4. Clean up multiprocessing resources
        try:
            for child in multiprocessing.active_children():
                if not child.is_alive():
                    continue
                child.terminate()
                child.join(timeout=1.0)
                # If join timed out, force kill
                if child.is_alive():
                    try:
                        child.kill()
                        child.join(timeout=0.5)
                    except Exception as e:
                        log.debug(f"Child process kill warning: {e}")

            # Stop the multiprocessing resource tracker (private API, so every
            # attribute is probed before use)
            try:
                import multiprocessing.resource_tracker

                tracker = getattr(
                    multiprocessing.resource_tracker, "_resource_tracker", None
                )
                if tracker and hasattr(tracker, "_stop"):
                    tracker._stop()
            except Exception as e:
                log.debug(f"Resource tracker cleanup warning: {e}")
        except Exception as e:
            log.debug(f"Multiprocessing cleanup warning: {e}")

        # 5. Clear Python internal caches. sys._clear_type_cache() is
        #    deprecated since Python 3.13 in favour of the more general
        #    sys._clear_internal_caches(), so prefer the latter when present.
        try:
            clear_caches = getattr(sys, "_clear_internal_caches", None) or getattr(
                sys, "_clear_type_cache", None
            )
            if clear_caches is not None:
                clear_caches()
        except Exception as e:
            log.debug(f"Cache cleanup warning: {e}")

        # 6. Final garbage collection
        gc.collect()

    except Exception as e:
        # Cleanup errors must not affect the main flow; keep them in debug logs
        log.debug(f"Resource cleanup warning: {e}")


================================================
FILE: ui/layout.py
================================================
"""
DeepCode Layout Manager
Organizes the visual structure using the Cyber components.
"""

from typing import Optional

import streamlit as st
from .components import (
    display_features,
    display_header,
    footer_component,
    guided_requirement_workflow,
    input_method_selector,
    requirement_mode_selector,
    results_display_component,
    sidebar_control_panel,
    system_status_component,
)
from .styles import get_main_styles
from .handlers import (
    initialize_session_state,
    handle_start_processing_button,
    handle_error_display,
    handle_guided_mode_processing,
)


def setup_page_config():
    """Apply the Streamlit page configuration (title, icon, layout, menu)."""
    menu_links = {
        "Get Help": "https://github.com/deepcode",
        "About": "DeepCode AI Research Engine v3.0",
    }
    page_settings = dict(
        page_title="DeepCode",
        page_icon="assets/logo.png",
        layout="wide",
        initial_sidebar_state="expanded",
        menu_items=menu_links,
    )
    st.set_page_config(**page_settings)


def main_layout():
    """
    Render the whole page: sidebar, header, main content, errors and footer.

    The main content is the results view when ``show_results`` is set and a
    ``last_result`` is stored; otherwise the landing view with the input
    area is rendered.

    Returns:
        An empty dict.
    """
    # Core setup
    initialize_session_state()
    setup_page_config()

    # Inject the Cyber styles
    st.markdown(get_main_styles(), unsafe_allow_html=True)

    # Sidebar, then the header of the main content area
    sidebar_control_panel()
    display_header()

    # Decide which content state to render
    results_requested = st.session_state.get("show_results", False)
    stored_result = st.session_state.get("last_result", None)

    if not (results_requested and stored_result):
        # Landing state
        display_features()
        system_status_component()

        st.markdown('<div style="height: 2rem;"></div>', unsafe_allow_html=True)

        # Input interface
        render_input_area()
    else:
        results_display_component(stored_result, st.session_state.task_counter)

    # Global error handler (always active)
    handle_error_display()

    # Footer
    footer_component()

    return {}


def render_input_area():
    """Draw the requirement input widgets and the action/status row below them.

    Depending on the selected requirement mode the input comes from the
    guided workflow or from the regular input-method selector.  Below the
    input one of the following is shown:

    * a "processing" banner while ``st.session_state.processing`` is set;
    * nothing visible, but processing is started immediately, when guided
      requirements were just confirmed;
    * the START CODING button when there is input to process;
    * an "awaiting input" hint when there is no input (non-guided mode only).
    """
    # Runs before any widget is drawn (presumably advances pending
    # guided-mode work -- the handler lives in another module).
    handle_guided_mode_processing()

    guided = requirement_mode_selector() == "guided"
    busy = st.session_state.get("processing", False)
    confirmed = st.session_state.get("requirements_confirmed", False)

    source: Optional[str] = None
    source_kind: Optional[str] = None

    with st.container():
        if guided:
            # The guided workflow's second return value is not used here;
            # its output is always treated as chat input.
            source, _ = guided_requirement_workflow()
            source_kind = "chat" if source else None
        else:
            source, source_kind = input_method_selector(st.session_state.task_counter)

        st.markdown('<div style="height: 1.5rem;"></div>', unsafe_allow_html=True)

        if busy:
            st.markdown(
                """
                <div style="padding:1.5rem; border:1px solid var(--primary); border-radius:4px; background:rgba(0, 242, 255, 0.05); text-align:center;">
                    <div class="status-dot" style="display:inline-block; margin-right:10px;"></div>
                    <span style="font-family: var(--font-code); color: var(--primary); animation: pulse-glow 2s infinite;">NEURAL PROCESSING ACTIVE...</span>
                </div>
                """,
                unsafe_allow_html=True,
            )

        elif source:
            if guided and confirmed:
                # Confirmed guided requirements start without a button press;
                # clear the confirmation state so it fires only once.
                st.session_state.requirements_confirmed = False
                st.session_state.confirmed_requirement_text = None
                handle_start_processing_button(source, source_kind or "chat")
            else:
                # Centre the button by placing it in the middle of three columns.
                _left, centre, _right = st.columns([1, 2, 1])
                with centre:
                    clicked = st.button(
                        "START CODING 🚀", type="primary", use_container_width=True
                    )
                    if clicked:
                        if guided:
                            st.session_state.confirmed_requirement_text = None
                        handle_start_processing_button(source, source_kind or "chat")

        elif not guided:
            st.markdown(
                """
                <div style="text-align:center; color:rgba(255,255,255,0.3); font-family:var(--font-code); font-size:0.8rem;">
                    AWAITING INPUT SIGNAL...
                </div>
                """,
                unsafe_allow_html=True,
            )


================================================
FILE: ui/sidebar_feed.py
================================================
"""
Sidebar mission feed utilities.
"""

from __future__ import annotations

import logging
from datetime import datetime
from typing import Optional, Dict, Any

import streamlit as st


def _init_event_store():
    """Create the session's ``sidebar_events`` list if it does not exist yet."""
    if "sidebar_events" in st.session_state:
        return
    st.session_state.sidebar_events = []


def log_sidebar_event(
    stage: str,
    message: str,
    level: str = "info",
    extra: Optional[Dict[str, Any]] = None,
):
    """
    Record a sidebar feed event for live mission status display.

    When a Streamlit script-run context is available, the event is appended
    to ``st.session_state.sidebar_events`` (only the 80 most recent events
    are kept).  When there is no context -- e.g. the call comes from a
    background thread -- or anything in the Streamlit path fails, the event
    is written to the root Python logger as ``"[stage] message"`` instead.

    Args:
        stage: Name of the pipeline stage; stored upper-cased.
        message: Human-readable event text.
        level: Severity label stored with the event (default ``"info"``).
        extra: Optional additional payload; stored as ``{}`` when omitted.
    """
    # Imported locally so this function does not depend on edits to the
    # module's import block.
    from datetime import timezone

    try:
        # Check if we're in a Streamlit context
        from streamlit.runtime.scriptrunner import get_script_run_ctx

        if get_script_run_ctx() is None:
            # No script context (background thread): session state is not
            # reachable, so just use Python logging.
            logging.info(f"[{stage}] {message}")
            return

        _init_event_store()
        events = list(st.session_state.sidebar_events)
        events.append(
            {
                # Aware UTC "now": datetime.utcnow() is deprecated since
                # Python 3.12; the formatted wall-clock value is the same.
                "timestamp": datetime.now(timezone.utc).strftime("%H:%M:%S"),
                "stage": stage.upper(),
                "message": message,
                "level": level,
                "extra": extra or {},
            }
        )
        # Cap the feed so session state does not grow without bound.
        st.session_state.sidebar_events = events[-80:]
    except Exception:
        # Best effort: the feed must never break the caller, so fall back
        # to Python logging.
        logging.info(f"[{stage}] {message}")


class SidebarLogHandler(logging.Handler):
    """Forward Python logging records to the sidebar mission feed.

    Each record is passed to ``log_sidebar_event`` with:

    * stage   -- the record's ``stage`` attribute if present, otherwise the
      last dotted component of the logger name, upper-cased;
    * message -- the record formatted by this handler's formatter;
    * level   -- the lower-cased level name;
    * extra   -- logger name, level name and, for records carrying
      ``exc_info``, the formatted traceback under ``"exception"``.

    ``log_sidebar_event`` may itself fall back to ``logging.info``.  With
    this handler attached to the root logger that call would come straight
    back into ``emit``; a per-thread re-entrancy flag drops such nested
    records so the cycle stops after one hop.
    """

    def __init__(self, level: int = logging.NOTSET):
        # Local import keeps this class independent of the module's imports.
        import threading

        super().__init__(level)
        # Per-thread flag: True while this thread is inside emit().
        self._reentrancy = threading.local()

    def emit(self, record: logging.LogRecord):
        if getattr(self._reentrancy, "active", False):
            # Record produced while forwarding another record on this
            # thread -- forwarding it again would recurse without bound.
            return

        self._reentrancy.active = True
        try:
            msg = self.format(record)
            stage = getattr(record, "stage", record.name.split(".")[-1]).upper()
            level = record.levelname.lower()
            payload = {
                "logger": record.name,
                "level": record.levelname,
            }
            if record.exc_info:
                # formatException lives on Formatter, not on Handler.
                formatter = self.formatter or logging.Formatter()
                payload["exception"] = formatter.formatException(record.exc_info)
            log_sidebar_event(stage, msg, level=level, extra=payload)
        except Exception:
            # Standard logging convention: never raise out of emit(); let
            # the logging module report the failure according to
            # logging.raiseExceptions.
            self.handleError(record)
        finally:
            self._reentrancy.active = False


def ensure_sidebar_logging():
    """
    Attach the sidebar logging handler to bridge backend logs into the feed.

    The ``_sidebar_logging_attached`` flag in session state makes repeated
    calls within one session a no-op.  The root logger, however, is shared
    by the whole process, so the handler is only added when no
    ``SidebarLogHandler`` is attached yet; otherwise every additional
    session would stack another handler and each record would be forwarded
    once per handler.
    """
    if st.session_state.get("_sidebar_logging_attached"):
        return

    root_logger = logging.getLogger()
    already_attached = any(
        isinstance(existing, SidebarLogHandler) for existing in root_logger.handlers
    )
    if not already_attached:
        handler = SidebarLogHandler()
        handler.setLevel(logging.INFO)
        # Message text only; stage and level travel as separate event fields.
        handler.setFormatter(logging.Formatter("%(message)s"))
        root_logger.addHandler(handler)

    st.session_state._sidebar_logging_attached = True


================================================
FILE: ui/streamlit_app.py
================================================
"""
DeepCode - AI Research Engine

Streamlit Web Interface Main Application File
"""

import os
import sys

# Disable .pyc file generation.
# The environment variable is only consulted when an interpreter starts, so
# it covers child processes; sys.dont_write_bytecode is what takes effect in
# this already-running interpreter.
os.environ["PYTHONDONTWRITEBYTECODE"] = "1"
sys.dont_write_bytecode = True

# Add parent directory to path for module imports
current_dir = os.path.dirname(os.path.abspath(__file__))
parent_dir = os.path.dirname(current_dir)
if parent_dir not in sys.path:
    sys.path.insert(0, parent_dir)

# Import UI modules
from ui.layout import main_layout


def main():
    """
    Streamlit application entry point.

    The UI itself lives in the ``ui`` package; this function only runs the
    main layout and hands back whatever it returns.  Any additional global
    logic belongs here, around the layout call.
    """
    return main_layout()


# Script entry point: run the app when this file is executed directly.
if __name__ == "__main__":
    main()


================================================
FILE: ui/styles.py
================================================
"""
DeepCode UI Styles - Cyber/AI Tech Theme
Modernized with Glassmorphism, Neon Accents, and Fluid Typography.
"""


def get_main_styles() -> str:
    """Return the app's global stylesheet as a ``<style>...</style>`` block.

    The block declares the theme's CSS custom properties on ``:root``
    (colors, glass/neon effects, font stacks) and then styles the custom
    components (header, feature cards, sidebar feed, system monitor) and a
    set of Streamlit widgets.  The returned string is raw HTML.

    Every ``var(--name)`` used without a fallback refers to a property
    declared in the ``:root`` block of this stylesheet.
    """
    return """
    <style>
        /* ------------------- IMPORT FONTS ------------------- */
        @import url('https://fonts.googleapis.com/css2?family=Orbitron:wght@400;500;700;900&family=JetBrains+Mono:wght@300;400;600&family=Inter:wght@300;400;600;800&display=swap');

        /* ------------------- VARS (CYBER THEME) ------------------- */
        :root {
            /* Colors */
            --bg-dark: #050505;
            --bg-card: rgba(20, 20, 25, 0.6);
            --bg-card-hover: rgba(30, 30, 40, 0.8);

            --primary: #00f2ff;       /* Cyan Neon */
            --secondary: #7000ff;     /* Electric Purple */
            --accent: #ff0055;        /* Cyber Pink */
            --success: #00ff9d;
            --warning: #ffb800;
            --error: #ff2a6d;
            --text-main: #ffffff;
            --text-muted: rgba(255, 255, 255, 0.6);

            /* Glassmorphism */
            --glass-border: 1px solid rgba(255, 255, 255, 0.08);
            --glass-shadow: 0 8px 32px 0 rgba(0, 0, 0, 0.37);
            --neon-shadow: 0 0 10px rgba(0, 242, 255, 0.3), 0 0 20px rgba(0, 242, 255, 0.2);

            /* Typography */
            --font-display: 'Orbitron', sans-serif;
            --font-body: 'Inter', sans-serif;
            --font-code: 'JetBrains Mono', monospace;
        }

        /* ------------------- GLOBAL RESET & ANIMATIONS ------------------- */
        .stApp {
            background-color: var(--bg-dark);
            background-image:
                radial-gradient(circle at 15% 50%, rgba(112, 0, 255, 0.08) 0%, transparent 25%),
                radial-gradient(circle at 85% 30%, rgba(0, 242, 255, 0.08) 0%, transparent 25%);
            font-family: var(--font-body);
            color: var(--text-main);
        }

        h1, h2, h3, h4, h5, h6 {
            font-family: var(--font-display) !important;
            letter-spacing: 1px;
        }

        @keyframes pulse-glow {
            0% { box-shadow: 0 0 0 0 rgba(0, 242, 255, 0.4); }
            70% { box-shadow: 0 0 0 10px rgba(0, 242, 255, 0); }
            100% { box-shadow: 0 0 0 0 rgba(0, 242, 255, 0); }
        }

        /* ------------------- CUSTOM COMPONENTS ------------------- */

        /* Header Design */
        .cyber-header {
            display: flex;
            align-items: center;
            justify-content: space-between;
            padding: 2rem 0;
            border-bottom: 1px solid rgba(255,255,255,0.1);
            margin-bottom: 2rem;
            background: linear-gradient(90deg, rgba(0,0,0,0) 0%, rgba(0, 242, 255, 0.05) 50%, rgba(0,0,0,0) 100%);
        }

        .brand-container {
            display: flex;
            flex-direction: column;
        }

        .brand-title {
            font-family: var(--font-display);
            font-size: 3.5rem;
            font-weight: 900;
            background: linear-gradient(90deg, #fff, var(--primary));
            -webkit-background-clip: text;
            -webkit-text-fill-color: transparent;
            letter-spacing: -2px;
            text-shadow: 0 0 30px rgba(0, 242, 255, 0.2);
        }

        .brand-subtitle {
            font-family: var(--font-code);
            color: var(--text-muted);
            font-size: 0.9rem;
            letter-spacing: 3px;
            text-transform: uppercase;
            margin-top: 5px;
        }

        .status-indicator {
            display: flex;
            align-items: center;
            gap: 0.8rem;
            padding: 0.6rem 1.2rem;
            background: rgba(0, 255, 157, 0.05);
            border: 1px solid rgba(0, 255, 157, 0.2);
            border-radius: 4px;
            color: var(--success);
            font-family: var(--font-code);
            font-size: 0.8rem;
            text-transform: uppercase;
            letter-spacing: 1px;
        }

        .status-dot {
            width: 8px;
            height: 8px;
            background: var(--success);
            border-radius: 50%;
            box-shadow: 0 0 10px var(--success);
            animation: pulse-glow 2s infinite;
        }

        /* Feature Cards */
        .feature-grid {
            display: grid;
            grid-template-columns: repeat(auto-fit, minmax(280px, 1fr));
            gap: 1.5rem;
            margin-bottom: 3rem;
        }

        .cyber-card {
            background: var(--bg-card);
            backdrop-filter: blur(12px);
            border: var(--glass-border);
            padding: 2rem;
            border-radius: 2px; /* More angular for tech feel */
            transition: all 0.3s ease;
            position: relative;
            overflow: hidden;
            height: 100%;
        }

        .cyber-card::before {
            content: '';
            position: absolute;
            top: 0;
            left: 0;
            width: 3px;
            height: 0%;
            background: var(--primary);
            transition: height 0.3s ease;
        }

        .cyber-card:hover::before {
            height: 100%;
        }

        .cyber-card:hover {
            transform: translateY(-5px);
            background: var(--bg-card-hover);
            box-shadow: var(--neon-shadow);
            border-color: rgba(0, 242, 255, 0.4);
        }

        .card-icon {
            font-size: 2rem;
            margin-bottom: 1.5rem;
            color: var(--primary);
            filter: drop-shadow(0 0 10px rgba(0, 242, 255, 0.5));
        }

        .card-title {
            font-family: var(--font-display);
            font-weight: 700;
            font-size: 1.2rem;
            margin-bottom: 0.8rem;
            color: white;
        }

        .card-desc {
            font-family: var(--font-body);
            font-size: 0.95rem;
            color: var(--text-muted);
            line-height: 1.6;
        }

        /* ------------------- STREAMLIT OVERRIDES ------------------- */

        /* Sidebar */
        [data-testid="stSidebar"] {
            background-color: #020203;
            border-right: 1px solid rgba(255,255,255,0.05);
        }
        [data-testid="stSidebar"] h1, [data-testid="stSidebar"] h2, [data-testid="stSidebar"] h3 {
            color: var(--primary) !important;
        }

        /* Inputs (Text, Select, Area) */
        .stTextInput > div > div > input,
        .stSelectbox > div > div > div,
        .stTextArea > div > div > textarea {
            background-color: rgba(255,255,255,0.03);
            border: 1px solid rgba(255,255,255,0.1);
            color: white;
            border-radius: 4px;
            font-family: var(--font-code);
        }

        .stTextInput > div > div > input:focus,
        .stTextArea > div > div > textarea:focus {
            border-color: var(--primary);
            box-shadow: 0 0 15px rgba(0, 242, 255, 0.1);
            background-color: rgba(0,0,0,0.3);
        }

        /* Tabs */
        .stTabs [data-baseweb="tab-list"] {
            gap: 20px;
            border-bottom: 1px solid rgba(255,255,255,0.1);
        }
        .stTabs [data-baseweb="tab"] {
            background-color: transparent;
            border-radius: 4px 4px 0 0;
            color: var(--text-muted);
            font-family: var(--font-display);
            padding: 10px 20px;
        }
        .stTabs [aria-selected="true"] {
            background-color: rgba(0, 242, 255, 0.1);
            color: var(--primary);
            border-bottom: 2px solid var(--primary);
        }

        /* Buttons */
        .stButton > button {
            background: transparent;
            border: 1px solid var(--primary);
            border-radius: 4px;
            color: var(--primary);
            font-family: var(--font-display);
            font-weight: 600;
            letter-spacing: 2px;
            transition: all 0.3s;
            text-transform: uppercase;
            padding: 0.5rem 2rem;
            box-shadow: 0 0 10px rgba(0, 242, 255, 0.1);
        }
        .stButton > button:hover {
            background: var(--primary);
            color: #000;
            box-shadow: 0 0 25px rgba(0, 242, 255, 0.6);
            transform: translateY(-2px);
        }

        /* Primary Action Button Override */
        button[kind="primary"] {
            background: linear-gradient(90deg, var(--secondary) 0%, var(--primary) 100%);
            border: none;
            color: white !important;
        }

        /* Expanders */
        .streamlit-expanderHeader {
            background-color: rgba(255,255,255,0.02);
            border-radius: 4px;
            border: 1px solid rgba(255,255,255,0.05);
        }

        /* Code Blocks */
        code {
            font-family: var(--font-code) !important;
            color: var(--primary) !important;
            background-color: rgba(0,0,0,0.3) !important;
        }

        /* Sidebar feed */
        .sidebar-feed-card {
            border: 1px solid rgba(255,255,255,0.08);
            border-left: 3px solid var(--primary);
            padding: 0.75rem;
            border-radius: 4px;
            margin-bottom: 0.75rem;
            background: rgba(255,255,255,0.02);
            box-shadow: 0 4px 12px rgba(0,0,0,0.25);
        }
        .sidebar-feed-card .stage-line {
            display: flex;
            justify-content: space-between;
            font-family: var(--font-display);
            font-size: 0.8rem;
            letter-spacing: 1px;
            margin-bottom: 0.35rem;
        }
        .sidebar-feed-card .stage {
            color: var(--primary);
        }
        .sidebar-feed-card .time {
            color: rgba(255,255,255,0.4);
            font-family: var(--font-code);
        }
        .sidebar-feed-card .message {
            font-size: 0.9rem;
            color: rgba(255,255,255,0.85);
            line-height: 1.4;
        }
        .sidebar-feed-card.level-success {
            border-left-color: var(--success);
        }
        .sidebar-feed-card.level-error {
            border-left-color: var(--error);
        }
        .sidebar-feed-card.level-warning {
            border-left-color: var(--warning);
        }

        .system-monitor-card {
            border: 1px solid rgba(255,255,255,0.08);
            border-radius: 6px;
            padding: 1rem;
            background: rgba(0,0,0,0.25);
            margin-bottom: 1.5rem;
            box-shadow: 0 6px 18px rgba(0,0,0,0.35);
        }
        .system-monitor-card .status-grid {
            display: grid;
            grid-template-columns: repeat(2, minmax(0, 1fr));
            gap: 0.75rem;
        }
        .system-monitor-card .status-chip {
            border: 1px solid rgba(255,255,255,0.08);
            border-radius: 4px;
            padding: 0.5rem 0.75rem;
            font-size: 0.8rem;
            letter-spacing: 1px;
            text-transform: uppercase;
            display: flex;
            justify-content: space-between;
        }
        .system-monitor-card .status-chip span:last-child {
            color: var(--primary);
            font-family: var(--font-display);
        }
        .system-monitor-card .latest-stage {
            margin-top: 1rem;
            font-size: 0.85rem;
            color: rgba(255,255,255,0.7);
        }
        .system-monitor-card .latest-stage strong {
            color: var(--text-primary, var(--text-main));
        }

        /* Footer area override */
        footer {visibility: hidden;}

    </style>
    """


================================================
FILE: utils/__init__.py
================================================
"""
Utils package for paper processing tools.
"""

from .file_processor import FileProcessor
from .dialogue_logger import (
    DialogueLogger,
    create_dialogue_logger,
    extract_paper_id_from_path,
)

__all__ = [
    "FileProcessor",
    "DialogueLogger",
    "create_dialogue_logger",
    "extract_paper_id_from_path",
]


================================================
FILE: utils/cli_interface.py
================================================
#!/usr/bin/env python3
"""
Professional CLI Interface Module
Contains the logo, color definitions, and interface components.
"""

import os
import time
import platform
from pathlib import Path
from typing import Optional
import tkinter as tk
from tkinter import filedialog


class Colors:
    """ANSI SGR escape sequences used to style terminal output.

    Each attribute is a ready-to-print escape string; ``ENDC`` resets all
    styling.
    """

    # Bright semantic colors
    HEADER = "\x1b[95m"
    OKBLUE = "\x1b[94m"
    OKCYAN = "\x1b[96m"
    OKGREEN = "\x1b[92m"
    WARNING = "\x1b[93m"
    FAIL = "\x1b[91m"

    # Reset and text attributes
    ENDC = "\x1b[0m"
    BOLD = "\x1b[1m"
    UNDERLINE = "\x1b[4m"

    # Palette used for the gradient in the logo and banners
    PURPLE = "\x1b[35m"
    MAGENTA = "\x1b[95m"
    BLUE = "\x1b[34m"
    CYAN = "\x1b[36m"
    GREEN = "\x1b[32m"
    YELLOW = "\x1b[33m"


class CLIInterface:
    """Professional CLI interface with modern styling"""

    def __init__(self):
        """Set up interface state and probe whether a tkinter GUI is usable.

        ``tkinter_available`` ends up False when tkinter cannot be imported
        or when creating, hiding or destroying a Tk root window fails (some
        systems ship tkinter but have no display).
        """
        self.uploaded_file = None
        self.is_running = True

        try:
            import tkinter as tk

            # Build and immediately tear down a hidden root window.
            probe_window = tk.Tk()
            probe_window.withdraw()
            probe_window.destroy()
        except Exception:
            gui_usable = False
        else:
            gui_usable = True

        self.tkinter_available = gui_usable

    def clear_screen(self):
        """Clear the terminal via the platform's shell command."""
        if os.name == "nt":
            command = "cls"
        else:
            command = "clear"
        os.system(command)

    def print_logo(self):
        """Print a beautiful ASCII logo with gradient colors and tech elements"""
        # 确保每行总共79个字符（不包括颜色代码），边框完美对齐
        logo = f"""
{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                                                                               ║
║  {Colors.BOLD}{Colors.MAGENTA}██████╗  ███████╗██████╗ ██████╗  ██████╗     █████╗ ██╗{Colors.CYAN}                ║
║  {Colors.BOLD}{Colors.PURPLE}██╔══██╗ ██╔════╝██╔══██╗██╔══██╗██╔═══██╗   ██╔══██╗██║{Colors.CYAN}                ║
║  {Colors.BOLD}{Colors.BLUE}██████╔╝ █████╗  ██████╔╝██████╔╝██║   ██║   ███████║██║{Colors.CYAN}                ║
║  {Colors.BOLD}{Colors.OKBLUE}██╔══██╗ ██╔══╝  ██╔═══╝ ██╔══██╗██║   ██║   ██╔══██║██║{Colors.CYAN}                ║
║  {Colors.BOLD}{Colors.OKCYAN}██║  ██║ ███████╗██║     ██║  ██║╚██████╔╝   ██║  ██║██║{Colors.CYAN}                ║
║  {Colors.BOLD}{Colors.GREEN}╚═╝  ╚═╝ ╚══════╝╚═╝     ╚═╝  ╚═╝ ╚═════╝    ╚═╝  ╚═╝╚═╝{Colors.CYAN}                ║
║                                                                               ║
║  {Colors.BOLD}{Colors.YELLOW}┌─────────────────────────────────────────────────────────────────────────┐{Colors.CYAN}   ║
║  {Colors.BOLD}{Colors.YELLOW}│  🤖 AI-POWERED RESEARCH PAPER REPRODUCTION ENGINE 🚀                  │{Colors.CYAN}   ║
║  {Colors.BOLD}{Colors.YELLOW}│  ⚡ INTELLIGENT • AUTOMATED • CUTTING-EDGE ⚡                        │{Colors.CYAN}   ║
║  {Colors.BOLD}{Colors.YELLOW}└─────────────────────────────────────────────────────────────────────────┘{Colors.CYAN}   ║
║                                                                               ║
║  {Colors.BOLD}{Colors.GREEN}💎 CORE CAPABILITIES:{Colors.ENDC}                                                        {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Neural PDF Analysis & Code Extraction                                 {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Advanced Document Processing Engine                                   {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Multi-Format Support (PDF•DOCX•PPTX•HTML)                           {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Smart File Upload Interface                                          {Colors.CYAN}║
║    {Colors.BOLD}{Colors.OKCYAN}▶ Automated Repository Management                                      {Colors.CYAN}║
║                                                                               ║
║  {Colors.BOLD}{Colors.PURPLE}🔬 TECH STACK: Python•AI•MCP•Docling•LLM                                   {Colors.CYAN}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(logo)

    def print_welcome_banner(self):
        """Print welcome banner with version info"""
        banner = f"""
{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                              WELCOME TO ReproAI                              ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║                                                                               ║
║  {Colors.YELLOW}Version: 2.0.0 | Build: Professional Edition                                 {Colors.CYAN}║
║  {Colors.GREEN}Status: Ready | Engine: Initialized                                          {Colors.CYAN}║
║  {Colors.PURPLE}Author: AI Research Team | License: MIT                                      {Colors.CYAN}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(banner)

    def print_separator(self, char="═", length=79, color=Colors.CYAN):
        """Print ``char`` repeated ``length`` times in ``color``, then reset styling."""
        rule = char * length
        print(f"{color}{rule}{Colors.ENDC}")

    def print_status(self, message: str, status_type: str = "info"):
        """Print ``message`` in bold behind a colored icon for ``status_type``.

        Unknown status types are rendered with the "info" style.
        """
        prefixes = {
            "success": f"{Colors.OKGREEN}✅",
            "error": f"{Colors.FAIL}❌",
            "warning": f"{Colors.WARNING}⚠️ ",
            "info": f"{Colors.OKBLUE}ℹ️ ",
            "processing": f"{Colors.YELLOW}⏳",
            "upload": f"{Colors.PURPLE}📁",
            "download": f"{Colors.CYAN}📥",
            "analysis": f"{Colors.MAGENTA}🔍",
        }

        try:
            prefix = prefixes[status_type]
        except KeyError:
            prefix = prefixes["info"]

        print(f"{prefix} {Colors.BOLD}{message}{Colors.ENDC}")

    def create_menu(self):
        """Create an interactive menu"""
        menu = f"""
{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                                MAIN MENU                                      ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║                                                                               ║
║  {Colors.OKGREEN}🌐 [U] Process URL       {Colors.CYAN}│  {Colors.PURPLE}📁 [F] Upload File    {Colors.CYAN}│  {Colors.FAIL}❌ [Q] Quit{Colors.CYAN}         ║
║                                                                               ║
║  {Colors.YELLOW}📝 Enter a research paper URL (arXiv, IEEE, ACM, etc.)                      {Colors.CYAN}║
║  {Colors.YELLOW}   or upload a PDF/DOC file for intelligent analysis                        {Colors.CYAN}║
║                                                                               ║
║  {Colors.OKCYAN}💡 Tip: Press 'F' to open file browser or 'U' to enter URL manually        {Colors.CYAN}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(menu)

    def get_user_input(self):
        """Show the styled choice prompt and return the reply, stripped and lower-cased."""
        prompt = f"\n{Colors.BOLD}{Colors.OKCYAN}➤ Your choice: {Colors.ENDC}"
        print(prompt, end="")
        reply = input()
        return reply.strip().lower()

    def upload_file_gui(self) -> Optional[str]:
        """Modern file upload interface using tkinter with cross-platform compatibility"""
        # Check if tkinter is available
        if not self.tkinter_available:
            self.print_status("GUI file dialog not available on this system", "warning")
            self.print_status("Using manual file path input instead", "info")
            return self._get_manual_file_path()

        def select_file():
            try:
                # Create a hidden root window
                root = tk.Tk()
                root.withdraw()  # Hide the main window

                # Platform-specific configurations
                system = platform.system()

                if system == "Darwin":  # macOS
                    # macOS specific settings
                    try:
                        root.call("wm", "attributes", ".", "-topmost", True)
                    except Exception:
                        pass

                    # macOS compatible file types
                    file_types = [
                        ("PDF Files", ".pdf"),
                        ("Word Documents", ".docx .doc"),
                        ("PowerPoint Files", ".pptx .ppt"),
                        ("HTML Files", ".html .htm"),
                        ("Text Files", ".txt .md"),
                        ("All Files", ".*"),
                    ]
                else:
                    # Windows and Linux
                    root.attributes("-topmost", True)

                    # Windows/Linux compatible file types
                    file_types = [
                        ("PDF Files", "*.pdf"),
                        ("Word Documents", "*.docx;*.doc"),
                        ("PowerPoint Files", "*.pptx;*.ppt"),
                        ("HTML Files", "*.html;*.htm"),
                        ("Text Files", "*.txt;*.md"),
                        ("All Files", "*.*"),
                    ]

                # Set window title
                root.title("Repro-AI - File Selector")

                try:
                    # Open file dialog with platform-appropriate settings
                    file_path = filedialog.askopenfilename(
                        title="Select Research Paper File",
                        filetypes=file_types,
                        initialdir=os.getcwd(),
                    )
                except Exception as e:
                    self.print_status(f"File dialog error: {str(e)}", "error")
                    return None
                finally:
                    # Clean up
                    try:
                        root.destroy()
                    except Exception:
                        pass

                return file_path

            except Exception as e:
                # Fallback: destroy root if it exists
                try:
                    if "root" in locals():
                        root.destroy()
                except Exception:
                    pass

                # Print error and suggest alternative
                self.print_status(f"GUI file dialog failed: {str(e)}", "error")
                self.print_status(
                    "Please use manual file path input instead", "warning"
                )
                return self._get_manual_file_path()

        self.print_status("Opening file browser dialog...", "upload")
        file_path = select_file()

        if file_path:
            # Validate file
            if not os.path.exists(file_path):
                self.print_status("File not found!", "error")
                return None

            file_size = os.path.getsize(file_path) / (1024 * 1024)  # Size in MB
            file_ext = Path(file_path).suffix.lower()

            # Display file info with beautiful formatting
            file_name = Path(file_path).name
            directory = str(Path(file_path).parent)

            # Truncate long paths for display
            if len(file_name) > 50:
                display_name = file_name[:47] + "..."
            else:
                display_name = file_name

            if len(directory) > 49:
                display_dir = "..." + directory[-46:]
            else:
                display_dir = directory

            print(f"""
{Colors.OKGREEN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                               FILE SELECTED                                   ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║                                                                               ║
║  {Colors.BOLD}📄 File Name:{Colors.ENDC} {Colors.CYAN}{display_name:<50}{Colors.OKGREEN}║
║  {Colors.BOLD}📁 Directory:{Colors.ENDC} {Colors.YELLOW}{display_dir:<49}{Colors.OKGREEN}║
║  {Colors.BOLD}📊 File Size:{Colors.ENDC} {Colors.PURPLE}{file_size:.2f} MB{Colors.OKGREEN}                                      ║
║  {Colors.BOLD}🔖 File Type:{Colors.ENDC} {Colors.MAGENTA}{file_ext.upper():<50}{Colors.OKGREEN}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
""")

            self.print_status(f"File successfully selected: {file_name}", "success")
            return file_path
        else:
            self.print_status("No file selected", "warning")
            return None

    def _get_manual_file_path(self) -> Optional[str]:
        """Prompt for a typed (or drag-and-dropped) file path.

        Surrounding whitespace and quote characters are removed and ``~`` is
        expanded before the path is checked.

        Returns:
            The cleaned path when it exists, otherwise None (also when the
            user enters nothing).
        """
        # Section header box
        print(
            f"\n{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗"
        )
        print(
            "║                           MANUAL FILE INPUT                                   ║"
        )
        print(
            f"╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}"
        )

        print(f"\n{Colors.YELLOW}📝 Supported file types:{Colors.ENDC}")
        supported_lines = (
            f"   {Colors.CYAN}• PDF files (.pdf)",
            f"   {Colors.CYAN}• Word documents (.docx, .doc)",
            f"   {Colors.CYAN}• PowerPoint files (.pptx, .ppt)",
            f"   {Colors.CYAN}• HTML files (.html, .htm)",
            f"   {Colors.CYAN}• Text files (.txt, .md){Colors.ENDC}",
        )
        for line in supported_lines:
            print(line)

        print(
            f"\n{Colors.BOLD}{Colors.OKCYAN}📁 Enter file path (or drag & drop): {Colors.ENDC}",
            end="",
        )
        # Trim whitespace first, then any wrapping quotes.
        candidate = input().strip().strip("\"'")

        if not candidate:
            self.print_status("No file path provided", "warning")
            return None

        # Expand a leading ~ to the user's home directory.
        candidate = os.path.expanduser(candidate)

        if not os.path.exists(candidate):
            self.print_status("File not found at the specified path", "error")
            return None

        self.print_status(f"File found: {os.path.basename(candidate)}", "success")
        return candidate

    def get_url_input(self) -> str:
        """
        Show example URLs, read one URL from stdin and report how it was classified.

        Returns:
            The stripped URL as typed, or an empty string when nothing was entered.
            The URL is returned whether or not it matches a known source; only
            the status message differs.
        """
        banner_rows = (
            f"\n{Colors.BOLD}{Colors.CYAN}╔═══════════════════════════════════════════════════════════════════════════════╗",
            "║                              URL INPUT                                        ║",
            f"╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}",
        )
        for row in banner_rows:
            print(row)

        print(f"\n{Colors.YELLOW}📝 Supported URL Examples:{Colors.ENDC}")
        examples = (
            "• arXiv: https://arxiv.org/pdf/2403.00813",
            "• arXiv: @https://arxiv.org/pdf/2403.00813",
            "• IEEE:  https://ieeexplore.ieee.org/document/...",
            "• ACM:   https://dl.acm.org/doi/...",
            # The last example also resets the terminal colour.
            f"• Direct PDF: https://example.com/paper.pdf{Colors.ENDC}",
        )
        for example in examples:
            print(f"   {Colors.CYAN}{example}")

        print(
            f"\n{Colors.BOLD}{Colors.OKCYAN}🌐 Enter paper URL: {Colors.ENDC}", end=""
        )
        url = input().strip()

        if not url:
            self.print_status("No URL provided", "warning")
            return ""

        # Substring heuristics only; this decides the status message, nothing else.
        lowered = url.lower()
        recognised = False
        for marker in ("arxiv.org", "ieee", "acm.org", ".pdf", "researchgate"):
            if marker in lowered:
                recognised = True
                break

        if recognised:
            self.print_status(f"URL received: {url}", "success")
        else:
            self.print_status("URL appears valid, proceeding...", "info")
        return url

    def show_progress_bar(self, message: str, duration: float = 2.0):
        """
        Animate a 50-cell progress bar from 0% to 100% over roughly ``duration`` seconds.

        The bar is redrawn in place using a carriage return and changes colour
        as it fills (below 33%, below 66%, and the rest).

        Args:
            message: Text printed above the bar and repeated in the completion line
            duration: Total animation time in seconds; negative values are
                treated as 0 (no delay)
        """
        print(f"\n{Colors.YELLOW}{message}{Colors.ENDC}")

        bar_length = 50
        # time.sleep() raises ValueError for negative values, so clamp at zero.
        frame_delay = max(duration, 0.0) / bar_length

        for i in range(bar_length + 1):
            percent = (i / bar_length) * 100
            filled = "█" * i
            empty = "░" * (bar_length - i)

            # Color gradient effect
            if percent < 33:
                color = Colors.FAIL
            elif percent < 66:
                color = Colors.WARNING
            else:
                color = Colors.OKGREEN

            print(
                f"\r{color}[{filled}{empty}] {percent:6.1f}%{Colors.ENDC}",
                end="",
                flush=True,
            )

            # There are bar_length + 1 frames but only bar_length gaps between
            # them; pausing after the final frame would overshoot `duration`.
            if i < bar_length:
                time.sleep(frame_delay)

        print(f"\n{Colors.OKGREEN}✅ {message} completed!{Colors.ENDC}\n")

    def show_spinner(self, message: str, duration: float = 1.0):
        """
        Display a braille spinner next to ``message`` for about ``duration`` seconds.

        A new frame is drawn every 0.1 seconds on the same terminal line; when
        the time is up the line is overwritten with a "Done!" confirmation.
        """
        frames = "⠋⠙⠹⠸⠼⠴⠦⠧⠇⠏"
        deadline = time.time() + duration

        frame_index = 0
        while time.time() < deadline:
            glyph = frames[frame_index % len(frames)]
            print(
                f"\r{Colors.CYAN}{glyph} {Colors.BOLD}{message}{Colors.ENDC}",
                end="",
                flush=True,
            )
            time.sleep(0.1)
            frame_index += 1

        print(f"\r{Colors.OKGREEN}✅ {Colors.BOLD}{message} - Done!{Colors.ENDC}")

    def print_results_header(self):
        """Print results section header"""
        header = f"""
{Colors.OKGREEN}╔═══════════════════════════════════════════════════════════════════════════════╗
║                             PROCESSING RESULTS                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(header)

    def print_error_box(self, title: str, error_msg: str):
        """
        Print an error title and message inside a red box.

        Values that fit on one line (at most 66 characters, no line breaks) are
        rendered exactly as before. Longer or multi-line values are wrapped onto
        continuation rows aligned under the first character of the value, so the
        right-hand border is no longer pushed out of place.

        Args:
            title: Short error title; converted with str() so exception objects
                can be passed directly
            error_msg: Error description; converted with str() as well

        Note:
            Padding is based on character count, so double-width characters
            (for example CJK text) can still shift the border.
        """
        import textwrap  # local import: only this method needs it

        field_width = 66
        continuation = " " * len("Title: ")

        def _field_rows(label, value):
            """Return the box rows for one labelled field, wrapping when needed."""
            text = str(value)
            if len(text) <= field_width and "\n" not in text:
                chunks = [text]
            else:
                chunks = []
                for paragraph in text.splitlines():
                    # wrap() returns [] for blank paragraphs; keep them as an
                    # empty row so the message layout is preserved.
                    chunks.extend(textwrap.wrap(paragraph, width=field_width) or [""])

            rows = []
            for index, chunk in enumerate(chunks):
                lead = label if index == 0 else continuation
                rows.append(
                    f"║  {Colors.BOLD}{lead}{chunk:<{field_width}}{Colors.FAIL}║"
                )
            return rows

        lines = [
            "",
            f"{Colors.FAIL}╔═══════════════════════════════════════════════════════════════════════════════╗",
            "║                                  ERROR                                        ║",
            "╠═══════════════════════════════════════════════════════════════════════════════╣",
            "║                                                                               ║",
        ]
        lines.extend(_field_rows("Title: ", title))
        lines.extend(_field_rows("Error: ", error_msg))
        lines.extend(
            [
                "║                                                                               ║",
                f"╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}",
                "",
            ]
        )
        print("\n".join(lines))

    def print_goodbye(self):
        """Print goodbye message"""
        goodbye = f"""
{Colors.BOLD}{Colors.YELLOW}╔═══════════════════════════════════════════════════════════════════════════════╗
║                                GOODBYE!                                       ║
╠═══════════════════════════════════════════════════════════════════════════════╣
║                                                                               ║
║  {Colors.CYAN}Thank you for using ReproAI!                                               {Colors.YELLOW}║
║  {Colors.GREEN}🌟 Star us on GitHub: https://github.com/your-repo                        {Colors.YELLOW}║
║  {Colors.PURPLE}📧 Contact: support@reproai.com                                          {Colors.YELLOW}║
║  {Colors.MAGENTA}🐛 Report issues: https://github.com/your-repo/issues                    {Colors.YELLOW}║
║                                                                               ║
║  {Colors.OKGREEN}✨ Happy coding! See you next time! ✨                                   {Colors.YELLOW}║
║                                                                               ║
╚═══════════════════════════════════════════════════════════════════════════════╝{Colors.ENDC}
"""
        print(goodbye)

    def ask_continue(self) -> bool:
        """
        Prompt the user to continue or quit.

        Returns:
            False when the answer is "q", "quit" or "exit" (case-insensitive,
            surrounding whitespace ignored); True for anything else, including
            an empty line.
        """
        prompt = f"\n{Colors.BOLD}{Colors.CYAN}Press Enter to continue or 'q' to quit: {Colors.ENDC}"
        print(prompt, end="")

        answer = input().strip().lower()
        wants_to_quit = answer in ("q", "quit", "exit")
        return not wants_to_quit


================================================
FILE: utils/cross_platform_file_handler.py
================================================
#!/usr/bin/env python3
"""
Cross-Platform File Handler
跨平台文件处理模块

This module provides robust file handling utilities that work consistently
across Windows, Linux, and macOS, with proper error handling and cleanup.

Key features:
- Safe temporary file creation with proper cleanup
- Cross-platform path handling
- Atomic file operations
- Comprehensive error handling and logging
"""

import os
import shutil
import tempfile
import logging
import atexit
import platform
from pathlib import Path
from typing import Optional, Union
from contextlib import contextmanager


class CrossPlatformFileHandler:
    """
    Robust cross-platform file handler with proper error handling.

    Handles common pitfalls in file operations across different operating systems:
    - Windows file handle issues
    - Path separator inconsistencies
    - Permission problems
    - Temporary file cleanup

    Attributes are plain instance fields:
    - ``logger``: logger used for all status messages
    - ``temp_files``: list of Path objects created by create_safe_temp_file
      that have not been removed yet
    - ``platform``: value of platform.system() captured at construction time
    """

    def __init__(self, logger: Optional[logging.Logger] = None):
        """
        Initialize the file handler.

        Args:
            logger: Optional logger instance for tracking operations
        """
        self.logger = logger or self._create_default_logger()
        self.temp_files = []  # Track temporary files for cleanup
        self.platform = platform.system()

        # Register cleanup handler so tracked temp files are removed at exit
        atexit.register(self.cleanup_all_temp_files)

        self.logger.info("CrossPlatformFileHandler initialized on %s", self.platform)

    def _create_default_logger(self) -> logging.Logger:
        """Create a default logger if none provided."""
        logger = logging.getLogger(__name__)
        # Only attach a handler once; the module-level logger is shared by
        # every instance that does not receive its own logger.
        if not logger.handlers:
            handler = logging.StreamHandler()
            formatter = logging.Formatter(
                "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
            )
            handler.setFormatter(formatter)
            logger.addHandler(handler)
            logger.setLevel(logging.INFO)
        return logger

    @staticmethod
    def normalize_path(path: Union[str, Path]) -> Path:
        """
        Normalize a path to use proper separators for the current OS.

        For string input both ``\\`` and ``/`` are treated as separators and
        replaced with ``os.sep``. The result is always resolved to an
        absolute path.

        Args:
            path: Input path (string or Path object)

        Returns:
            Normalized, resolved Path object

        Example:
            >>> handler = CrossPlatformFileHandler()
            >>> handler.normalize_path("data/files\\test.txt")
            PosixPath('/current/dir/data/files/test.txt')  # On Linux/Mac
        """
        if isinstance(path, str):
            # Replace all path separators with the OS-specific one
            path = path.replace("\\", os.sep).replace("/", os.sep)
        return Path(path).resolve()

    def create_safe_temp_file(
        self,
        suffix: str = "",
        prefix: str = "deepcode_",
        content: Optional[bytes] = None,
    ) -> Path:
        """
        Create a temporary file with proper cross-platform handling.

        This method addresses Windows file handle issues by:
        1. Properly closing the file before returning
        2. Using mkstemp so the file is not deleted on close
        3. Tracking the file for later cleanup

        If writing the content fails, the partially created file is removed
        again so that no untracked file is left behind.

        Args:
            suffix: File suffix (e.g., ".pdf", ".txt")
            prefix: File prefix for identification
            content: Optional content to write to the file

        Returns:
            Path to the created temporary file

        Raises:
            IOError: If file creation or writing fails (the original
                exception is attached as ``__cause__``)
        """
        try:
            fd, temp_path = tempfile.mkstemp(
                suffix=suffix,
                prefix=prefix,
                dir=None,  # Use system default temp directory
                text=False,  # Always use binary mode for consistency
            )
        except Exception as e:
            self.logger.error("Failed to create temporary file: %s", e)
            raise IOError(f"Temporary file creation failed: {e}") from e

        temp_path_obj = Path(temp_path)

        try:
            # A buffered file object writes the whole payload (a bare
            # os.write() may write only part of it) and always closes the
            # descriptor when the block exits.
            with os.fdopen(fd, "wb") as stream:
                if content is not None:
                    stream.write(content)
        except Exception as e:
            # The file exists on disk but is not tracked yet: remove it now,
            # otherwise nothing would ever clean it up.
            try:
                temp_path_obj.unlink()
            except OSError:
                pass  # best effort; the original error is the one to report
            self.logger.error("Failed to create temporary file: %s", e)
            raise IOError(f"Temporary file creation failed: {e}") from e

        if content is not None:
            self.logger.info(
                "Created temp file with content: %s (%d bytes)",
                temp_path_obj.name,
                len(content),
            )
        else:
            self.logger.info("Created empty temp file: %s", temp_path_obj.name)

        # Track for cleanup
        self.temp_files.append(temp_path_obj)

        return temp_path_obj

    @contextmanager
    def temp_directory(self, prefix: str = "deepcode_"):
        """
        Context manager for temporary directory with automatic cleanup.

        Args:
            prefix: Directory prefix for identification

        Yields:
            Path to temporary directory

        Example:
            >>> with handler.temp_directory() as temp_dir:
            ...     # Use temp_dir
            ...     print(temp_dir)
            # Directory automatically cleaned up after context
        """
        temp_dir = Path(tempfile.mkdtemp(prefix=prefix))
        self.logger.info("Created temporary directory: %s", temp_dir)
        try:
            yield temp_dir
        finally:
            # ignore_errors=True means rmtree never raises, so success has to
            # be checked explicitly instead of relying on an exception.
            shutil.rmtree(temp_dir, ignore_errors=True)
            if temp_dir.exists():
                self.logger.warning(
                    "Failed to clean up temporary directory %s", temp_dir
                )
            else:
                self.logger.info("Cleaned up temporary directory: %s", temp_dir)

    def _resolve_transfer_paths(
        self,
        source: Union[str, Path],
        destination: Union[str, Path],
        overwrite: bool,
    ):
        """Normalize and validate the source/destination pair of a copy or move.

        Returns:
            Tuple ``(source_path, dest_path)`` of normalized Path objects

        Raises:
            FileNotFoundError: If source file doesn't exist
            FileExistsError: If destination exists and overwrite is False
        """
        source_path = self.normalize_path(source)
        dest_path = self.normalize_path(destination)

        if not source_path.exists():
            raise FileNotFoundError(f"Source file not found: {source_path}")

        if dest_path.exists() and not overwrite:
            raise FileExistsError(
                f"Destination already exists: {dest_path}. "
                f"Use overwrite=True to replace."
            )

        return source_path, dest_path

    def safe_copy_file(
        self,
        source: Union[str, Path],
        destination: Union[str, Path],
        preserve_metadata: bool = True,
        overwrite: bool = False,
    ) -> Path:
        """
        Safely copy a file with proper error handling.

        The source file is left untouched; use safe_move_file only when the
        original must disappear.

        Args:
            source: Source file path
            destination: Destination file path
            preserve_metadata: Whether to preserve file metadata (timestamps, etc.)
            overwrite: Whether to overwrite if destination exists

        Returns:
            Path to the destination file

        Raises:
            FileNotFoundError: If source file doesn't exist
            FileExistsError: If destination exists and overwrite=False
            IOError: If copy operation fails (original exception chained)
        """
        source_path, dest_path = self._resolve_transfer_paths(
            source, destination, overwrite
        )

        try:
            # Ensure destination directory exists
            dest_path.parent.mkdir(parents=True, exist_ok=True)

            # copy2 also copies timestamps/permissions; copy only the content
            # and permission bits.
            if preserve_metadata:
                shutil.copy2(source_path, dest_path)
            else:
                shutil.copy(source_path, dest_path)

            self.logger.info(
                "Copied file: %s -> %s (%d bytes)",
                source_path.name,
                dest_path,
                source_path.stat().st_size,
            )

            return dest_path

        except Exception as e:
            self.logger.error(
                "Failed to copy file from %s to %s: %s", source_path, dest_path, e
            )
            raise IOError(f"File copy failed: {e}") from e

    def safe_move_file(
        self,
        source: Union[str, Path],
        destination: Union[str, Path],
        overwrite: bool = False,
    ) -> Path:
        """
        Safely move a file (only if explicitly needed).

        Note: Prefer safe_copy_file to preserve originals.

        Args:
            source: Source file path
            destination: Destination file path
            overwrite: Whether to overwrite if destination exists

        Returns:
            Path to the destination file

        Raises:
            FileNotFoundError: If source file doesn't exist
            FileExistsError: If destination exists and overwrite=False
            IOError: If move operation fails (original exception chained)
        """
        source_path, dest_path = self._resolve_transfer_paths(
            source, destination, overwrite
        )

        try:
            # Ensure destination directory exists
            dest_path.parent.mkdir(parents=True, exist_ok=True)

            # Move file
            shutil.move(str(source_path), str(dest_path))

            self.logger.info("Moved file: %s -> %s", source_path.name, dest_path)

            return dest_path

        except Exception as e:
            self.logger.error(
                "Failed to move file from %s to %s: %s", source_path, dest_path, e
            )
            raise IOError(f"File move failed: {e}") from e

    def _untrack_temp_file(self, resolved_path: Path) -> None:
        """Drop every tracked temp file that refers to ``resolved_path``."""
        remaining = []
        for entry in self.temp_files:
            try:
                # Tracked entries are stored as returned by mkstemp, which may
                # go through a symlinked temp directory; compare resolved
                # locations so such entries still match.
                same = entry == resolved_path or entry.resolve() == resolved_path
            except (OSError, RuntimeError):
                same = False
            if not same:
                remaining.append(entry)
        # Update in place so external references to the list stay valid.
        self.temp_files[:] = remaining

    def safe_remove_file(self, file_path: Union[str, Path]) -> bool:
        """
        Safely remove a file with proper error handling.

        Args:
            file_path: Path to file to remove

        Returns:
            True if file was removed, False if it didn't exist or removal failed
        """
        path = self.normalize_path(file_path)

        if not path.exists():
            self.logger.debug("File already removed or doesn't exist: %s", path)
            return False

        try:
            # On Windows, ensure file is not read-only
            if self.platform == "Windows":
                os.chmod(path, 0o777)

            path.unlink()
            self.logger.info("Removed file: %s", path.name)

            # Remove from tracking list if present
            self._untrack_temp_file(path)

            return True

        except PermissionError as e:
            self.logger.warning("Permission denied when removing %s: %s", path, e)
            return False
        except Exception as e:
            self.logger.error("Failed to remove file %s: %s", path, e)
            return False

    def cleanup_all_temp_files(self):
        """
        Clean up all tracked temporary files.

        This is automatically called on program exit via atexit,
        but can also be called manually.
        """
        if not self.temp_files:
            return

        self.logger.info("Cleaning up %d temporary files...", len(self.temp_files))

        cleaned = 0
        failed = 0

        # Iterate over a copy: safe_remove_file edits self.temp_files.
        for temp_file in list(self.temp_files):
            if self.safe_remove_file(temp_file):
                cleaned += 1
            else:
                failed += 1

        self.logger.info(
            "Cleanup complete: %d files removed, %d failed", cleaned, failed
        )

        self.temp_files.clear()

    def get_system_temp_dir(self) -> Path:
        """
        Get the system temporary directory with proper cross-platform handling.

        Returns:
            Path to system temporary directory
        """
        return Path(tempfile.gettempdir())

    def create_workspace_directory(
        self, base_dir: Union[str, Path], workspace_name: str, clean: bool = False
    ) -> Path:
        """
        Create a workspace directory with proper structure.

        Args:
            base_dir: Base directory for workspace
            workspace_name: Name of the workspace
            clean: Whether to clean the directory if it exists

        Returns:
            Path to the created workspace directory
        """
        base_path = self.normalize_path(base_dir)
        workspace_path = base_path / workspace_name

        if clean and workspace_path.exists():
            self.logger.info("Cleaning existing workspace: %s", workspace_path)
            shutil.rmtree(workspace_path, ignore_errors=True)

        workspace_path.mkdir(parents=True, exist_ok=True)
        self.logger.info("Created workspace directory: %s", workspace_path)

        return workspace_path


# Singleton instance for convenience
_file_handler_instance: Optional[CrossPlatformFileHandler] = None


def get_file_handler(
    logger: Optional[logging.Logger] = None,
) -> CrossPlatformFileHandler:
    """
    Return the shared CrossPlatformFileHandler, creating it on first use.

    Args:
        logger: Optional logger instance; only used when the shared instance
            is created, later calls return the existing instance unchanged

    Returns:
        CrossPlatformFileHandler instance
    """
    global _file_handler_instance

    handler = _file_handler_instance
    if handler is not None:
        return handler

    handler = CrossPlatformFileHandler(logger)
    _file_handler_instance = handler
    return handler


# Demo: run this module directly to exercise the handler end to end
if __name__ == "__main__":
    # Show INFO-level messages from the handler while the demo runs
    logging.basicConfig(level=logging.INFO)

    handler = CrossPlatformFileHandler()

    rule = "=" * 70

    print(f"\n{rule}")
    print("Cross-Platform File Handler - Demo")
    print(f"{rule}\n")

    print(f"Platform: {handler.platform}")
    print(f"System temp directory: {handler.get_system_temp_dir()}")

    # Step 1: a tracked temporary file with some content
    print("\n1. Creating temporary file...")
    demo_content = b"Test content for cross-platform file handling"
    temp_file = handler.create_safe_temp_file(suffix=".txt", content=demo_content)
    print(f"   Created: {temp_file}")

    # Step 2: a temporary directory that is removed when the block exits
    print("\n2. Using temporary directory...")
    with handler.temp_directory() as temp_dir:
        print(f"   Temp directory: {temp_dir}")
        test_file = temp_dir / "test.txt"
        test_file.write_text("Hello from temp directory!")
        print(f"   Created file in temp dir: {test_file}")
    print("   Temp directory automatically cleaned up")

    # Step 3: mixed separators all normalize to the same absolute path
    print("\n3. Path normalization:")
    for raw_path in (
        "data/files\\test.txt",
        "data\\files/test.txt",
        "data\\files\\test.txt",
    ):
        print(f"   {raw_path} -> {handler.normalize_path(raw_path)}")

    # Step 4: remove the file created in step 1
    print("\n4. Cleaning up tracked files...")
    handler.cleanup_all_temp_files()

    print(f"\n{rule}")
    print("Demo completed successfully!")
    print(f"{rule}\n")


================================================
FILE: utils/dialogue_logger.py
================================================
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Comprehensive Dialogue Logger for Code Implementation Workflow
Logs complete conversation rounds with detailed formatting and paper-specific organization
"""

import json
import os
from datetime import datetime
from pathlib import Path
from typing import Dict, Any, List


class DialogueLogger:
    """
    Comprehensive dialogue logger for code implementation workflow
    Captures complete conversation rounds with proper formatting and organization
    """

    def __init__(self, paper_id: str, base_path: str = None):
        """
        Initialize dialogue logger for a specific paper

        Args:
            paper_id: Paper identifier (e.g., "1", "2", etc.)
            base_path: Base path for logs (defaults to agent_folders structure)
        """
        self.paper_id = paper_id
        self.base_path = (
            base_path
            or "/data2/bjdwhzzh/project-hku/Code-Agent2.0/Code-Agent/deepcode-mcp/agent_folders"
        )
        self.log_directory = os.path.join(
            self.base_path, "papers", str(paper_id), "logs"
        )

        # Create log directory if it doesn't exist
        Path(self.log_directory).mkdir(parents=True, exist_ok=True)

        # Session tracking (initialize before log file creation)
        self.round_counter = 0
        self.session_start_time = datetime.now()
        self.current_round_data = {}

        # Generate log filename with timestamp
        timestamp = self.session_start_time.strftime("%Y%m%d_%H%M%S")
        self.log_filename = f"dialogue_log_{timestamp}.md"
        self.log_filepath = os.path.join(self.log_directory, self.log_filename)

        # Initialize log file with header
        self._initialize_log_file()

        print(f"📝 Dialogue Logger initialized for Paper {paper_id}")
        print(f"📁 Log file: {self.log_filepath}")

    def _initialize_log_file(self):
        """Initialize the log file with header information"""
        header = f"""# Code Implementation Dialogue Log

**Paper ID:** {self.paper_id}
**Session Start:** {self.session_start_time.strftime('%Y-%m-%d %H:%M:%S')}
**Log File:** {self.log_filename}

---

## Session Overview

This log contains the complete conversation rounds between the user and assistant during the code implementation workflow. Each round includes:

- System prompts and user messages
- Assistant responses with tool calls
- Tool execution results
- Implementation progress markers

---

"""
        try:
            with open(self.log_filepath, "w", encoding="utf-8") as f:
                f.write(header)
        except Exception as e:
            print(f"⚠️ Failed to initialize log file: {e}")

    def start_new_round(
        self, round_type: str = "implementation", context: Dict[str, Any] = None
    ):
        """
        Start a new dialogue round

        Args:
            round_type: Type of round (implementation, summary, error_handling, etc.)
            context: Additional context information (may include 'iteration' to sync with workflow)
        """
        # Use iteration from context if provided, otherwise increment round_counter
        if context and "iteration" in context:
            self.round_counter = context["iteration"]
        else:
            self.round_counter += 1

        self.current_round_data = {
            "round_number": self.round_counter,
            "round_type": round_type,
            "start_time": datetime.now(),
            "context": context or {},
            "messages": [],
            "tool_calls": [],
            "results": [],
            "metadata": {},
        }

        print(f"🔄 Starting Round {self.round_counter}: {round_type}")

    def log_system_prompt(self, prompt: str, prompt_type: str = "system"):
        """
        Log system prompt or instructions

        Args:
            prompt: System prompt content
            prompt_type: Type of prompt (system, instruction, etc.)
        """
        if not self.current_round_data:
            self.start_new_round("system_setup")

        self.current_round_data["messages"].append(
            {
                "role": "system",
                "type": prompt_type,
                "content": prompt,
                "timestamp": datetime.now().isoformat(),
            }
        )

    def log_user_message(self, message: str, message_type: str = "user_input"):
        """
        Log user message

        Args:
            message: User message content
            message_type: Type of message (user_input, feedback, guidance, etc.)
        """
        if not self.current_round_data:
            self.start_new_round("user_interaction")

        self.current_round_data["messages"].append(
            {
                "role": "user",
                "type": message_type,
                "content": message,
                "timestamp": datetime.now().isoformat(),
            }
        )

    def log_assistant_response(
        self, response: str, response_type: str = "assistant_response"
    ):
        """
        Log assistant response

        Args:
            response: Assistant response content
            response_type: Type of response (assistant_response, analysis, etc.)
        """
        if not self.current_round_data:
            self.start_new_round("assistant_interaction")

        self.current_round_data["messages"].append(
            {
                "role": "assistant",
                "type": response_type,
                "content": response,
                "timestamp": datetime.now().isoformat(),
            }
        )

    def log_tool_calls(self, tool_calls: List[Dict[str, Any]]):
        """
        Log tool calls made by the assistant

        Args:
            tool_calls: List of tool calls with id, name, and input
        """
        if not self.current_round_data:
            self.start_new_round("tool_execution")

        for tool_call in tool_calls:
            self.current_round_data["tool_calls"].append(
                {
                    "id": tool_call.get("id", ""),
                    "name": tool_call.get("name", ""),
                    "input": tool_call.get("input", {}),
                    "timestamp": datetime.now().isoformat(),
                }
            )

    def log_tool_results(self, tool_results: List[Dict[str, Any]]):
        """
        Log tool execution results

        Args:
            tool_results: List of tool results with tool_name and result
        """
        if not self.current_round_data:
            self.start_new_round("tool_results")

        for result in tool_results:
            self.current_round_data["results"].append(
                {
                    "tool_name": result.get("tool_name", ""),
                    "result": result.get("result", ""),
                    "timestamp": datetime.now().isoformat(),
                }
            )

    def log_metadata(self, key: str, value: Any):
        """
        Log metadata information

        Args:
            key: Metadata key
            value: Metadata value
        """
        if not self.current_round_data:
            self.start_new_round("metadata")

        self.current_round_data["metadata"][key] = value

    def log_memory_optimization(
        self,
        messages_before: List[Dict],
        messages_after: List[Dict],
        optimization_stats: Dict[str, Any],
        approach: str = "memory_optimization",
    ):
        """
        Log memory optimization details including before/after message content

        Args:
            messages_before: Messages before optimization
            messages_after: Messages after optimization
            optimization_stats: Statistics about the optimization
            approach: Optimization approach used
        """
        if not self.current_round_data:
            self.start_new_round("memory_optimization")

        # Calculate what was removed/kept
        removed_count = len(messages_before) - len(messages_after)
        compression_ratio = (
            (removed_count / len(messages_before) * 100) if messages_before else 0
        )

        # Log the optimization details
        optimization_data = {
            "approach": approach,
            "messages_before_count": len(messages_before),
            "messages_after_count": len(messages_after),
            "messages_removed_count": removed_count,
            "compression_ratio": f"{compression_ratio:.1f}%",
            "optimization_stats": optimization_stats,
            "timestamp": datetime.now().isoformat(),
        }

        # Store the optimization data
        if "memory_optimizations" not in self.current_round_data:
            self.current_round_data["memory_optimizations"] = []

        self.current_round_data["memory_optimizations"].append(
            {
                "optimization_data": optimization_data,
                "messages_before": messages_before,
                "messages_after": messages_after,
            }
        )

        # Log metadata
        self.log_metadata("memory_optimization", optimization_data)

        print(
            f"🧹 Memory optimization logged: {len(messages_before)} → {len(messages_after)} messages ({compression_ratio:.1f}% compression)"
        )

    def complete_round(self, summary: str = "", status: str = "completed"):
        """
        Close out the active round and hand it to the log writer

        The round is stamped with its end time, elapsed seconds, summary and
        status, written via ``_write_round_to_log`` and then cleared from
        memory. When no round is active only a warning is printed.

        Args:
            summary: Round summary
            status: Round completion status
        """
        round_data = self.current_round_data
        if not round_data:
            print("⚠️ No active round to complete")
            return

        finished_at = datetime.now()
        round_data["end_time"] = finished_at
        round_data["duration"] = (
            finished_at - round_data["start_time"]
        ).total_seconds()
        round_data.update(summary=summary, status=status)

        # Write the round out, then report completion
        self._write_round_to_log()
        print(f"✅ Round {self.round_counter} completed: {status}")

        # Reset so the next round starts from an empty record
        self.current_round_data = {}

    def _write_round_to_log(self):
        """
        Append the current round to the log file in markdown format

        Sections are emitted in this order, each only when the round holds
        data for it: header, context, messages, tool calls, tool results,
        memory optimizations, metadata, summary. The round always ends with a
        ``---`` separator.

        Writing is best-effort: any exception is reported with ``print`` and
        not re-raised.
        """

        def _preview(message, limit=3000):
            """Return the message content as text, cut to ``limit`` characters."""
            content = message.get("content", "")
            if content is None:
                content = ""
            elif not isinstance(content, str):
                # Content may be structured (e.g. a list of blocks); log its repr
                # instead of failing the whole round on len()/slicing.
                content = str(content)
            if len(content) > limit:
                return content[:limit] + "...[truncated]"
            return content

        def _write_previews(handle, messages):
            """Write one numbered bullet per message, followed by a blank line."""
            for position, message in enumerate(messages, 1):
                role = message.get("role", "unknown")
                handle.write(f"- **{role} {position}:** {_preview(message)}\n")
            handle.write("\n")

        try:
            with open(self.log_filepath, "a", encoding="utf-8") as f:
                round_data = self.current_round_data

                # Round header
                f.write(
                    f"\n## Round {round_data['round_number']}: {round_data['round_type'].title()}\n\n"
                )
                f.write(
                    f"**Start Time:** {round_data['start_time'].strftime('%Y-%m-%d %H:%M:%S')}\n"
                )
                f.write(
                    f"**End Time:** {round_data['end_time'].strftime('%Y-%m-%d %H:%M:%S')}\n"
                )
                f.write(f"**Duration:** {round_data['duration']:.2f} seconds\n")
                f.write(f"**Status:** {round_data['status']}\n\n")

                # Context information
                if round_data.get("context"):
                    f.write("### Context\n\n")
                    for key, value in round_data["context"].items():
                        f.write(f"- **{key}:** {value}\n")
                    f.write("\n")

                # Messages
                if round_data.get("messages"):
                    f.write("### Messages\n\n")
                    for i, msg in enumerate(round_data["messages"], 1):
                        role_emoji = {
                            "system": "🔧",
                            "user": "👤",
                            "assistant": "🤖",
                        }.get(msg["role"], "📝")
                        f.write(
                            f"#### {role_emoji} {msg['role'].title()} Message {i}\n\n"
                        )
                        f.write(f"**Type:** {msg['type']}\n")
                        f.write(f"**Timestamp:** {msg['timestamp']}\n\n")
                        f.write("```\n")
                        # str() is a no-op for text and keeps non-text content loggable
                        f.write(str(msg["content"]))
                        f.write("\n```\n\n")

                # Tool calls
                if round_data.get("tool_calls"):
                    f.write("### Tool Calls\n\n")
                    for i, tool_call in enumerate(round_data["tool_calls"], 1):
                        f.write(f"#### 🛠️ Tool Call {i}: {tool_call['name']}\n\n")
                        f.write(f"**ID:** {tool_call['id']}\n")
                        f.write(f"**Timestamp:** {tool_call['timestamp']}\n\n")
                        f.write("**Input:**\n")
                        f.write("```json\n")
                        f.write(
                            json.dumps(tool_call["input"], indent=2, ensure_ascii=False)
                        )
                        f.write("\n```\n\n")

                # Tool results
                if round_data.get("results"):
                    f.write("### Tool Results\n\n")
                    for i, result in enumerate(round_data["results"], 1):
                        f.write(f"#### 📊 Result {i}: {result['tool_name']}\n\n")
                        f.write(f"**Timestamp:** {result['timestamp']}\n\n")
                        f.write("**Result:**\n")
                        f.write("```\n")
                        f.write(str(result["result"]))
                        f.write("\n```\n\n")

                # Memory Optimizations
                if round_data.get("memory_optimizations"):
                    f.write("### Memory Optimizations\n\n")
                    for i, opt in enumerate(round_data["memory_optimizations"], 1):
                        opt_data = opt["optimization_data"]
                        messages_before = opt["messages_before"]
                        messages_after = opt["messages_after"]

                        f.write(f"#### 🧹 Memory Optimization {i}\n\n")
                        f.write(f"**Approach:** {opt_data['approach']}\n")
                        f.write(
                            f"**Messages Before:** {opt_data['messages_before_count']}\n"
                        )
                        f.write(
                            f"**Messages After:** {opt_data['messages_after_count']}\n"
                        )
                        f.write(
                            f"**Messages Removed:** {opt_data['messages_removed_count']}\n"
                        )
                        f.write(
                            f"**Compression Ratio:** {opt_data['compression_ratio']}\n"
                        )
                        f.write(f"**Timestamp:** {opt_data['timestamp']}\n\n")

                        # Show optimization stats
                        if opt_data.get("optimization_stats"):
                            f.write("**Optimization Statistics:**\n")
                            f.write("```json\n")
                            f.write(
                                json.dumps(
                                    opt_data["optimization_stats"],
                                    indent=2,
                                    ensure_ascii=False,
                                )
                            )
                            f.write("\n```\n\n")

                        # Show messages before optimization (limited to last 5 for readability)
                        if messages_before:
                            f.write("**Messages Before Optimization (last 5):**\n\n")
                            _write_previews(f, messages_before[-5:])

                        # Show messages after optimization
                        if messages_after:
                            f.write("**Messages After Optimization:**\n\n")
                            _write_previews(f, messages_after)

                        # Show what was removed: anything present before that no
                        # longer appears afterwards. The kept messages are not
                        # necessarily a suffix of the original list, so a slice
                        # by length would report the wrong entries.
                        removed_messages = [
                            msg for msg in messages_before if msg not in messages_after
                        ]
                        if removed_messages:
                            f.write(
                                f"**Messages Removed ({len(removed_messages)}):**\n\n"
                            )
                            # Show last 3 removed
                            _write_previews(f, removed_messages[-3:])

                        f.write("\n")

                # Metadata
                if round_data.get("metadata"):
                    f.write("### Metadata\n\n")
                    for key, value in round_data["metadata"].items():
                        if (
                            key != "memory_optimization"
                        ):  # Skip memory optimization metadata as it's shown above
                            f.write(f"- **{key}:** {value}\n")
                    f.write("\n")

                # Summary
                if round_data.get("summary"):
                    f.write("### Summary\n\n")
                    f.write(round_data["summary"])
                    f.write("\n\n")

                # Separator
                f.write("---\n\n")

        except Exception as e:
            print(f"⚠️ Failed to write round to log: {e}")

    def log_complete_exchange(
        self,
        system_prompt: str = "",
        user_message: str = "",
        assistant_response: str = "",
        tool_calls: List[Dict] = None,
        tool_results: List[Dict] = None,
        round_type: str = "exchange",
        context: Dict = None,
        summary: str = "",
    ):
        """
        Record one whole exchange as a single round

        Opens a round, logs every part of the exchange that was supplied
        (empty parts are skipped) and completes the round.

        Args:
            system_prompt: System prompt (optional)
            user_message: User message
            assistant_response: Assistant response
            tool_calls: Tool calls made
            tool_results: Tool execution results
            round_type: Type of round
            context: Additional context
            summary: Round summary
        """
        self.start_new_round(round_type, context)

        # Payload / logging-method pairs, in the order they are recorded.
        # The method is looked up only when its payload is non-empty.
        recording_plan = (
            (system_prompt, "log_system_prompt"),
            (user_message, "log_user_message"),
            (assistant_response, "log_assistant_response"),
            (tool_calls, "log_tool_calls"),
            (tool_results, "log_tool_results"),
        )
        for payload, method_name in recording_plan:
            if payload:
                getattr(self, method_name)(payload)

        self.complete_round(summary)

    def get_session_stats(self) -> Dict[str, Any]:
        """
        Summarise the session so far

        Returns:
            Dict with the paper id, ISO-formatted session start, number of
            rounds, log file path and seconds elapsed since the session began
        """
        started = self.session_start_time

        stats: Dict[str, Any] = {}
        stats["paper_id"] = self.paper_id
        stats["session_start"] = started.isoformat()
        stats["total_rounds"] = self.round_counter
        stats["log_file"] = self.log_filepath
        # Elapsed time is measured at call time, not at the last completed round
        stats["session_duration"] = (datetime.now() - started).total_seconds()
        return stats

    def finalize_session(self, final_summary: str = ""):
        """
        Append the closing session summary to the log file

        Writes the round total, elapsed session time and end timestamp,
        followed by the optional final summary and an end-of-session marker.
        A write failure is reported with ``print`` and not raised.

        Args:
            final_summary: Final session summary
        """
        try:
            with open(self.log_filepath, "a", encoding="utf-8") as log_file:
                emit = log_file.write

                emit("\n## Session Summary\n\n")
                emit(f"**Total Rounds:** {self.round_counter}\n")

                elapsed = datetime.now() - self.session_start_time
                emit(f"**Session Duration:** {elapsed.total_seconds():.2f} seconds\n")

                closed_at = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
                emit(f"**End Time:** {closed_at}\n\n")

                if final_summary:
                    emit("### Final Summary\n\n")
                    emit(final_summary)
                    emit("\n\n")

                emit("---\n\n")
                emit("*End of Session*\n")

        except Exception as err:
            print(f"⚠️ Failed to finalize session: {err}")

        # Printed whether or not the write above succeeded
        print(f"🎯 Session finalized: {self.round_counter} rounds logged")


# Utility functions for easy integration
def create_dialogue_logger(paper_id: str, base_path: str = None) -> DialogueLogger:
    """
    Build a DialogueLogger for one paper

    Convenience wrapper that forwards both arguments, unchanged and
    positionally, to the ``DialogueLogger`` constructor.

    Args:
        paper_id: Paper identifier
        base_path: Base path for logs

    Returns:
        DialogueLogger instance
    """
    dialogue_logger = DialogueLogger(paper_id, base_path)
    return dialogue_logger


def extract_paper_id_from_path(path: str) -> str:
    """
    Extract paper ID from a file path

    The paper ID is the path component that directly follows the first
    ``papers`` component, e.g. ``"/data2/.../papers/1/initial_plan.txt"``
    yields ``"1"``. Both ``/`` and ``\\`` are accepted as separators, and
    empty components (doubled or trailing separators) are ignored so they
    are never returned as an ID.

    Args:
        path: File path containing paper information

    Returns:
        Paper ID string, or "unknown" when no component follows "papers"
    """
    # Normalise Windows separators, then drop the empty pieces produced by
    # leading, trailing or repeated separators.
    components = [piece for piece in path.replace("\\", "/").split("/") if piece]

    # Walk adjacent pairs: the component after the first "papers" is the ID.
    for marker, candidate in zip(components, components[1:]):
        if marker == "papers":
            return candidate
    return "unknown"


# Example usage
if __name__ == "__main__":
    # Manual smoke test: one full exchange, one memory-optimization round,
    # then session finalization.
    demo_logger = DialogueLogger("1")

    # Round 1: a complete exchange recorded through the single-call helper
    demo_tool_calls = [
        {"id": "1", "name": "write_file", "input": {"filename": "transformer.py"}}
    ]
    demo_tool_results = [
        {"tool_name": "write_file", "result": "File created successfully"}
    ]
    demo_logger.log_complete_exchange(
        system_prompt="You are a code implementation assistant.",
        user_message="Implement the transformer model",
        assistant_response="I'll implement the transformer model step by step.",
        tool_calls=demo_tool_calls,
        tool_results=demo_tool_results,
        round_type="implementation",
        context={"files_implemented": 1},
        summary="Successfully implemented transformer model",
    )

    # Round 2: memory optimization logging
    demo_logger.start_new_round(
        "memory_optimization", {"trigger_reason": "write_file_detected"}
    )

    # Mock conversation before the optimization ...
    transcript = [
        ("user", "Original message 1"),
        ("assistant", "Original response 1"),
        ("user", "Original message 2"),
        ("assistant", "Original response 2"),
        ("user", "Original message 3"),
    ]
    history_before = [{"role": role, "content": text} for role, text in transcript]

    # ... and after it: the middle user/assistant pair has been dropped
    history_after = [dict(history_before[index]) for index in (0, 1, 4)]

    # Mock optimization stats
    demo_stats = {
        "implemented_files_tracked": 2,
        "current_round": 5,
        "concise_mode_active": True,
    }

    demo_logger.log_memory_optimization(
        messages_before=history_before,
        messages_after=history_after,
        optimization_stats=demo_stats,
        approach="clear_after_write_file",
    )

    demo_logger.complete_round("Memory optimization test completed")

    # Close the session
    demo_logger.finalize_session(
        "Test session with memory optimization logging completed successfully"
    )

    print("✅ Dialogue logger test completed with memory optimization")


================================================
FILE: utils/file_processor.py
================================================
"""
File processing utilities for handling paper files and related operations.
"""

import json
import os
import re
from typing import Dict, List, Optional, Union


class FileProcessor:
    """
    A class to handle file processing operations including path extraction and file reading.
    """

    @staticmethod
    def extract_file_path(file_info: Union[str, Dict]) -> Optional[str]:
        """
        Extract paper directory path from the input information.

        Args:
            file_info: Either a JSON string or a dictionary containing file information

        Returns:
            Optional[str]: The extracted paper directory path or None if not found
        """
        try:
            # Handle direct file path input
            if isinstance(file_info, str):
                # Check if it's a file path (existing or not)
                if file_info.endswith(
                    (".md", ".pdf", ".txt", ".docx", ".doc", ".html", ".htm")
                ):
                    # It's a file path, return the directory
                    return os.path.dirname(os.path.abspath(file_info))
                elif os.path.exists(file_info):
                    if os.path.isfile(file_info):
                        return os.path.dirname(os.path.abspath(file_info))
                    elif os.path.isdir(file_info):
                        return os.path.abspath(file_info)

                # Try to parse as JSON
                try:
                    info_dict = json.loads(file_info)
                except json.JSONDecodeError:
                    # Try to extract JSON from text
                    info_dict = FileProcessor.extract_json_from_text(file_info)
                    if not info_dict:
                        # If not JSON and doesn't look like a file path, raise error
                        raise ValueError(
                            f"Input is neither a valid file path nor JSON: {file_info}"
                        )
            else:
                info_dict = file_info

            # Extract paper path from dictionary
            paper_path = info_dict.get("paper_path")
            if not paper_path:
                raise ValueError("No paper_path found in input dictionary")

            # Get the directory path instead of the file path
            paper_dir = os.path.dirname(paper_path)

            # Convert to absolute path if relative
            if not os.path.isabs(paper_dir):
                paper_dir = os.path.abspath(paper_dir)

            return paper_dir

        except (AttributeError, TypeError) as e:
            raise ValueError(f"Invalid input format: {str(e)}")

    @staticmethod
    def find_markdown_file(directory: str) -> Optional[str]:
        """
        Find the first markdown file in the given directory.

        Args:
            directory: Directory path to search

        Returns:
            Optional[str]: Path to the markdown file or None if not found
        """
        if not os.path.isdir(directory):
            return None

        for file in os.listdir(directory):
            if file.endswith(".md"):
                return os.path.join(directory, file)
        return None

    @staticmethod
    def parse_markdown_sections(content: str) -> List[Dict[str, Union[str, int, List]]]:
        """
        Parse markdown content and organize it by sections based on headers.

        Args:
            content: The markdown content to parse

        Returns:
            List[Dict]: A list of sections, each containing:
                - level: The header level (1-6)
                - title: The section title
                - content: The section content
                - subsections: List of subsections
        """
        # Split content into lines
        lines = content.split("\n")
        sections = []
        current_section = None
        current_content = []

        for line in lines:
            # Check if line is a header
            header_match = re.match(r"^(#{1,6})\s+(.+)$", line)

            if header_match:
                # If we were building a section, save its content
                if current_section is not None:
                    current_section["content"] = "\n".join(current_content).strip()
                    sections.append(current_section)

                # Start a new section
                level = len(header_match.group(1))
                title = header_match.group(2).strip()
                current_section = {
                    "level": level,
                    "title": title,
                    "content": "",
                    "subsections": [],
                }
                current_content = []
            elif current_section is not None:
                current_content.append(line)

        # Don't forget to save the last section
        if current_section is not None:
            current_section["content"] = "\n".join(current_content).strip()
            sections.append(current_section)

        return FileProcessor._organize_sections(sections)

    @staticmethod
    def _organize_sections(sections: List[Dict]) -> List[Dict]:
        """
        Organize sections into a hierarchical structure based on their levels.

        Args:
            sections: List of sections with their levels

        Returns:
            List[Dict]: Organized hierarchical structure of sections
        """
        result = []
        section_stack = []

        for section in sections:
            while section_stack and section_stack[-1]["level"] >= section["level"]:
                section_stack.pop()

            if section_stack:
                section_stack[-1]["subsections"].append(section)
            else:
                result.append(section)

            section_stack.append(section)

        return result

    @staticmethod
    async def read_file_content(file_path: str) -> str:
        """
        Read the content of a file asynchronously.

        Args:
            file_path: Path to the file to read

        Returns:
            str: The content of the file

        Raises:
            FileNotFoundError: If the file doesn't exist
            IOError: If there's an error reading the file
        """
        try:
            # Ensure the file exists
            if not os.path.exists(file_path):
                raise FileNotFoundError(f"File not found: {file_path}")

            # Check if file is actually a PDF by reading the first few bytes
            with open(file_path, "rb") as f:
                header = f.read(8)
                if header.startswith(b"%PDF"):
                    # Try to convert PDF to markdown automatically
                    try:
                        from tools.pdf_downloader import SimplePdfConverter
                        converter = SimplePdfConverter()
                        conversion_result = converter.convert_pdf_to_markdown(file_path)
                        
                        if conversion_result["success"]:
                            # Use the converted markdown file instead
                            file_path = conversion_result["output_file"]
                        else:
                            raise IOError(f"PDF conversion failed: {conversion_result['error']}")
                    except Exception as conv_error:
                        raise IOError(
                            f"File {file_path} is a PDF file, not a text file. PDF conversion failed: {str(conv_error)}"
                        )

            # Read file content
            # Note: Using async with would be better for large files
            # but for simplicity and compatibility, using regular file reading
            with open(file_path, "r", encoding="utf-8") as f:
                content = f.read()

            return content

        except UnicodeDecodeError as e:
            raise IOError(
                f"Error reading file {file_path}: File encoding is not UTF-8. Original error: {str(e)}"
            )
        except Exception as e:
            raise IOError(f"Error reading file {file_path}: {str(e)}")

    @staticmethod
    def format_section_content(section: Dict) -> str:
        """
        Format a section's content with standardized spacing and structure.

        Args:
            section: Dictionary containing section information

        Returns:
            str: Formatted section content
        """
        # Start with section title
        formatted = f"\n{'#' * section['level']} {section['title']}\n"

        # Add section content if it exists
        if section["content"]:
            formatted += f"\n{section['content'].strip()}\n"

        # Process subsections
        if section["subsections"]:
            # Add a separator before subsections if there's content
            if section["content"]:
                formatted += "\n---\n"

            # Process each subsection
            for subsection in section["subsections"]:
                formatted += FileProcessor.format_section_content(subsection)

        # Add section separator
        formatted += "\n" + "=" * 80 + "\n"

        return formatted

    @staticmethod
    def standardize_output(sections: List[Dict]) -> str:
        """
        Convert structured sections into a standardized string format.

        Args:
            sections: List of section dictionaries

        Returns:
            str: Standardized string output
        """
        output = []

        # Process each top-level section
        for section in sections:
            output.append(FileProcessor.format_section_content(section))

        # Join all sections with clear separation
        return "\n".join(output)

    @classmethod
    async def process_file_input(
        cls, file_input: Union[str, Dict], base_dir: str = None
    ) -> Dict:
        """
        Process file input information and return the structured content.

        Steps, in order:
            1. For string input, look for a ``.md`` path quoted in backticks or
               following a "Saved Path"/"Paper Path"/"File"/"Output" label; on a
               match the input is replaced by ``{"paper_path": <match>}``.
            2. Resolve the paper directory with ``extract_file_path`` and, when
               ``base_dir`` is given, relocate it under ``base_dir`` (creating
               the directory).
            3. Resolve the file to read: from JSON / embedded JSON / a direct
               path for string input, or from ``paper_path`` for dict input.
               A ``paper_path`` that does not exist falls back to the first
               markdown file in its directory.
            4. Read the file, parse it into sections and render the
               standardized text.

        Args:
            file_input: File input information (JSON string, dict, or direct file path)
            base_dir: Optional base directory to use for creating paper directories (for sync support)

        Returns:
            Dict: The structured content with keys ``paper_dir``, ``file_path``,
                ``sections`` and ``standardized_text``

        Raises:
            ValueError: On any failure; every exception raised inside is
                re-raised as ``ValueError("Error processing file input: ...")``
        """
        try:
            # First try to extract markdown file path from string
            if isinstance(file_input, str):
                import re

                # Try to extract path from backticks first
                file_path_match = re.search(r"`([^`]+\.md)`", file_input)
                if file_path_match:
                    paper_path = file_path_match.group(1)
                    file_input = {"paper_path": paper_path}
                else:
                    # Try to extract from "Saved Path:" or similar patterns
                    path_patterns = [
                        r"[Ss]aved [Pp]ath[:\s]+([^\s\n]+\.md)",
                        r"[Pp]aper [Pp]ath[:\s]+([^\s\n]+\.md)",
                        r"[Ff]ile[:\s]+([^\s\n]+\.md)",
                        r"[Oo]utput[:\s]+([^\s\n]+\.md)",
                    ]
                    # First matching pattern wins; from here on the input is
                    # handled as a dictionary.
                    for pattern in path_patterns:
                        match = re.search(pattern, file_input)
                        if match:
                            paper_path = match.group(1)
                            file_input = {"paper_path": paper_path}
                            break

            # Extract paper directory path
            paper_dir = cls.extract_file_path(file_input)

            # If base_dir is provided, adjust paper_dir to be relative to base_dir
            if base_dir and paper_dir:
                # If paper_dir is using default location, move it to base_dir
                if paper_dir.endswith(("deepcode_lab", "agent_folders")):
                    paper_dir = base_dir
                else:
                    # Extract the relative part and combine with base_dir
                    paper_name = os.path.basename(paper_dir)
                    # Keep original directory name unchanged, no replacements
                    paper_dir = os.path.join(base_dir, "papers", paper_name)

                # Ensure the directory exists
                os.makedirs(paper_dir, exist_ok=True)

            if not paper_dir:
                raise ValueError("Could not determine paper directory path")

            # Get the actual file path
            # NOTE(review): the "file doesn't exist" fallbacks below reassign
            # paper_dir to the directory of paper_path, which replaces any
            # base_dir-adjusted value in the returned dict — confirm intended.
            file_path = None
            if isinstance(file_input, str):
                # Try to parse as JSON (handle download results)
                try:
                    parsed_json = json.loads(file_input)
                    if isinstance(parsed_json, dict) and "paper_path" in parsed_json:
                        file_path = parsed_json.get("paper_path")
                        # If file doesn't exist, try to find markdown file
                        if file_path and not os.path.exists(file_path):
                            paper_dir = os.path.dirname(file_path)
                            if os.path.isdir(paper_dir):
                                file_path = cls.find_markdown_file(paper_dir)
                                if not file_path:
                                    raise ValueError(
                                        f"No markdown file found in directory: {paper_dir}"
                                    )
                    else:
                        raise ValueError("Invalid JSON format: missing paper_path")
                except json.JSONDecodeError:
                    # Try to extract JSON from text (handle download results with extra text)
                    extracted_json = cls.extract_json_from_text(file_input)
                    if extracted_json and "paper_path" in extracted_json:
                        file_path = extracted_json.get("paper_path")
                        # If file doesn't exist, try to find markdown file
                        if file_path and not os.path.exists(file_path):
                            paper_dir = os.path.dirname(file_path)
                            if os.path.isdir(paper_dir):
                                file_path = cls.find_markdown_file(paper_dir)
                                if not file_path:
                                    raise ValueError(
                                        f"No markdown file found in directory: {paper_dir}"
                                    )
                    else:
                        # Not JSON, handle as file path
                        # Check if it's a file path (existing or not)
                        if file_input.endswith(
                            (".md", ".pdf", ".txt", ".docx", ".doc", ".html", ".htm")
                        ):
                            if os.path.exists(file_input):
                                file_path = file_input
                            else:
                                # File doesn't exist, try to find markdown in the directory
                                file_path = cls.find_markdown_file(paper_dir)
                                if not file_path:
                                    raise ValueError(
                                        f"No markdown file found in directory: {paper_dir}"
                                    )
                        elif os.path.exists(file_input):
                            if os.path.isfile(file_input):
                                file_path = file_input
                            elif os.path.isdir(file_input):
                                # If it's a directory, find the markdown file
                                file_path = cls.find_markdown_file(file_input)
                                if not file_path:
                                    raise ValueError(
                                        f"No markdown file found in directory: {file_input}"
                                    )
                        else:
                            raise ValueError(f"Invalid input: {file_input}")
            else:
                # Dictionary input
                file_path = file_input.get("paper_path")
                # If the file doesn't exist, try to find markdown in the directory
                if file_path and not os.path.exists(file_path):
                    paper_dir = os.path.dirname(file_path)
                    if os.path.isdir(paper_dir):
                        file_path = cls.find_markdown_file(paper_dir)
                        if not file_path:
                            raise ValueError(
                                f"No markdown file found in directory: {paper_dir}"
                            )

            if not file_path:
                raise ValueError("No valid file path found")

            # Read file content
            content = await cls.read_file_content(file_path)

            # Parse and structure the content
            structured_content = cls.parse_markdown_sections(content)

            # Generate standardized text output
            standardized_text = cls.standardize_output(structured_content)

            return {
                "paper_dir": paper_dir,
                "file_path": file_path,
                "sections": structured_content,
                "standardized_text": standardized_text,
            }

        except Exception as e:
            # Single error surface for callers: everything becomes ValueError
            raise ValueError(f"Error processing file input: {str(e)}")

    @staticmethod
    def extract_json_from_text(text: str) -> Optional[Dict]:
        """
        Extract JSON from text that may contain markdown code blocks or other content.

        Args:
            text: Text that may contain JSON

        Returns:
            Optional[Dict]: Extracted JSON as dictionary or None if not found
        """
        import re

        # Try to find JSON in markdown code blocks
        json_pattern = r"```json\s*(\{.*?\})\s*```"
        match = re.search(json_pattern, text, re.DOTALL)
        if match:
            try:
                return json.loads(match.group(1))
            except json.JSONDecodeError:
                pass

        # Try to find standalone JSON
        json_pattern = r"(\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\})"
        matches = re.findall(json_pattern, text, re.DOTALL)
        for match in matches:
            try:
                parsed = json.loads(match)
                if isinstance(parsed, dict) and "paper_path" in parsed:
                    return parsed
            except json.JSONDecodeError:
                continue

        return None


================================================
FILE: utils/llm_utils.py
================================================
"""
LLM utility functions for DeepCode project.

This module provides common LLM-related utilities to avoid circular imports
and reduce code duplication across the project.
"""

import os
import yaml
from typing import Any, Type, Dict, Tuple


def get_api_keys(secrets_path: str = "mcp_agent.secrets.yaml") -> Dict[str, str]:
    """
    Get API keys from secrets file, with environment variables as fallback.

    Priority: secrets file > environment variables
    This ensures mcp_agent.secrets.yaml configuration is respected.

    Environment variable fallbacks (only used if secrets file has no value):
    - GOOGLE_API_KEY or GEMINI_API_KEY
    - ANTHROPIC_API_KEY
    - OPENAI_API_KEY

    A provider section that is present but empty (e.g. ``openai:`` with no
    children, which YAML loads as ``None``), or a file whose top level is not
    a mapping, is treated as "no value configured" instead of raising.

    Args:
        secrets_path: Path to the secrets YAML file

    Returns:
        Dict with 'google', 'anthropic', 'openai' keys; each value is the
        stripped key, or "" when none is configured
    """
    secrets = {}
    if os.path.exists(secrets_path):
        with open(secrets_path, "r", encoding="utf-8") as f:
            secrets = yaml.safe_load(f) or {}
    if not isinstance(secrets, dict):
        secrets = {}

    def _resolve(provider: str, *env_names: str) -> str:
        """Return the first non-empty key: secrets file first, then env vars."""
        section = secrets.get(provider)
        file_key = section.get("api_key") if isinstance(section, dict) else None
        for candidate in (file_key, *(os.environ.get(name) for name in env_names)):
            if candidate:
                # str() guards against keys YAML parsed as a non-string scalar
                return str(candidate).strip()
        return ""

    # Config file takes priority, env vars are fallback only
    return {
        "google": _resolve("google", "GOOGLE_API_KEY", "GEMINI_API_KEY"),
        "anthropic": _resolve("anthropic", "ANTHROPIC_API_KEY"),
        "openai": _resolve("openai", "OPENAI_API_KEY"),
    }


def load_api_config(secrets_path: str = "mcp_agent.secrets.yaml") -> Dict[str, Any]:
    """
    Load the secrets YAML and fill in each provider's resolved ``api_key``.

    Keys are resolved by ``get_api_keys``: a value in the secrets file wins,
    and these environment variables are used only when the file has no value:
    - GOOGLE_API_KEY or GEMINI_API_KEY
    - ANTHROPIC_API_KEY
    - OPENAI_API_KEY

    Args:
        secrets_path: Path to the secrets YAML file

    Returns:
        Dict with provider configs including api_key values
    """
    # Load base config from YAML
    config = {}
    if os.path.exists(secrets_path):
        with open(secrets_path, "r", encoding="utf-8") as f:
            config = yaml.safe_load(f) or {}
    if not isinstance(config, dict):
        # A non-mapping top level cannot hold provider sections
        config = {}

    # Resolve keys (secrets file first, environment variables as fallback)
    keys = get_api_keys(secrets_path)

    # Merge into config structure
    for provider, key in keys.items():
        if not key:
            continue
        section = config.get(provider)
        if not isinstance(section, dict):
            # Covers both a missing section and one that YAML loaded as None
            section = {}
            config[provider] = section
        section["api_key"] = key

    return config


def _get_llm_class(provider: str) -> Type[Any]:
    """
    Resolve a provider name to its augmented-LLM class.

    The import for each provider happens only when that provider is
    requested, so the other providers' modules are never loaded.

    Args:
        provider: One of "anthropic", "openai" or "google"

    Returns:
        The LLM class for the provider

    Raises:
        ValueError: If the provider name is not recognized
    """
    if provider == "google":
        from mcp_agent.workflows.llm.augmented_llm_google import GoogleAugmentedLLM

        return GoogleAugmentedLLM

    if provider == "openai":
        from mcp_agent.workflows.llm.augmented_llm_openai import OpenAIAugmentedLLM

        return OpenAIAugmentedLLM

    if provider == "anthropic":
        from mcp_agent.workflows.llm.augmented_llm_anthropic import (
            AnthropicAugmentedLLM,
        )

        return AnthropicAugmentedLLM

    raise ValueError(f"Unknown provider: {provider}")


def get_preferred_llm_class(config_path: str = "mcp_agent.secrets.yaml") -> Type[Any]:
    """
    Select the LLM class based on user preference and API key availability.

    Priority:
    1. Check mcp_agent.config.yaml (next to the secrets file) for llm_provider
    2. Verify the preferred provider has API key
    3. Fallback to first available provider (anthropic, google, openai)
    4. Fallback to Google when no key is configured at all

    An unreadable, empty or malformed main config only discards the
    preference; providers that do have an API key are still considered.

    Args:
        config_path: Path to the secrets YAML configuration file

    Returns:
        class: The preferred LLM class
    """
    try:
        # Get API keys (secrets file first, environment variables as fallback)
        keys = get_api_keys(config_path)

        # Read user preference from main config (derive path from secrets path)
        secrets_dir = os.path.dirname(os.path.abspath(config_path))
        main_config_path = os.path.join(secrets_dir, "mcp_agent.config.yaml")
        preferred_provider = None
        if os.path.exists(main_config_path):
            try:
                with open(main_config_path, "r", encoding="utf-8") as f:
                    main_config = yaml.safe_load(f)
                # An empty file loads as None and "llm_provider:" as a null value
                if isinstance(main_config, dict):
                    preferred_provider = (
                        str(main_config.get("llm_provider") or "").strip().lower()
                    )
            except (OSError, UnicodeDecodeError, yaml.YAMLError) as e:
                print(f"⚠️ Could not read llm_provider from {main_config_path}: {e}")

        # Map of providers to their keys and class names
        provider_keys = {
            "anthropic": (keys["anthropic"], "AnthropicAugmentedLLM"),
            "google": (keys["google"], "GoogleAugmentedLLM"),
            "openai": (keys["openai"], "OpenAIAugmentedLLM"),
        }

        # Try user's preferred provider first
        if preferred_provider and preferred_provider in provider_keys:
            api_key, class_name = provider_keys[preferred_provider]
            if api_key:
                print(f"🤖 Using {class_name} (user preference: {preferred_provider})")
                return _get_llm_class(preferred_provider)
            else:
                print(
                    f"⚠️ Preferred provider '{preferred_provider}' has no API key, checking alternatives..."
                )

        # Fallback: try providers in order of availability
        for provider, (api_key, class_name) in provider_keys.items():
            if api_key:
                print(f"🤖 Using {class_name} ({provider} API key found)")
                return _get_llm_class(provider)

        # No API keys found - default to google
        print("⚠️ No API keys configured, falling back to GoogleAugmentedLLM")
        return _get_llm_class("google")

    except Exception as e:
        # Last-resort best effort: any unexpected failure still yields a class
        print(f"🤖 Error reading config file {config_path}: {e}")
        print("🤖 Falling back to GoogleAugmentedLLM")
        return _get_llm_class("google")


def get_token_limits(config_path: str = "mcp_agent.config.yaml") -> Tuple[int, int]:
    """
    Read the base and retry token limits from the ``openai`` config section.

    Built-in defaults are returned when the file is missing, when either
    value is absent from the section, or when reading the file fails.

    Args:
        config_path: Path to the main configuration file

    Returns:
        tuple: (base_max_tokens, retry_max_tokens)
    """
    # Defaults chosen to fit qwen/qwen-max (32768 total context)
    default_base, default_retry = 20000, 15000

    try:
        # Guard clause: nothing to parse when the file is absent
        if not os.path.exists(config_path):
            print(
                f"⚠️ Config file {config_path} not found, using defaults: base={default_base}, retry={default_retry}"
            )
            return default_base, default_retry

        with open(config_path, "r", encoding="utf-8") as handle:
            loaded = yaml.safe_load(handle)

        section = loaded.get("openai", {})
        base_tokens = section.get("base_max_tokens", default_base)
        retry_tokens = section.get("retry_max_tokens", default_retry)
        print(f"⚙️ Token limits from config: base={base_tokens}, retry={retry_tokens}")
        return base_tokens, retry_tokens
    except Exception as e:
        print(f"⚠️ Error reading token config from {config_path}: {e}")
        print(
            f"🔧 Falling back to default token limits: base={default_base}, retry={default_retry}"
        )
        return default_base, default_retry


def get_default_models(config_path: str = "mcp_agent.config.yaml"):
    """
    Read per-provider default and phase-specific models from the config file.

    For each of anthropic, openai and google the section's ``default_model``
    is used (or a built-in default), and ``planning_model`` /
    ``implementation_model`` fall back to that provider's default model.
    A missing file or any read error yields the built-in fallback models.

    Args:
        config_path: Path to the configuration file

    Returns:
        dict: '<provider>', '<provider>_planning' and
              '<provider>_implementation' entries for anthropic, openai
              and google
    """
    try:
        if not os.path.exists(config_path):
            print(f"Config file {config_path} not found, using default models")
            return _get_fallback_models()

        with open(config_path, "r", encoding="utf-8") as handle:
            config = yaml.safe_load(handle)

        builtin_defaults = (
            ("anthropic", "claude-sonnet-4-20250514"),
            ("openai", "o3-mini"),
            ("google", "gemini-2.0-flash"),
        )

        sections = {}
        models = {}
        for provider, builtin in builtin_defaults:
            # "or {}" turns a null section (e.g. "openai:") into an empty one
            sections[provider] = config.get(provider) or {}
            models[provider] = sections[provider].get("default_model", builtin)

        # Phase-specific models fall back to the provider's default model
        for provider in ("google", "anthropic", "openai"):
            provider_default = models[provider]
            for phase in ("planning", "implementation"):
                models[f"{provider}_{phase}"] = sections[provider].get(
                    f"{phase}_model", provider_default
                )

        return models

    except Exception as e:
        print(f"❌Error reading config file {config_path}: {e}")
        return _get_fallback_models()


def _get_fallback_models():
    """
    Build the model mapping used when the config file cannot be used.

    Each provider's planning and implementation entries reuse that
    provider's single default model.
    """
    provider_defaults = (
        ("google", "gemini-2.0-flash"),
        ("anthropic", "claude-sonnet-4-20250514"),
        ("openai", "o3-mini"),
    )

    models = {}
    for provider, model in provider_defaults:
        models[provider] = model
        models[f"{provider}_planning"] = model
        models[f"{provider}_implementation"] = model
    return models


def get_document_segmentation_config(
    config_path: str = "mcp_agent.config.yaml",
) -> Dict[str, Any]:
    """
    Read the ``document_segmentation`` settings from the config file.

    Segmentation defaults to enabled with a 50000-character threshold; those
    defaults are used for any missing value, for a missing file, and when
    reading the file fails.

    Args:
        config_path: Path to the main configuration file

    Returns:
        Dict with 'enabled' and 'size_threshold_chars'
    """
    try:
        if not os.path.exists(config_path):
            print(
                f"📄 Config file {config_path} not found, using default segmentation settings"
            )
            return {"enabled": True, "size_threshold_chars": 50000}

        with open(config_path, "r", encoding="utf-8") as handle:
            loaded = yaml.safe_load(handle)

        section = loaded.get("document_segmentation", {})
        enabled = section.get("enabled", True)
        threshold = section.get("size_threshold_chars", 50000)
        return {"enabled": enabled, "size_threshold_chars": threshold}

    except Exception as e:
        print(f"📄 Error reading segmentation config from {config_path}: {e}")
        print("📄 Using default segmentation settings")
        return {"enabled": True, "size_threshold_chars": 50000}


def should_use_document_segmentation(
    document_content: str, config_path: str = "mcp_agent.config.yaml"
) -> Tuple[bool, str]:
    """
    Decide whether a document should be processed with segmentation.

    Segmentation is used only when it is enabled in the configuration and
    the document is strictly longer than the configured character threshold.

    Args:
        document_content: The content of the document to analyze
        config_path: Path to the configuration file

    Returns:
        Tuple of (should_segment, reason) where:
        - should_segment: Boolean indicating whether to use segmentation
        - reason: String explaining the decision
    """
    settings = get_document_segmentation_config(config_path)
    if not settings["enabled"]:
        return False, "Document segmentation disabled in configuration"

    doc_size = len(document_content)
    threshold = settings["size_threshold_chars"]

    # A document exactly at the threshold is not segmented
    over_threshold = doc_size > threshold
    relation = "exceeds" if over_threshold else "below"
    reason = (
        f"Document size ({doc_size:,} chars) {relation} threshold ({threshold:,} chars)"
    )
    return over_threshold, reason


def get_adaptive_agent_config(
    use_segmentation: bool, search_server_names: list = None
) -> Dict[str, list]:
    """
    Build the per-agent server lists for the chosen document-reading mode.

    The reading server is "document-segmentation" when segmentation is used
    and "filesystem" otherwise. Concept analysis gets only that server; the
    algorithm-analysis and code-planner agents get the search servers plus
    that server, added once if not already listed.

    Args:
        use_segmentation: Whether to include document-segmentation server
        search_server_names: Base search server names (from get_search_server_names)

    Returns:
        Dict containing server configurations for different agents
    """
    base_servers = [] if search_server_names is None else search_server_names
    reader_server = "document-segmentation" if use_segmentation else "filesystem"

    def _servers_with_reader() -> list:
        # Work on a copy so the caller's list is never mutated
        servers = base_servers.copy()
        if reader_server not in servers:
            servers.append(reader_server)
        return servers

    return {
        "concept_analysis": [reader_server],
        "algorithm_analysis": _servers_with_reader(),
        "code_planner": _servers_with_reader(),
    }


def get_adaptive_prompts(use_segmentation: bool) -> Dict[str, str]:
    """
    Pick the prompt set matching the document-reading mode.

    Args:
        use_segmentation: Whether to use segmented reading prompts

    Returns:
        Dict with 'concept_analysis', 'algorithm_analysis' and
        'code_planning' prompts; the *_TRADITIONAL variants are returned
        when segmentation is not used
    """
    # Imported inside the function to avoid circular imports
    from prompts.code_prompts import (
        PAPER_CONCEPT_ANALYSIS_PROMPT,
        PAPER_ALGORITHM_ANALYSIS_PROMPT,
        CODE_PLANNING_PROMPT,
        PAPER_CONCEPT_ANALYSIS_PROMPT_TRADITIONAL,
        PAPER_ALGORITHM_ANALYSIS_PROMPT_TRADITIONAL,
        CODE_PLANNING_PROMPT_TRADITIONAL,
    )

    segmented_prompts = (
        PAPER_CONCEPT_ANALYSIS_PROMPT,
        PAPER_ALGORITHM_ANALYSIS_PROMPT,
        CODE_PLANNING_PROMPT,
    )
    traditional_prompts = (
        PAPER_CONCEPT_ANALYSIS_PROMPT_TRADITIONAL,
        PAPER_ALGORITHM_ANALYSIS_PROMPT_TRADITIONAL,
        CODE_PLANNING_PROMPT_TRADITIONAL,
    )

    concept, algorithm, planning = (
        segmented_prompts if use_segmentation else traditional_prompts
    )
    return {
        "concept_analysis": concept,
        "algorithm_analysis": algorithm,
        "code_planning": planning,
    }


================================================
FILE: utils/loop_detector.py
================================================
"""
Loop Detection and Timeout Safeguards for Code Implementation Workflow

This module provides tools to detect infinite loops, timeouts, and progress stalls
in the code implementation process to prevent hanging processes.
"""

import time
from typing import List, Dict, Any, Optional
from datetime import datetime, timedelta


class LoopDetector:
    """
    Detects infinite loops, timeouts, and progress stalls in workflow execution.

    Features:
    - Track tool call history to detect repeated patterns
    - Monitor time per file/operation
    - Detect progress stalls
    - Force stop after consecutive errors

    Only ``check_tool_call`` records a tool call. ``should_abort``,
    ``get_abort_reason`` and ``get_status_summary`` are read-only and can be
    polled freely without affecting loop detection.
    """

    # Minimum number of recent tool calls kept in ``tool_history``.
    _MIN_HISTORY = 10

    def __init__(self, max_repeats: int = 5, timeout_seconds: int = 300,
                 stall_threshold: int = 180, max_errors: int = 10):
        """
        Initialize loop detector.

        Args:
            max_repeats: Maximum consecutive calls to same tool before flagging
            timeout_seconds: Maximum time per file/operation (5 minutes default)
            stall_threshold: Maximum time without progress (3 minutes default)
            max_errors: Maximum consecutive errors before force stop
        """
        self.max_repeats = max_repeats
        self.timeout_seconds = timeout_seconds
        self.stall_threshold = stall_threshold
        self.max_errors = max_errors

        # Tracking state
        self.tool_history: List[str] = []
        self.start_time = time.time()
        self.last_progress_time = time.time()
        self.consecutive_errors = 0
        self.current_file: Optional[str] = None
        self.file_start_time: Optional[float] = None

    def start_file(self, filename: str):
        """Start tracking a new file; restarts the file timer and progress clock."""
        self.current_file = filename
        self.file_start_time = time.time()
        self.last_progress_time = time.time()
        print(f"📁 Starting file: {filename}")

    def check_tool_call(self, tool_name: str) -> Dict[str, Any]:
        """
        Record a tool call and check whether it indicates a loop or timeout.

        Args:
            tool_name: Name of the tool being called

        Returns:
            Dict with "status", "message" and "should_stop"
        """
        self.tool_history.append(tool_name)

        # Keep only recent history, but never fewer entries than max_repeats:
        # a shorter window would make the repeat check impossible to satisfy.
        history_limit = max(self._MIN_HISTORY, self.max_repeats)
        if len(self.tool_history) > history_limit:
            self.tool_history = self.tool_history[-history_limit:]

        return self._evaluate()

    def _evaluate(self) -> Dict[str, Any]:
        """Evaluate all stop conditions against current state without mutating it."""
        current_time = time.time()

        # Check for repeated tool calls
        if len(self.tool_history) >= self.max_repeats:
            recent_tools = self.tool_history[-self.max_repeats:]
            if len(set(recent_tools)) == 1:  # All same tool
                return {
                    "status": "loop_detected",
                    "message": f"⚠️ Loop detected: {recent_tools[-1]} called {self.max_repeats} times consecutively",
                    "should_stop": True
                }

        # Check file timeout
        if self.file_start_time and (current_time - self.file_start_time) > self.timeout_seconds:
            return {
                "status": "timeout",
                "message": f"⏰ Timeout: File {self.current_file} processing exceeded {self.timeout_seconds}s",
                "should_stop": True
            }

        # Check progress stall
        if (current_time - self.last_progress_time) > self.stall_threshold:
            return {
                "status": "stall",
                "message": f"🐌 Progress stall: No progress for {self.stall_threshold}s",
                "should_stop": True
            }

        # Check consecutive errors
        if self.consecutive_errors >= self.max_errors:
            return {
                "status": "max_errors",
                "message": f"❌ Too many errors: {self.consecutive_errors} consecutive errors",
                "should_stop": True
            }

        return {
            "status": "ok",
            "message": "Processing normally",
            "should_stop": False
        }

    def record_progress(self):
        """Record that progress has been made."""
        self.last_progress_time = time.time()
        self.consecutive_errors = 0  # Reset error counter on progress

    def record_error(self, error_message: str):
        """Record an error occurred."""
        self.consecutive_errors += 1
        print(f"❌ Error #{self.consecutive_errors}: {error_message}")

    def record_success(self):
        """Record a successful operation (also counts as progress)."""
        self.consecutive_errors = 0
        self.record_progress()

    def get_status_summary(self) -> Dict[str, Any]:
        """Get current status summary."""
        current_time = time.time()
        file_elapsed = (current_time - self.file_start_time) if self.file_start_time else 0
        total_elapsed = current_time - self.start_time

        return {
            "current_file": self.current_file,
            "file_elapsed_seconds": file_elapsed,
            "total_elapsed_seconds": total_elapsed,
            "consecutive_errors": self.consecutive_errors,
            "recent_tools": self.tool_history[-5:],  # Last 5 tools
            "time_since_last_progress": current_time - self.last_progress_time
        }

    def should_abort(self) -> bool:
        """Check if process should be aborted, without recording a tool call."""
        return self._evaluate()["should_stop"]

    def get_abort_reason(self) -> Optional[str]:
        """Get the abort message if the process should abort, else None."""
        status = self._evaluate()
        return status["message"] if status["should_stop"] else None


class ProgressTracker:
    """
    Keeps count of completed files and the current implementation phase,
    and reports progress with a simple remaining-time estimate.
    """

    def __init__(self, total_files: int = 0):
        """Start the clock; ``total_files`` is the number of files expected."""
        self.start_time = time.time()
        self.total_files = total_files
        self.completed_files = 0
        self.current_phase = "Initializing"
        self.phase_progress = 0

    def set_phase(self, phase_name: str, progress_percent: int):
        """Store the active phase and its percentage, and print them."""
        self.current_phase, self.phase_progress = phase_name, progress_percent
        print(f"📊 Progress: {progress_percent}% - {phase_name}")

    def complete_file(self, filename: str):
        """Count one more finished file and print the running total."""
        self.completed_files += 1
        print(f"✅ Completed file {self.completed_files}/{self.total_files}: {filename}")

    def get_progress_info(self) -> Dict[str, Any]:
        """
        Return a snapshot of phase, file counts, elapsed time and an estimate
        of the remaining time.

        The estimate is the average time per completed file multiplied by the
        number of files left; it is 0 until a file is completed or when no
        total is known.
        """
        elapsed = time.time() - self.start_time
        done, total = self.completed_files, self.total_files

        estimated_remaining = 0
        if done > 0 and total > 0:
            estimated_remaining = (elapsed / done) * (total - done)

        # Percentage of files finished; 0 when the total is unknown
        file_progress = (done / total * 100) if total > 0 else 0

        return {
            "phase": self.current_phase,
            "phase_progress": self.phase_progress,
            "files_completed": done,
            "total_files": total,
            "file_progress": file_progress,
            "elapsed_seconds": elapsed,
            "estimated_remaining_seconds": estimated_remaining
        }


================================================
FILE: utils/model_limits.py
================================================
"""
Model Limits and Capabilities Detection

This module provides utilities to detect LLM model capabilities and limits
dynamically, avoiding hardcoded values and supporting model changes.
"""

from typing import Dict, Tuple, Optional
import yaml


# Model capability database
# Format: {model_name_pattern: {max_completion_tokens, max_context_tokens,
#                               input_cost_per_1m, output_cost_per_1m, provider}}
#
# - input_cost_per_1m / output_cost_per_1m are prices per one million tokens;
#   calculate_token_cost() reports its result in dollars.
# - ORDER MATTERS: get_model_limits() returns the first entry whose key is a
#   case-insensitive substring of the model name, so a more specific key
#   (e.g. "gpt-4o-mini") must stay ahead of the shorter keys it contains
#   (e.g. "gpt-4o", "gpt-4").
# - NOTE(review): the limits and prices are hard-coded snapshots — verify them
#   against the providers' current documentation before relying on them.
MODEL_LIMITS = {
    # OpenAI Models
    "gpt-4o-mini": {
        "max_completion_tokens": 16384,
        "max_context_tokens": 128000,
        "input_cost_per_1m": 0.15,
        "output_cost_per_1m": 0.60,
        "provider": "openai"
    },
    "gpt-4o": {
        "max_completion_tokens": 16384,
        "max_context_tokens": 128000,
        "input_cost_per_1m": 2.50,
        "output_cost_per_1m": 10.00,
        "provider": "openai"
    },
    "gpt-4-turbo": {
        "max_completion_tokens": 4096,
        "max_context_tokens": 128000,
        "input_cost_per_1m": 10.00,
        "output_cost_per_1m": 30.00,
        "provider": "openai"
    },
    # Also matches any other model name containing "gpt-4" that is not caught above
    "gpt-4": {
        "max_completion_tokens": 8192,
        "max_context_tokens": 8192,
        "input_cost_per_1m": 30.00,
        "output_cost_per_1m": 60.00,
        "provider": "openai"
    },
    "gpt-3.5-turbo": {
        "max_completion_tokens": 4096,
        "max_context_tokens": 16385,
        "input_cost_per_1m": 0.50,
        "output_cost_per_1m": 1.50,
        "provider": "openai"
    },
    "o1-mini": {
        "max_completion_tokens": 65536,
        "max_context_tokens": 128000,
        "input_cost_per_1m": 3.00,
        "output_cost_per_1m": 12.00,
        "provider": "openai"
    },
    # Must stay after "o1-mini": "o1" is a substring of it
    "o1": {
        "max_completion_tokens": 100000,
        "max_context_tokens": 200000,
        "input_cost_per_1m": 15.00,
        "output_cost_per_1m": 60.00,
        "provider": "openai"
    },
    # Anthropic Models
    "claude-3-5-sonnet": {
        "max_completion_tokens": 8192,
        "max_context_tokens": 200000,
        "input_cost_per_1m": 3.00,
        "output_cost_per_1m": 15.00,
        "provider": "anthropic"
    },
    "claude-3-opus": {
        "max_completion_tokens": 4096,
        "max_context_tokens": 200000,
        "input_cost_per_1m": 15.00,
        "output_cost_per_1m": 75.00,
        "provider": "anthropic"
    },
    "claude-3-sonnet": {
        "max_completion_tokens": 4096,
        "max_context_tokens": 200000,
        "input_cost_per_1m": 3.00,
        "output_cost_per_1m": 15.00,
        "provider": "anthropic"
    },
    "claude-3-haiku": {
        "max_completion_tokens": 4096,
        "max_context_tokens": 200000,
        "input_cost_per_1m": 0.25,
        "output_cost_per_1m": 1.25,
        "provider": "anthropic"
    },
}


def get_model_from_config(config_path: str = "mcp_agent.config.yaml") -> Optional[str]:
    """
    Get the default model from configuration file.

    The ``openai`` section is consulted first, then ``anthropic``. A section
    that is missing, null, not a mapping, or has an empty ``default_model``
    is skipped, so a blank OpenAI section no longer hides a configured
    Anthropic model.

    Args:
        config_path: Path to the configuration file

    Returns:
        Model name or None if not found (including when the file cannot be
        read or parsed)
    """
    try:
        with open(config_path, "r", encoding="utf-8") as f:
            config = yaml.safe_load(f)
    except Exception as e:
        # Best effort: callers fall back to conservative limits on None
        print(f"⚠️ Warning: Could not read model from config: {e}")
        return None

    # An empty file loads as None; other non-mapping top levels hold no sections
    if not isinstance(config, dict):
        return None

    # Check OpenAI config first, then Anthropic
    for provider in ("openai", "anthropic"):
        section = config.get(provider)
        if isinstance(section, dict) and section.get("default_model"):
            return section["default_model"]

    return None


def get_model_limits(model_name: Optional[str] = None, config_path: str = "mcp_agent.config.yaml") -> Dict:
    """
    Look up token limits, pricing and provider for a model.

    The model name is matched against the keys of MODEL_LIMITS as a
    case-insensitive substring; the first matching entry (in table order) is
    returned as a copy. Conservative defaults with provider "unknown" are
    returned when no model can be determined or no entry matches.

    Args:
        model_name: Name of the model (if None, reads from config)
        config_path: Path to the configuration file

    Returns:
        Dictionary with model limits and capabilities
    """
    # Built fresh on every call so callers may mutate the result freely
    conservative_defaults = {
        "max_completion_tokens": 4096,
        "max_context_tokens": 8192,
        "input_cost_per_1m": 1.00,
        "output_cost_per_1m": 3.00,
        "provider": "unknown"
    }

    # Fall back to the configured model when none was passed in
    model_name = model_name or get_model_from_config(config_path)
    if not model_name:
        print("⚠️ Warning: Could not determine model, using safe defaults")
        return conservative_defaults

    lowered_name = model_name.lower()
    first_match = next(
        (
            (pattern, limits)
            for pattern, limits in MODEL_LIMITS.items()
            if pattern.lower() in lowered_name
        ),
        None,
    )

    if first_match is None:
        # Model not in database
        print(f"⚠️ Warning: Model '{model_name}' not in database, using conservative defaults")
        return conservative_defaults

    pattern, limits = first_match
    print(f"📊 Detected model: {model_name} → {pattern}")
    print(f"   Max completion tokens: {limits['max_completion_tokens']}")
    print(f"   Max context tokens: {limits['max_context_tokens']}")
    return limits.copy()


def get_safe_max_tokens(
    model_name: Optional[str] = None,
    config_path: str = "mcp_agent.config.yaml",
    safety_margin: float = 0.9
) -> int:
    """
    Compute a max_tokens value that stays below the model's completion limit.

    Args:
        model_name: Name of the model (if None, reads from config)
        config_path: Path to the configuration file
        safety_margin: Fraction of the model's max completion tokens to use
            (0.9 = 90% of max)

    Returns:
        The model's max completion tokens scaled by ``safety_margin``,
        truncated to an int
    """
    limits = get_model_limits(model_name, config_path)

    # int() truncates toward zero, so the result never rounds up past the margin
    scaled = limits["max_completion_tokens"] * safety_margin
    safe_tokens = int(scaled)

    print(f"🔧 Safe max_tokens for {model_name or 'current model'}: {safe_tokens} ({safety_margin*100:.0f}% of {limits['max_completion_tokens']})")
    return safe_tokens


def calculate_token_cost(
    input_tokens: int,
    output_tokens: int,
    model_name: Optional[str] = None,
    config_path: str = "mcp_agent.config.yaml"
) -> float:
    """
    Price a request from its input and output token counts.

    Each count is converted to millions of tokens and multiplied by the
    model's per-million rate; the two amounts are then added.

    Args:
        input_tokens: Number of input/prompt tokens
        output_tokens: Number of output/completion tokens
        model_name: Name of the model (if None, reads from config)
        config_path: Path to the configuration file

    Returns:
        Total cost in dollars
    """
    pricing = get_model_limits(model_name, config_path)
    tokens_per_unit = 1_000_000

    return (
        (input_tokens / tokens_per_unit) * pricing["input_cost_per_1m"]
        + (output_tokens / tokens_per_unit) * pricing["output_cost_per_1m"]
    )


def get_retry_token_limits(
    base_tokens: int,
    retry_count: int,
    model_name: Optional[str] = None,
    config_path: str = "mcp_agent.config.yaml"
) -> int:
    """
    Pick the token limit for a retry as a fraction of the model's maximum.

    The fraction grows with the retry attempt: 87.5% for attempt 0, 95% for
    attempt 1 and 98% for any other value. ``base_tokens`` is only reported
    in the log line; it does not influence the result.

    Args:
        base_tokens: Base token limit
        retry_count: Current retry attempt (0, 1, 2, ...)
        model_name: Name of the model (if None, reads from config)
        config_path: Path to the configuration file

    Returns:
        Adjusted token limit for retry
    """
    max_allowed = get_model_limits(model_name, config_path)["max_completion_tokens"]

    # Attempt index -> share of the model maximum; everything else gets 98%
    share_by_attempt = {0: 0.875, 1: 0.95}
    share = share_by_attempt.get(retry_count, 0.98)

    # Clamp so the model's hard limit is never exceeded
    new_tokens = min(int(max_allowed * share), max_allowed)

    print(f"🔧 Retry {retry_count + 1}: Adjusting tokens from {base_tokens} → {new_tokens} (max: {max_allowed})")

    return new_tokens


def get_provider_from_model(model_name: Optional[str] = None, config_path: str = "mcp_agent.config.yaml") -> str:
    """
    Report which provider serves a model, based on its limits entry.

    Args:
        model_name: Name of the model (if None, reads from config)
        config_path: Path to the configuration file

    Returns:
        Provider name: "openai", "anthropic", or "unknown"
    """
    # "unknown" covers a limits entry that carries no provider field
    return get_model_limits(model_name, config_path).get("provider", "unknown")


================================================
FILE: utils/simple_llm_logger.py
================================================
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
超简化LLM响应日志记录器
专注于记录LLM回复的核心内容，配置简单易用
"""

import json
import os
import yaml
from datetime import datetime
from pathlib import Path
from typing import Dict, Any


class SimpleLLMLogger:
    """Minimal logger that appends LLM responses to a timestamped log file.

    Settings are read from the ``llm_logger`` section of the YAML config:
    ``enabled``, ``output_format`` (``json`` / ``text`` / ``markdown``),
    ``log_level`` (``basic`` or anything else for detailed entries),
    ``log_directory``, ``filename_pattern``, ``include_models`` and
    ``min_response_length``.
    """

    def __init__(self, config_path: str = "mcp_agent.config.yaml"):
        """
        Initialise the logger.

        Args:
            config_path: Path to the YAML configuration file.
        """
        self.config = self._load_config(config_path)

        # ``llm_logger: null`` (or any non-mapping value) would otherwise make
        # every later ``self.llm_config.get`` call fail; treat it as "no section".
        section = self.config.get("llm_logger")
        self.llm_config = section if isinstance(section, dict) else {}

        # Nothing else to set up when logging is switched off.
        if not self.llm_config.get("enabled", True):
            self.enabled = False
            return

        self.enabled = True
        self._setup_logger()

    def _load_config(self, config_path: str) -> Dict[str, Any]:
        """Load the YAML configuration, falling back to defaults on failure.

        Always returns a dict: a file that cannot be read or parsed yields the
        default configuration, and a document that parses to something other
        than a mapping (e.g. an empty file, which parses to ``None``) yields
        an empty dict.
        """
        try:
            with open(config_path, "r", encoding="utf-8") as f:
                loaded = yaml.safe_load(f)
        except Exception as e:
            print(f"⚠️ 配置文件加载失败: {e}，使用默认配置")
            return self._get_default_config()

        return loaded if isinstance(loaded, dict) else {}

    def _get_default_config(self) -> Dict[str, Any]:
        """Return the built-in default configuration."""
        return {
            "llm_logger": {
                "enabled": True,
                "output_format": "json",
                "log_level": "basic",
                "log_directory": "logs/llm_responses",
                "filename_pattern": "llm_responses_{timestamp}.jsonl",
                "include_models": ["claude-sonnet-4", "gpt-4", "o3-mini"],
                "min_response_length": 50,
            }
        }

    def _setup_logger(self):
        """Create the log directory and choose this run's log file path."""
        log_dir = self.llm_config.get("log_directory", "logs/llm_responses")

        # Make sure the target directory exists
        Path(log_dir).mkdir(parents=True, exist_ok=True)

        # Build the file name from the pattern and the current local time
        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        filename_pattern = self.llm_config.get(
            "filename_pattern", "llm_responses_{timestamp}.jsonl"
        )
        self.log_file = os.path.join(
            log_dir, filename_pattern.format(timestamp=timestamp)
        )

        print(f"📝 LLM响应日志: {self.log_file}")

    def log_response(self, content: str, model: str = "", agent: str = "", **kwargs):
        """
        Record one LLM response.

        Args:
            content: Response text returned by the LLM.
            model: Model name.
            agent: Agent name.
            **kwargs: Optional extras; ``token_usage`` and ``session_id`` are
                stored when the log level is not ``basic``.
        """
        if not self.enabled:
            return

        # Apply the length / model filters
        if not self._should_log(content, model):
            return

        # Build the record
        log_entry = self._build_entry(content, model, agent, kwargs)

        # Persist it
        self._write_log(log_entry)

        # Short preview on the console
        self._console_log(content, model, agent)

    def _should_log(self, content: str, model: str) -> bool:
        """Return True when the response passes the length and model filters."""
        # A missing response has nothing to record (and has no length).
        if content is None:
            return False

        # Length filter
        min_length = self.llm_config.get("min_response_length", 50)
        if len(content) < min_length:
            return False

        # Model filter: substring match against the configured names; an empty
        # or missing list lets every model through.
        include_models = self.llm_config.get("include_models", [])
        if include_models and not any(m in (model or "") for m in include_models):
            return False

        return True

    def _build_entry(self, content: str, model: str, agent: str, extra: Dict) -> Dict:
        """Build the log record for the configured ``log_level``."""
        log_level = self.llm_config.get("log_level", "basic")

        if log_level == "basic":
            # Basic level: core fields only
            return {
                "timestamp": datetime.now().isoformat(),
                "content": content,
                "model": model,
            }
        else:
            # Detailed level: also record the agent and selected extras
            entry = {
                "timestamp": datetime.now().isoformat(),
                "content": content,
                "model": model,
                "agent": agent,
            }
            if "token_usage" in extra:
                entry["tokens"] = extra["token_usage"]
            if "session_id" in extra:
                entry["session"] = extra["session_id"]
            return entry

    def _write_log(self, entry: Dict):
        """Append one record to the log file in the configured format.

        ``text`` and ``markdown`` render timestamp/model/content only; every
        other ``output_format`` value (including ``json`` and unrecognised
        values) is written as one JSON object per line, so a misconfigured
        format no longer silently discards records. Write failures are
        reported on stdout and otherwise ignored (best-effort logging).
        """
        output_format = self.llm_config.get("output_format", "json")

        try:
            with open(self.log_file, "a", encoding="utf-8") as f:
                if output_format == "text":
                    timestamp = entry.get("timestamp", "")
                    model = entry.get("model", "")
                    content = entry.get("content", "")
                    f.write(f"[{timestamp}] {model}: {content}\n\n")
                elif output_format == "markdown":
                    timestamp = entry.get("timestamp", "")
                    model = entry.get("model", "")
                    content = entry.get("content", "")
                    f.write(f"**{timestamp}** | {model}\n\n{content}\n\n---\n\n")
                else:
                    f.write(json.dumps(entry, ensure_ascii=False) + "\n")
        except Exception as e:
            print(f"⚠️ 写入日志失败: {e}")

    def _console_log(self, content: str, model: str, agent: str):
        """Print a short (at most 80 characters plus ellipsis) preview."""
        preview = content[:80] + "..." if len(content) > 80 else content
        print(f"🤖 {model} ({agent}): {preview}")


# Module-level logger instance; stays None until get_llm_logger() creates it
_global_logger = None


def get_llm_logger() -> SimpleLLMLogger:
    """Return the shared module-level logger, creating it on first call."""
    global _global_logger
    if _global_logger is not None:
        return _global_logger
    _global_logger = SimpleLLMLogger()
    return _global_logger


def log_llm_response(content: str, model: str = "", agent: str = "", **kwargs):
    """Convenience wrapper: record one LLM response through the shared logger."""
    get_llm_logger().log_response(content, model, agent, **kwargs)


# Example usage
if __name__ == "__main__":
    # Smoke-test the logger with a sample response
    log_llm_response(
        content="这是一个测试的LLM响应内容，用于验证简化日志记录器的功能是否正常工作。",
        model="claude-sonnet-4-20250514",
        agent="TestAgent",
    )

    print("✅ 简化LLM日志测试完成")


================================================
FILE: workflows/__init__.py
================================================
"""
Intelligent Agent Orchestration Workflows for Research-to-Code Automation.

This package provides advanced AI-driven workflow orchestration capabilities
for automated research analysis and code implementation synthesis.
"""

from .agent_orchestration_engine import (
    run_research_analyzer,
    run_resource_processor,
    run_code_analyzer,
    github_repo_download,
    paper_reference_analyzer,
    execute_multi_agent_research_pipeline,
    paper_code_preparation,  # Deprecated, for backward compatibility
)

from .code_implementation_workflow import CodeImplementationWorkflow

# Names re-exported from the submodules imported above; this list is what
# `from workflows import *` exposes.
__all__ = [
    # Initial workflows
    "run_research_analyzer",
    "run_resource_processor",
    "run_code_analyzer",
    "github_repo_download",
    "paper_reference_analyzer",
    "execute_multi_agent_research_pipeline",  # Main multi-agent pipeline function
    "paper_code_preparation",  # Deprecated, for backward compatibility
    # Code implementation workflows
    "CodeImplementationWorkflow",
]


================================================
FILE: workflows/agent_orchestration_engine.py
================================================
"""
Intelligent Agent Orchestration Engine for Research-to-Code Automation

This module serves as the core orchestration engine that coordinates multiple specialized
AI agents to automate the complete research-to-code transformation pipeline:

1. Research Analysis Agent - Intelligent content processing and extraction
2. Workspace Infrastructure Agent - Automated environment synthesis
3. Code Architecture Agent - AI-driven design and planning
4. Reference Intelligence Agent - Automated knowledge discovery
5. Repository Acquisition Agent - Intelligent code repository management
6. Codebase Intelligence Agent - Advanced relationship analysis
7. Code Implementation Agent - AI-powered code synthesis

Core Features:
- Multi-agent coordination with intelligent task distribution
- Local environment automation for seamless deployment
- Real-time progress monitoring with comprehensive error handling
- Adaptive workflow optimization based on processing requirements
- Advanced intelligence analysis with configurable performance modes

Architecture:
- Async/await based high-performance agent coordination
- Modular agent design with specialized role separation
- Intelligent resource management and optimization
- Comprehensive logging and monitoring infrastructure
"""

import asyncio
import json
import os
import re
import yaml
from typing import Any, Callable, Dict, List, Optional, Tuple

# MCP Agent imports
from mcp_agent.agents.agent import Agent
from mcp_agent.workflows.llm.augmented_llm import RequestParams
from mcp_agent.workflows.parallel.parallel_llm import ParallelLLM

# Local imports
from prompts.code_prompts import (
    PAPER_INPUT_ANALYZER_PROMPT,
    PAPER_DOWNLOADER_PROMPT,
    PAPER_REFERENCE_ANALYZER_PROMPT,
    CHAT_AGENT_PLANNING_PROMPT,
)
from utils.file_processor import FileProcessor
from workflows.code_implementation_workflow import CodeImplementationWorkflow
from tools.pdf_downloader import move_file_to, download_file_to
from workflows.code_implementation_workflow_index import (
    CodeImplementationWorkflowWithIndex,
)
from utils.llm_utils import (
    get_preferred_llm_class,
    should_use_document_segmentation,
    get_adaptive_agent_config,
    get_adaptive_prompts,
    get_token_limits,
)
from workflows.agents.document_segmentation_agent import prepare_document_segments
from workflows.agents.requirement_analysis_agent import RequirementAnalysisAgent

# Environment configuration
# NOTE(review): CPython reads PYTHONDONTWRITEBYTECODE at interpreter start-up,
# so setting it here presumably only affects child processes that inherit this
# environment, not the already-running interpreter — confirm whether
# sys.dont_write_bytecode is also needed.
os.environ["PYTHONDONTWRITEBYTECODE"] = "1"  # Prevent .pyc file generation


def _assess_output_completeness(text: str) -> float:
    """
    Score how complete a YAML-formatted implementation plan looks.

    The score is the sum of four weighted heuristics:
    1. Presence of the five required section keys (weight 0.5, proportional)
    2. YAML start/end markers (0.2 for both, 0.1 for a start marker only)
    3. A plausibly un-truncated last line (weight 0.15)
    4. Overall length (0.15 at >= 10000 chars, 0.10 at >= 5000, 0.05 at >= 2000)

    Text that is empty or shorter than 500 characters after stripping scores 0.0.
    Progress details are printed to stdout.

    Returns:
        float: Completeness score in the range 0.0-1.0; higher is more complete
    """
    if not text or len(text.strip()) < 500:
        return 0.0

    lowered = text.lower()
    total = 0.0

    # 1. Required section keys, matched case-insensitively (weight 0.5)
    section_keys = (
        "file_structure:",
        "implementation_components:",
        "validation_approach:",
        "environment_setup:",
        "implementation_strategy:",
    )
    hits = 0
    for key in section_keys:
        if key in lowered:
            hits += 1
    coverage = hits / len(section_keys)
    total += coverage * 0.5

    print(f"   📋 Required sections: {hits}/{len(section_keys)}")

    # 2. Structural markers: opening anywhere, closing within the last 500 chars
    opening_markers = ("```yaml", "complete_reproduction_plan:", "paper_info:")
    closing_markers = ("```", "implementation_strategy:", "validation_approach:")
    tail = text[-500:]
    opens = any(marker in text for marker in opening_markers)
    closes = any(marker in tail for marker in closing_markers)
    if opens:
        total += 0.2 if closes else 0.1

    # 3. Last-line integrity (weight 0.15)
    final_line = text.strip().split("\n")[-1].strip()
    clean_ending = final_line.endswith(("```", ".", ":", "]", "}"))
    # NOTE: final_line is already stripped, so the " " prefix below can never
    # match; it is kept so the check stays identical to the original.
    list_like = final_line.startswith(("-", "*", " "))
    short_and_open = len(final_line) < 100 and not final_line.endswith(",")
    if clean_ending or list_like or short_and_open:
        total += 0.15
    else:
        # Long line without a recognised ending: probably cut off mid-output
        print(f"   ⚠️  Last line suspicious: '{final_line[-50:]}'")

    # 4. Length bonus: only the highest threshold reached counts
    size = len(text)
    for threshold, bonus in ((10000, 0.15), (5000, 0.10), (2000, 0.05)):
        if size >= threshold:
            total += bonus
            break

    print(f"   📏 Content length: {size} chars")

    return min(total, 1.0)


def _adjust_params_for_retry(
    params: RequestParams, retry_count: int, config_path: str = "mcp_agent.config.yaml"
) -> Tuple[int, float]:
    """
    Compute a reduced output-token limit and a lower temperature for a retry.

    Token schedule (based on the retry limit returned by ``get_token_limits``):
    - retry_count == 0: the configured retry limit as-is
    - retry_count == 1: 90% of the retry limit
    - retry_count >= 2: 80% of the retry limit

    Temperature is lowered by 0.15 per retry count and never drops below 0.05.

    Why reduce instead of increase: when a model reports that its maximum
    context length was exceeded, input + requested output is already too
    large, so asking for more output tokens only makes it worse. Requesting
    fewer output tokens leaves more room for the input.

    Args:
        params: Current request parameters; only ``temperature`` and
            ``maxTokens`` are read, the object is not modified.
        retry_count: Zero-based retry attempt number.
        config_path: Configuration file passed to ``get_token_limits``.

    Returns:
        Tuple ``(new_max_tokens, new_temperature)``. Note that this is a plain
        tuple, not a ``RequestParams`` instance.
    """
    # Second element of the configured limits is the retry token limit
    _, retry_max_tokens = get_token_limits(config_path)

    # Shrink the output budget step by step to leave more room for the input
    if retry_count == 0:
        # First retry: use the configured retry limit unchanged
        new_max_tokens = retry_max_tokens
    elif retry_count == 1:
        # Second retry: 90% of the retry limit
        new_max_tokens = int(retry_max_tokens * 0.9)
    else:
        # Third retry and beyond: 80% of the retry limit
        new_max_tokens = int(retry_max_tokens * 0.8)

    # Decrease temperature with each retry to get more consistent and predictable output
    new_temperature = max(params.temperature - (retry_count * 0.15), 0.05)

    print(f"🔧 Adjusting parameters for retry {retry_count + 1}:")
    print(f"   Token limit: {params.maxTokens} → {new_max_tokens}")
    print(f"   Temperature: {params.temperature:.2f} → {new_temperature:.2f}")
    print(
        "   💡 Strategy: REDUCE output tokens to fit within model's total context limit"
    )

    return new_max_tokens, new_temperature


async def execute_requirement_analysis_workflow(
    user_input: str,
    analysis_mode: str,
    user_answers: Optional[Dict[str, str]] = None,
    logger=None,
    progress_callback: Optional[Callable[[int, str], None]] = None,
) -> Dict[str, Any]:
    """
    Run one requirement-analysis flow and wrap the outcome in a status dict.

    Args:
        user_input: Raw requirement text; surrounding whitespace is ignored.
        analysis_mode: ``"generate_questions"`` or ``"summarize_requirements"``.
        user_answers: Answers passed to the summary step (defaults to ``{}``).
        logger: Optional logger handed to the agent and used for error reports.
        progress_callback: Optional ``(percent, message)`` progress hook.

    Returns:
        ``{"status": "success", "result": ...}`` on success, otherwise
        ``{"status": "error", "error": <message>}``. Exceptions, including an
        unsupported ``analysis_mode``, are reported through the error dict
        rather than raised.
    """

    def report(percent: int, note: str) -> None:
        # Progress reporting is optional; do nothing without a callback.
        if progress_callback:
            progress_callback(percent, note)

    requirement_text = (user_input or "").strip()
    if not requirement_text:
        return {
            "status": "error",
            "error": "User requirement input cannot be empty.",
        }

    answers = user_answers or {}

    try:
        async with RequirementAnalysisAgent(logger=logger) as agent:
            report(5, "🤖 Initializing requirement analysis agent...")

            if analysis_mode == "generate_questions":
                questions = await agent.generate_guiding_questions(requirement_text)
                report(100, "🧠 Guiding questions generated.")
                return {
                    "status": "success",
                    "result": json.dumps(questions, ensure_ascii=False),
                }

            if analysis_mode == "summarize_requirements":
                summary = await agent.summarize_detailed_requirements(
                    requirement_text, answers
                )
                report(100, "📄 Requirement document created.")
                return {"status": "success", "result": summary}

            raise ValueError(f"Unsupported analysis_mode: {analysis_mode}")

    except Exception as exc:
        failure = str(exc)
        if logger:
            # A broken logger must not mask the original failure.
            try:
                logger.error("Requirement analysis workflow failed: %s", failure)
            except Exception:
                pass
        return {"status": "error", "error": failure}


def get_default_search_server(config_path: str = "mcp_agent.config.yaml"):
    """
    Read the ``default_search_server`` setting from the configuration file.

    Args:
        config_path: Path to the main configuration file

    Returns:
        str: The configured search server name, or "brave" when the file is
        missing, lacks the key, or cannot be read/parsed
    """
    fallback = "brave"
    try:
        if not os.path.exists(config_path):
            print(f"⚠️ Config file {config_path} not found, using default: brave")
            return fallback

        with open(config_path, "r", encoding="utf-8") as handle:
            settings = yaml.safe_load(handle)

        chosen = settings.get("default_search_server", fallback)
        print(f"🔍 Using search server: {chosen}")
        return chosen
    except Exception as e:
        # Any read/parse problem degrades to the built-in default.
        print(f"⚠️ Error reading config file {config_path}: {e}")
        print("🔍 Falling back to default search server: brave")
        return fallback


def get_search_server_names(
    additional_servers: Optional[List[str]] = None,
) -> List[str]:
    """
    Build the server list, starting with the configured default search server.

    Args:
        additional_servers: Optional extra server names to append

    Returns:
        List[str]: The default search server followed by each additional
        server not already present, in the order given
    """
    names = [get_default_search_server()]

    # Append extras in order, skipping anything already listed
    for extra in additional_servers or []:
        if extra not in names:
            names.append(extra)

    return names


def extract_clean_json(llm_output: str) -> str:
    """
    Extract clean JSON from LLM output, removing surrounding text and formatting.

    Strategies are tried in order and the first candidate that parses wins:
    1. The whole (stripped) output
    2. The contents of the first ```json fenced block
    3. Lines from the first line starting with "{" up to the line where the
       braces balance
    4. A regex search for objects nested at most two levels deep

    Args:
        llm_output: Raw LLM output

    Returns:
        str: The extracted JSON text, or the original output unchanged when
        nothing parseable is found
    """
    # 1. The entire output may already be valid JSON
    whole = llm_output.strip()
    try:
        json.loads(whole)
        return whole
    except json.JSONDecodeError:
        pass

    # 2. Markdown ```json code block
    if "```json" in llm_output:
        fenced = re.search(r"```json\s*(.*?)\s*```", llm_output, re.DOTALL)
        if fenced:
            json_text = fenced.group(1).strip()
            try:
                json.loads(json_text)
                return json_text
            except json.JSONDecodeError:
                pass

    # 3. Line scan: collect from the first line that starts with "{" until the
    #    braces balance. The balance is checked on the opening line as well, so
    #    a one-line object followed by more text ends right there instead of
    #    swallowing the next line and falling through to the regex, which can
    #    only return a fragment of deeply nested objects.
    json_lines = []
    in_json = False
    brace_count = 0

    for line in llm_output.split("\n"):
        stripped = line.strip()
        if not in_json:
            if not stripped.startswith("{"):
                continue
            in_json = True
        json_lines.append(line)
        brace_count += stripped.count("{") - stripped.count("}")
        if brace_count == 0:
            break

    if json_lines:
        json_text = "\n".join(json_lines).strip()
        try:
            json.loads(json_text)
            return json_text
        except json.JSONDecodeError:
            pass

    # 4. Last attempt: regex for objects with at most one level of nesting inside
    pattern = r"\{[^{}]*(?:\{[^{}]*\}[^{}]*)*\}"
    for candidate in re.findall(pattern, llm_output, re.DOTALL):
        try:
            json.loads(candidate)
            return candidate
        except json.JSONDecodeError:
            continue

    # If all methods fail, return original output
    return llm_output


async def run_research_analyzer(prompt_text: str, logger) -> str:
    """
    Analyse the research input with the ResearchAnalyzerAgent.

    The agent is created with the configured search servers, an LLM is
    attached, and the raw answer is reduced to JSON via ``extract_clean_json``.
    Diagnostic output is printed at every step; every failure is printed and
    then re-raised.

    Args:
        prompt_text: Input prompt text containing research information
        logger: Logger instance; its ``log_response`` method is used when present

    Returns:
        str: Cleaned analysis result produced by the agent

    Raises:
        ValueError: If the prompt is empty, the LLM returns nothing, or the
            cleaned output is empty
    """
    try:
        # Echo what was received to help debugging
        print("📊 Starting research analysis...")
        print(f"Input prompt length: {len(prompt_text) if prompt_text else 0}")
        print(f"Input preview: {prompt_text[:200] if prompt_text else 'None'}...")

        prompt_is_blank = not prompt_text or prompt_text.strip() == ""
        if prompt_is_blank:
            raise ValueError(
                "Empty or None prompt_text provided to run_research_analyzer"
            )

        agent = Agent(
            name="ResearchAnalyzerAgent",
            instruction=PAPER_INPUT_ANALYZER_PROMPT,
            server_names=get_search_server_names(),
        )

        async with agent:
            print("analyzer: Connected to server, calling list_tools...")

            # Listing tools is informational only; a failure here is not fatal
            try:
                available = await agent.list_tools()
                print(
                    "Tools available:",
                    available.model_dump()
                    if hasattr(available, "model_dump")
                    else str(available),
                )
            except Exception as e:
                print(f"Failed to list tools: {e}")

            try:
                llm = await agent.attach_llm(get_preferred_llm_class())
                print("✅ LLM attached successfully")
            except Exception as e:
                print(f"❌ Failed to attach LLM: {e}")
                raise

            # Set higher token output for research analysis
            request = RequestParams(
                maxTokens=6144,  # Using camelCase
                temperature=0.3,
            )

            print(
                f"🔄 Making LLM request with params: maxTokens={request.maxTokens}, temperature={request.temperature}"
            )

            try:
                raw_result = await llm.generate_str(
                    message=prompt_text, request_params=request
                )

                print("✅ LLM request completed")
                print(f"Raw result type: {type(raw_result)}")
                print(f"Raw result length: {len(raw_result) if raw_result else 0}")

                if not raw_result:
                    for hint in (
                        "❌ CRITICAL: raw_result is empty or None!",
                        "This could indicate:",
                        "1. LLM API call failed silently",
                        "2. API rate limiting or quota exceeded",
                        "3. Network connectivity issues",
                        "4. MCP server communication problems",
                    ):
                        print(hint)
                    raise ValueError("LLM returned empty result")

            except Exception as e:
                print(f"❌ LLM generation failed: {e}")
                print(f"Exception type: {type(e)}")
                raise

            # Reduce the LLM answer to JSON only
            try:
                cleaned = extract_clean_json(raw_result)
                print(f"Raw LLM output: {raw_result}")
                print(f"Cleaned JSON output: {cleaned}")

                # Forward to the response logger when the logger supports it
                if hasattr(logger, "log_response"):
                    logger.log_response(
                        cleaned,
                        model="ResearchAnalyzer",
                        agent="ResearchAnalyzerAgent",
                    )

                if not cleaned or cleaned.strip() == "":
                    print("❌ CRITICAL: clean_result is empty after JSON extraction!")
                    print(f"Original raw_result was: {raw_result}")
                    raise ValueError("JSON extraction resulted in empty output")

                return cleaned

            except Exception as e:
                print(f"❌ JSON extraction failed: {e}")
                print(f"Raw result was: {raw_result}")
                raise

    except Exception as e:
        print(f"❌ run_research_analyzer failed: {e}")
        print(f"Exception details: {type(e).__name__}: {str(e)}")
        raise


async def run_resource_processor(analysis_result: str, logger) -> str:
    """
    Place the analysed paper into a freshly numbered paper directory.

    A new directory ``./deepcode_lab/papers/<id>`` is created first, where
    ``<id>`` is one more than the highest existing numeric directory name (or
    1). The source named in ``analysis_result`` is then copied or downloaded
    with direct tool calls; only when that fails, or the input type is not
    handled directly, is an LLM agent asked to do it.

    Args:
        analysis_result: JSON text from the research analyzer; the keys read
            are ``path`` / ``input_path`` and ``input_type``
        logger: Logger instance for logging information

    Returns:
        str: A JSON status document for the direct path, the LLM agent's text
        for the fallback path, or a ``"partial"`` JSON document when any
        error occurs
    """
    # Allocate the next paper ID - deterministic, no LLM needed
    papers_root = "./deepcode_lab/papers"
    os.makedirs(papers_root, exist_ok=True)
    taken_ids = []
    for entry in os.listdir(papers_root):
        if os.path.isdir(os.path.join(papers_root, entry)) and entry.isdigit():
            taken_ids.append(int(entry))
    paper_id = max(taken_ids, default=0) + 1
    paper_dir = os.path.join(papers_root, str(paper_id))
    os.makedirs(paper_dir, exist_ok=True)

    logger.info(f"📋 Paper ID: {paper_id}")
    logger.info(f"📂 Paper directory: {paper_dir}")

    def _reported_success(report) -> bool:
        # The tools report their outcome through text markers
        return "[SUCCESS]" in report and "[ERROR]" not in report

    try:
        # Pull the source location out of the analyzer's JSON
        parsed = json.loads(analysis_result)
        source = parsed.get("path") or parsed.get("input_path")
        kind = parsed.get("input_type", "unknown")

        logger.info(f"📥 Processing {kind}: {source}")

        # Try direct function calls first - no LLM needed for deterministic operations
        handled_directly = False
        tool_report = None

        if kind == "file" and source and os.path.exists(source):
            # 1. Local file - direct copy
            logger.info(f"📄 Direct file copy: {source} -> {paper_dir}")
            try:
                tool_report = await move_file_to(
                    source=source, destination=paper_dir, filename=f"{paper_id}.pdf"
                )
                if _reported_success(tool_report):
                    handled_directly = True
                    logger.info(f"✅ Direct file copy succeeded:\n{tool_report}")
                else:
                    logger.warning(f"⚠️ Direct file copy had issues: {tool_report}")
            except Exception as e:
                logger.warning(f"⚠️ Direct file copy failed: {e}")

        elif kind == "url" and source:
            # 2. URL - direct download
            logger.info(f"🌐 Direct URL download: {source} -> {paper_dir}")
            try:
                tool_report = await download_file_to(
                    url=source,
                    destination=paper_dir,
                    filename=f"{paper_id}.pdf",  # Default to PDF, conversion will handle it
                )
                if _reported_success(tool_report):
                    handled_directly = True
                    logger.info(f"✅ Direct download succeeded:\n{tool_report}")
                else:
                    logger.warning(f"⚠️ Direct download had issues: {tool_report}")
            except Exception as e:
                logger.warning(f"⚠️ Direct download failed: {e}")

        # 3. Direct call worked: report it as JSON
        if handled_directly:
            return json.dumps(
                {
                    "status": "success",
                    "paper_id": paper_id,
                    "paper_dir": paper_dir,
                    "file_path": os.path.join(paper_dir, f"{paper_id}.md"),
                    "message": f"File successfully processed to {paper_dir}",
                    "operation_details": tool_report,
                }
            )

        # 4. Fallback to LLM agent if direct call failed or unsupported type
        logger.info(f"🤖 Falling back to LLM agent for: {kind} - {source}")
        processor_agent = Agent(
            name="ResourceProcessorAgent",
            instruction=PAPER_DOWNLOADER_PROMPT,
            server_names=["file-downloader"],
        )

        async with processor_agent:
            processor = await processor_agent.attach_llm(get_preferred_llm_class())
            processor_params = RequestParams(
                maxTokens=4096,
                temperature=0.2,
                tool_filter={"file-downloader": {"download_file_to", "move_file_to"}},
            )

            # Tell the agent what the direct attempt reported, if anything
            context = f"\nPrevious attempt result: {tool_report}" if tool_report else ""
            message = f"""Download/move the file to paper directory: {paper_dir}
Source: {source}
Input Type: {kind}
Paper ID: {paper_id}
Target filename: {paper_id}.md (after conversion){context}

Use the appropriate tool to complete this task."""

            return await processor.generate_str(
                message=message, request_params=processor_params
            )

    except Exception as e:
        logger.error(f"❌ Error processing resource: {e}")
        # Fallback - return paper directory for manual processing
        return json.dumps(
            {
                "status": "partial",
                "paper_id": paper_id,
                "paper_dir": paper_dir,
                "message": f"Paper directory created at {paper_dir}, manual file placement may be needed",
            }
        )


async def run_code_analyzer(
    paper_dir: str, logger, use_segmentation: bool = True
) -> str:
    """
    Run the adaptive code analysis workflow with optimized file reading.

    The paper markdown is read directly from disk when possible and embedded in
    the prompt, so the LLM agents are only used for analysis and search:

    - ConceptAnalysisAgent and AlgorithmAnalysisAgent run as fan-out agents
    - CodePlannerAgent is the fan-in agent that produces the final plan

    The generation is attempted up to three times. After each attempt the
    output is scored with `_assess_output_completeness`; a score below 0.8
    triggers another attempt with parameters from `_adjust_params_for_retry`.

    Args:
        paper_dir: Directory path containing the research paper and related resources
        logger: Logger instance for logging information
        use_segmentation: Whether to use document segmentation capabilities

    Returns:
        str: The plan text from the first attempt scoring >= 0.8, otherwise the
            text of the last attempt (which may be incomplete)

    Raises:
        Exception: Re-raises the error of the final attempt when that attempt fails
    """
    print(
        f"📊 Code analysis mode: {'Segmented' if use_segmentation else 'Traditional'}"
    )
    print("   🔧 Optimized workflow: Direct file reading, LLM only for analysis")

    # STEP 1: Read paper file directly - no LLM needed for deterministic file operations
    paper_content = None
    paper_file_path = None

    try:
        # os.listdir() returns entries in arbitrary order, so sort to make the
        # choice reproducible, and skip the generated implementation summary
        # (the planning orchestrator excludes it as well) so it is never
        # mistaken for the paper itself.
        paper_candidates = sorted(
            filename
            for filename in os.listdir(paper_dir)
            if filename.endswith(".md")
            and not filename.endswith("implement_code_summary.md")
        )
        if paper_candidates:
            paper_file_path = os.path.join(paper_dir, paper_candidates[0])
            with open(paper_file_path, "r", encoding="utf-8") as f:
                paper_content = f.read()
            logger.info(
                f"📄 Paper file loaded: {paper_file_path} ({len(paper_content)} chars)"
            )

        # Also reached when the selected file exists but is empty
        if not paper_content:
            logger.warning(
                f"⚠️ No .md file found in {paper_dir}, agents will search for it"
            )
    except Exception as e:
        logger.warning(f"⚠️ Error reading paper file: {e}, agents will search for it")

    # STEP 2: Configure agents with minimal tool access
    search_server_names = get_search_server_names()
    # NOTE(review): this adaptive config is replaced unconditionally just below;
    # the call is kept so existing behavior (and the import) is unchanged.
    agent_config = get_adaptive_agent_config(use_segmentation, search_server_names)
    prompts = get_adaptive_prompts(use_segmentation)

    if paper_content:
        # Paper text is embedded in the prompt: no filesystem server is needed,
        # only the search servers remain for the algorithm/planner agents
        agent_config = {
            "concept_analysis": [],
            "algorithm_analysis": search_server_names,
            "code_planner": search_server_names,
        }
    else:
        # Paper could not be pre-loaded: agents get filesystem access to find it
        agent_config = {
            "concept_analysis": ["filesystem"],
            "algorithm_analysis": search_server_names + ["filesystem"],
            "code_planner": search_server_names + ["filesystem"],
        }

    print(f"   Agent configurations: {agent_config}")

    concept_analysis_agent = Agent(
        name="ConceptAnalysisAgent",
        instruction=prompts["concept_analysis"],
        server_names=agent_config["concept_analysis"],
    )
    algorithm_analysis_agent = Agent(
        name="AlgorithmAnalysisAgent",
        instruction=prompts["algorithm_analysis"],
        server_names=agent_config["algorithm_analysis"],
    )
    code_planner_agent = Agent(
        name="CodePlannerAgent",
        instruction=prompts["code_planning"],
        server_names=agent_config["code_planner"],
    )

    code_aggregator_agent = ParallelLLM(
        fan_in_agent=code_planner_agent,
        fan_out_agents=[concept_analysis_agent, algorithm_analysis_agent],
        llm_factory=get_preferred_llm_class(),
    )

    base_max_tokens, _ = get_token_limits()

    # STEP 3: Configure parameters - minimal tool filter since paper content is provided
    if use_segmentation:
        max_tokens_limit = base_max_tokens
        temperature = 0.2
        max_iterations = 5
        print(
            f"🧠 Using SEGMENTED mode: max_tokens={base_max_tokens} for complete YAML output"
        )

        # Segmentation mode: Only use segmentation tools if needed (paper content already provided)
        tool_filter = {
            "document-segmentation": {"read_document_segments", "get_document_overview"}
            if not paper_content
            else set(),  # Empty if paper already loaded
            # "brave" not in filter = all brave tools available for searching
        }
    else:
        max_tokens_limit = base_max_tokens
        temperature = 0.3
        max_iterations = 2
        print(
            f"🧠 Using TRADITIONAL mode: max_tokens={base_max_tokens} for complete YAML output"
        )

        # Traditional mode: No filesystem tools needed (paper content already provided)
        if paper_content:
            tool_filter = {
                # Only brave search available - no filesystem tools needed
            }
        else:
            tool_filter = {
                "filesystem": {
                    "read_text_file",
                    "list_directory",
                }
            }

    # An empty filter dict is sent as None; presumably RequestParams treats
    # None as "no filtering" - TODO confirm against RequestParams.
    effective_tool_filter = tool_filter or None

    enhanced_params = RequestParams(
        maxTokens=max_tokens_limit,
        temperature=temperature,
        max_iterations=max_iterations,
        tool_filter=effective_tool_filter,
    )

    # STEP 4: Construct message with paper content directly included
    if paper_content:
        # Paper content provided directly - LLM only needs to analyze, not read files
        message = f"""Analyze the research paper provided below. The paper file has been pre-loaded for you.

=== PAPER CONTENT START ===
{paper_content}
=== PAPER CONTENT END ===

Based on this paper, generate a comprehensive code reproduction plan that includes:

1. Complete system architecture and component breakdown
2. All algorithms, formulas, and implementation details
3. Detailed file structure and implementation roadmap

You may use web search (brave_web_search) if you need clarification on algorithms, methods, or concepts.

The goal is to create a reproduction plan detailed enough for independent implementation."""
    else:
        # Fallback: paper not found, agents will need to find it
        message = f"""Analyze the research paper in directory: {paper_dir}

Please locate and analyze the markdown (.md) file containing the research paper. Based on your analysis, generate a comprehensive code reproduction plan that includes:

1. Complete system architecture and component breakdown
2. All algorithms, formulas, and implementation details
3. Detailed file structure and implementation roadmap

The goal is to create a reproduction plan detailed enough for independent implementation."""

    max_retries = 3
    retry_count = 0

    while retry_count < max_retries:
        try:
            print(
                f"🚀 Attempting code analysis (attempt {retry_count + 1}/{max_retries})"
            )
            result = await code_aggregator_agent.generate_str(
                message=message, request_params=enhanced_params
            )

            print(f"🔍 Code analysis result:\n{result}")

            completeness_score = _assess_output_completeness(
                result
            )  # need to add file structure val
            print(f"📊 Output completeness score: {completeness_score:.2f}/1.0")

            if completeness_score >= 0.8:
                print(
                    f"✅ Code analysis completed successfully (length: {len(result)} chars)"
                )
                return result
            else:
                print(
                    f"⚠️ Output appears truncated (score: {completeness_score:.2f}), retrying with enhanced parameters..."
                )
                new_max_tokens, new_temperature = _adjust_params_for_retry(
                    enhanced_params, retry_count
                )
                enhanced_params = RequestParams(
                    maxTokens=new_max_tokens,
                    temperature=new_temperature,
                    max_iterations=max_iterations,
                    tool_filter=effective_tool_filter,
                )
                retry_count += 1

        except Exception as e:
            print(f"❌ Error in code analysis attempt {retry_count + 1}: {e}")
            retry_count += 1
            # A failure on the last attempt propagates; earlier failures retry
            # with the parameters unchanged
            if retry_count >= max_retries:
                raise

    # Only reachable when the final attempt produced a (low-scoring) result,
    # so `result` is always bound here
    print(f"⚠️ Returning potentially incomplete result after {max_retries} attempts")
    return result


async def github_repo_download(search_result: str, paper_dir: str, logger) -> str:
    """
    Ask an LLM-backed agent to download the repositories named in a search result.

    Args:
        search_result: Text sent verbatim to the agent as its message
        paper_dir: Paper directory; the agent is instructed to download into
            `{paper_dir}/code_base`
        logger: Logger instance (accepted for interface parity; not used here)

    Returns:
        str: The string generated by the agent's LLM
    """
    download_instruction = f"Download github repo to the directory {paper_dir}/code_base"
    agent = Agent(
        name="GithubDownloadAgent",
        instruction=download_instruction,
        server_names=["filesystem", "github-downloader"],
    )

    async with agent:
        print("GitHub downloader: Downloading repositories...")
        llm = await agent.attach_llm(get_preferred_llm_class())

        # RequestParams takes the token limit under the camelCase name
        params = RequestParams(maxTokens=4096, temperature=0.1)

        reply = await llm.generate_str(message=search_result, request_params=params)
        return reply


async def paper_reference_analyzer(paper_dir: str, logger) -> str:
    """
    Run the paper reference analysis through an LLM-backed agent.

    The agent is given the "filesystem" and "fetch" servers, restricted to the
    `read_text_file`, `list_directory` and `fetch` tools, and is asked to find
    the paper markdown in `paper_dir` and analyze its references.

    Args:
        paper_dir: Directory containing the research paper markdown file
        logger: Logger instance (accepted for interface parity; not used here)

    Returns:
        str: Reference analysis result generated by the agent's LLM
    """
    message = f"""Analyze the research paper in directory: {paper_dir}

Please locate and analyze the markdown (.md) file containing the research paper. **Focus specifically on the References/Bibliography section** to identify and analyze the 5 most relevant references that have GitHub repositories.

Goal: Find the most valuable GitHub repositories from the paper's reference list for code implementation reference."""

    agent = Agent(
        name="ReferenceAnalysisAgent",
        instruction=PAPER_REFERENCE_ANALYZER_PROMPT,
        server_names=["filesystem", "fetch"],
    )

    async with agent:
        print("Reference analyzer: Connected to server, analyzing references...")
        llm = await agent.attach_llm(get_preferred_llm_class())

        # Expose only the tools reference analysis actually needs
        allowed_tools = {
            "filesystem": {"read_text_file", "list_directory"},
            "fetch": {"fetch"},
        }
        params = RequestParams(
            maxTokens=4096,
            temperature=0.2,
            tool_filter=allowed_tools,
        )

        return await llm.generate_str(message=message, request_params=params)


async def _process_input_source(input_source: str, logger) -> str:
    """
    Normalize an input source by removing a leading ``file://`` scheme.

    Anything that does not start with ``file://`` is returned untouched. On
    Windows (``os.name == "nt"``) every leading slash left after the scheme is
    also removed, so ``file:///C:/x`` becomes ``C:/x``.

    Args:
        input_source: Input source (file path, ``file://`` URL, or other text)
        logger: Logger instance (accepted for interface parity; not used here)

    Returns:
        str: The local path for ``file://`` inputs, otherwise the input itself
    """
    scheme = "file://"
    if not input_source.startswith(scheme):
        return input_source

    local_path = input_source[len(scheme):]
    if os.name == "nt":
        # lstrip is a no-op when there is no leading slash
        local_path = local_path.lstrip("/")
    return local_path


async def orchestrate_research_analysis_agent(
    input_source: str, logger, progress_callback: Optional[Callable] = None
) -> Tuple[str, str]:
    """
    Run research analysis followed by resource processing.

    The input is first passed to `run_research_analyzer`; after a five second
    pause its result is handed to `run_resource_processor`.

    Args:
        input_source: Research input source for analysis
        logger: Logger instance for process tracking
        progress_callback: Optional callable invoked as `(percent, message)`
            before each of the two steps (10, then 25)

    Returns:
        tuple: (analysis_result, resource_processing_result)
    """

    def report(percent, text):
        # Progress reporting is optional
        if progress_callback:
            progress_callback(percent, text)

    # Step 1: Research Analysis
    report(10, "📊 Analyzing research content and extracting key information...")
    analysis = await run_research_analyzer(input_source, logger)

    # Add brief pause for system stability
    await asyncio.sleep(5)

    # Step 2: Download Processing
    report(25, "📥 Processing downloads and preparing document structure...")
    downloaded = await run_resource_processor(analysis, logger)
    print("download result:", downloaded)

    return analysis, downloaded


async def synthesize_workspace_infrastructure_agent(
    download_result: str, logger, workspace_dir: Optional[str] = None
) -> Dict[str, str]:
    """
    Build the workspace path metadata for a processed paper.

    `FileProcessor.process_file_input` resolves the paper directory from the
    download result; every artifact path in the returned mapping is a fixed
    file name joined onto that directory.

    Args:
        download_result: Resource processing result from analysis agent
        logger: Logger instance (accepted for interface parity; not used here)
        workspace_dir: Optional workspace directory, forwarded as `base_dir`

    Returns:
        dict: `paper_dir`, `standardized_text`, the artifact paths
            (`reference_path`, `initial_plan_path`, `download_path`,
            `index_report_path`, `implementation_report_path`) and
            `workspace_dir` (None when not supplied)
    """
    # Parse download result to get file information
    processed = await FileProcessor.process_file_input(
        download_result, base_dir=workspace_dir
    )
    paper_dir = processed["paper_dir"]

    # Log workspace infrastructure synthesis
    print("🏗️ Intelligent workspace infrastructure synthesized:")
    print(f"   Base workspace environment: {workspace_dir or 'auto-detected'}")
    print(f"   Research workspace: {paper_dir}")
    print("   AI-driven path optimization: active")

    # (metadata key, file name inside the paper directory)
    artifact_files = (
        ("reference_path", "reference.txt"),
        ("initial_plan_path", "initial_plan.txt"),
        ("download_path", "github_download.txt"),
        ("index_report_path", "codebase_index_report.txt"),
        ("implementation_report_path", "code_implementation_report.txt"),
    )

    workspace_info = {
        "paper_dir": paper_dir,
        "standardized_text": processed["standardized_text"],
    }
    for key, filename in artifact_files:
        workspace_info[key] = os.path.join(paper_dir, filename)
    workspace_info["workspace_dir"] = workspace_dir

    return workspace_info


async def orchestrate_reference_intelligence_agent(
    dir_info: Dict[str, str], logger, progress_callback: Optional[Callable] = None
) -> str:
    """
    Return the reference analysis for a paper, reusing a saved copy if present.

    When the file at `dir_info["reference_path"]` already exists its content is
    returned as-is. Otherwise `paper_reference_analyzer` is run on
    `dir_info["paper_dir"]` and its output is written to that file.

    Args:
        dir_info: Workspace infrastructure metadata
        logger: Logger instance for intelligence tracking
        progress_callback: Optional callable invoked once as `(50, message)`

    Returns:
        str: Reference analysis text (cached or freshly generated)
    """
    if progress_callback:
        progress_callback(50, "🧠 Orchestrating reference intelligence discovery...")

    cache_file = dir_info["reference_path"]

    if not os.path.exists(cache_file):
        # Nothing saved yet: run the analysis and persist it for later runs
        analysis_text = await paper_reference_analyzer(dir_info["paper_dir"], logger)

        with open(cache_file, "w", encoding="utf-8") as out:
            out.write(analysis_text)
        print(f"Reference analysis saved to {cache_file}")

        return analysis_text

    print(f"Found existing reference analysis at {cache_file}")
    with open(cache_file, "r", encoding="utf-8") as cached:
        return cached.read()


async def orchestrate_document_preprocessing_agent(
    dir_info: Dict[str, str], logger
) -> Dict[str, Any]:
    """
    Orchestrate adaptive document preprocessing with intelligent segmentation control.

    Reads the paper markdown from `dir_info["paper_dir"]`, asks
    `should_use_document_segmentation` whether to segment it, and runs
    `prepare_document_segments` when segmentation is chosen. The decision is
    written back into `dir_info` under `use_segmentation` / `segments_ready`
    (and `segments_dir` on success) for downstream agents.

    A file with an `.md` name whose content starts with the `%PDF` signature is
    converted with `tools.pdf_downloader.SimplePdfConverter` before reading.

    Args:
        dir_info: Workspace infrastructure metadata (mutated in place)
        logger: Logger instance for preprocessing tracking

    Returns:
        dict: Document preprocessing result with segmentation metadata. The
            `status` is one of "skipped", "error", "fallback_to_traditional",
            "traditional", or whatever `prepare_document_segments` returned on
            success.
    """

    try:
        print("🔍 Starting adaptive document preprocessing...")
        print(f"   Paper directory: {dir_info['paper_dir']}")

        # Step 1: Check if any markdown files exist
        md_files = []
        try:
            # Sorted because os.listdir() order is arbitrary; the generated
            # implementation summary is not a paper, so it is never a candidate
            md_files = sorted(
                f
                for f in os.listdir(dir_info["paper_dir"])
                if f.endswith(".md")
                and not f.endswith("implement_code_summary.md")
            )
        except Exception as e:
            print(f"⚠️ Error reading paper directory: {e}")

        if not md_files:
            print("ℹ️ No markdown files found - skipping document preprocessing")
            dir_info["segments_ready"] = False
            dir_info["use_segmentation"] = False
            return {
                "status": "skipped",
                "reason": "no_markdown_files",
                "paper_dir": dir_info["paper_dir"],
                "segments_ready": False,
                "use_segmentation": False,
            }

        # Step 2: Read document content to determine size
        md_path = os.path.join(dir_info["paper_dir"], md_files[0])
        try:
            # Check if file is actually a PDF by reading the first few bytes.
            # The handle is closed before any conversion touches the file.
            with open(md_path, "rb") as f:
                is_pdf = f.read(8).startswith(b"%PDF")

            if is_pdf:
                # If we find a PDF file where we expected markdown, try to convert it
                print(f"⚠️ Found PDF file instead of markdown: {md_path}")
                print("🔄 Attempting to convert PDF to markdown...")

                try:
                    from tools.pdf_downloader import SimplePdfConverter

                    converter = SimplePdfConverter()
                    conversion_result = converter.convert_pdf_to_markdown(md_path)
                    converted_ok = conversion_result["success"]
                    failure_detail = (
                        None if converted_ok else conversion_result["error"]
                    )
                except Exception as conv_error:
                    # Import/converter crash: report once and keep the cause
                    raise IOError(
                        f"File {md_path} is a PDF file, not a text file. PDF conversion failed: {str(conv_error)}"
                    ) from conv_error

                if not converted_ok:
                    # Raised outside the try above so it is not re-wrapped
                    raise IOError(
                        f"File {md_path} is a PDF file, not a text file. PDF conversion failed: {failure_detail}"
                    )

                print(
                    f"✅ PDF converted to markdown: {conversion_result['output_file']}"
                )
                # Use the converted markdown file instead
                md_path = conversion_result["output_file"]

            with open(md_path, "r", encoding="utf-8") as f:
                document_content = f.read()
        except Exception as e:
            print(f"⚠️ Error reading document content: {e}")
            dir_info["segments_ready"] = False
            dir_info["use_segmentation"] = False
            return {
                "status": "error",
                "error_message": f"Failed to read document: {str(e)}",
                "paper_dir": dir_info["paper_dir"],
                "segments_ready": False,
                "use_segmentation": False,
            }

        # Step 3: Determine if segmentation should be used
        should_segment, reason = should_use_document_segmentation(document_content)

        print(f"📊 Segmentation decision: {should_segment}")
        print(f"   Reason: {reason}")

        # Store decision in dir_info for downstream agents
        dir_info["use_segmentation"] = should_segment

        if should_segment:
            print("🔧 Using intelligent document segmentation workflow...")

            # Prepare document segments using the segmentation agent
            segmentation_result = await prepare_document_segments(
                paper_dir=dir_info["paper_dir"], logger=logger
            )

            if segmentation_result["status"] == "success":
                print("✅ Document segmentation completed successfully!")
                print(f"   Segments directory: {segmentation_result['segments_dir']}")
                print("   🧠 Intelligent segments ready for planning agents")

                # Add segment information to dir_info for downstream agents
                dir_info["segments_dir"] = segmentation_result["segments_dir"]
                dir_info["segments_ready"] = True

                return segmentation_result

            else:
                print(
                    f"⚠️ Document segmentation failed: {segmentation_result.get('error_message', 'Unknown error')}"
                )
                print("   Falling back to traditional full-document processing...")
                dir_info["segments_ready"] = False
                dir_info["use_segmentation"] = False

                return {
                    "status": "fallback_to_traditional",
                    "original_error": segmentation_result.get(
                        "error_message", "Unknown error"
                    ),
                    "paper_dir": dir_info["paper_dir"],
                    "segments_ready": False,
                    "use_segmentation": False,
                    "fallback_reason": "segmentation_failed",
                }
        else:
            print("📖 Using traditional full-document reading workflow...")
            dir_info["segments_ready"] = False

            return {
                "status": "traditional",
                "reason": reason,
                "paper_dir": dir_info["paper_dir"],
                "segments_ready": False,
                "use_segmentation": False,
                "document_size": len(document_content),
            }

    except Exception as e:
        print(f"❌ Error during document preprocessing: {e}")
        print("   Continuing with traditional full-document processing...")

        # Ensure fallback settings
        dir_info["segments_ready"] = False
        dir_info["use_segmentation"] = False

        return {
            "status": "error",
            "paper_dir": dir_info["paper_dir"],
            "segments_ready": False,
            "use_segmentation": False,
            "error_message": str(e),
        }


async def orchestrate_code_planning_agent(
    dir_info: Dict[str, str], logger, progress_callback: Optional[Callable] = None
):
    """
    Generate the initial code reproduction plan unless one is already saved.

    When `dir_info["initial_plan_path"]` exists nothing is done. Otherwise the
    paper directory must contain at least one markdown file (the generated
    `implement_code_summary.md` does not count); `run_code_analyzer` is then
    run and its output written to the plan path.

    Args:
        dir_info: Workspace infrastructure metadata
        logger: Logger instance for planning tracking
        progress_callback: Optional callable invoked once as `(40, message)`

    Raises:
        ValueError: If no markdown file is available to analyze, or the
            generated plan is empty or shorter than 100 characters
    """
    if progress_callback:
        progress_callback(40, "🏗️ Synthesizing intelligent code architecture...")

    initial_plan_path = dir_info["initial_plan_path"]

    # An existing plan is reused untouched
    if os.path.exists(initial_plan_path):
        return

    # Use segmentation setting from preprocessing phase
    use_segmentation = dir_info.get("use_segmentation", True)
    print(f"📊 Planning mode: {'Segmented' if use_segmentation else 'Traditional'}")

    # First, verify there's a markdown file to analyze
    import glob

    paper_dir = dir_info["paper_dir"]
    # Escape the directory so glob metacharacters in the path ("[", "*", "?")
    # are matched literally; only the "*.md" part is a pattern.
    md_pattern = os.path.join(glob.escape(paper_dir), "*.md")
    md_files = sorted(
        path
        for path in glob.glob(md_pattern)
        if not path.endswith("implement_code_summary.md")  # Exclude summary
    )

    if not md_files:
        error_msg = f"❌ No markdown file found in {paper_dir}. PDF conversion may have failed."
        print(error_msg)
        print(f"   Paper directory: {paper_dir}")
        print(f"   Directory exists: {os.path.exists(paper_dir)}")
        if os.path.exists(paper_dir):
            all_files = os.listdir(paper_dir)
            print(f"   Available files ({len(all_files)}): {all_files}")

            # Check for PDF files that might need conversion
            pdf_files = [f for f in all_files if f.endswith(".pdf")]
            if pdf_files:
                print(f"   Found PDF files that weren't converted: {pdf_files}")
        else:
            print("   ⚠️ Directory doesn't exist!")
        raise ValueError(error_msg)

    print(f"📄 Found markdown file for analysis: {os.path.basename(md_files[0])}")

    initial_plan_result = await run_code_analyzer(
        paper_dir, logger, use_segmentation=use_segmentation
    )

    # Check if plan is empty or invalid
    if not initial_plan_result or len(initial_plan_result.strip()) < 100:
        # Guard the length so a None result still produces the ValueError
        # below instead of a TypeError while building the message
        plan_length = len(initial_plan_result) if initial_plan_result else 0
        error_msg = f"❌ Code planning failed: Generated plan is empty or too short ({plan_length} chars)"
        print(error_msg)
        raise ValueError(error_msg)

    with open(initial_plan_path, "w", encoding="utf-8") as f:
        f.write(initial_plan_result)
    print(
        f"✅ Initial plan saved to {initial_plan_path} ({len(initial_plan_result)} chars)"
    )


async def automate_repository_acquisition_agent(
    reference_result: str,
    dir_info: Dict[str, str],
    logger,
    progress_callback: Optional[Callable] = None,
):
    """
    Download the repositories named in the reference analysis and record the outcome.

    After a five second pause, `github_repo_download` is run and its output is
    written to `dir_info["download_path"]`. The `code_base` directory under the
    paper directory is then inspected and a summary of what was found is
    printed. On any error the message is written to the same file and the
    exception is re-raised.

    Args:
        reference_result: Reference intelligence analysis result
        dir_info: Workspace infrastructure metadata
        logger: Logger instance for acquisition tracking
        progress_callback: Optional callable invoked once as `(60, message)`

    Raises:
        Exception: Whatever error occurred during download, saving or verification
    """
    if progress_callback:
        progress_callback(60, "🤖 Automating intelligent repository acquisition...")

    await asyncio.sleep(5)  # Brief pause for stability

    try:
        outcome = await github_repo_download(
            reference_result, dir_info["paper_dir"], logger
        )

        # Save download results
        with open(dir_info["download_path"], "w", encoding="utf-8") as report:
            report.write(outcome)
        print(f"GitHub download results saved to {dir_info['download_path']}")

        # Verify if any repositories were actually downloaded
        repos_root = os.path.join(dir_info["paper_dir"], "code_base")
        if not os.path.exists(repos_root):
            print(f"Code base directory was not created: {repos_root}")
        else:
            # Visible (non-dot) sub-directories count as downloaded repositories
            found_repos = []
            for entry in os.listdir(repos_root):
                if os.path.isdir(os.path.join(repos_root, entry)):
                    if not entry.startswith("."):
                        found_repos.append(entry)

            if found_repos:
                print(
                    f"Successfully downloaded {len(found_repos)} repositories: {found_repos}"
                )
            else:
                for line in (
                    "GitHub download phase completed, but no repositories were found in the code_base directory",
                    "This might indicate:",
                    "1. No relevant repositories were identified in the reference analysis",
                    "2. Repository downloads failed due to access permissions or network issues",
                    "3. The download agent encountered errors during the download process",
                ):
                    print(line)

    except Exception as e:
        print(f"Error during GitHub repository download: {e}")
        # Still save the error information
        failure_text = f"GitHub download failed: {str(e)}"
        with open(dir_info["download_path"], "w", encoding="utf-8") as report:
            report.write(failure_text)
        print(f"GitHub download error saved to {dir_info['download_path']}")
        raise e  # Re-raise to be handled by the main pipeline


async def orchestrate_codebase_intelligence_agent(
    dir_info: Dict[str, str], logger, progress_callback: Optional[Callable] = None
) -> Dict:
    """
    Index the downloaded reference repositories, if there are any.

    Looks for visible sub-directories of `<paper_dir>/code_base`. With none
    present the step is skipped (a skip report is written when the directory
    exists but is empty). Otherwise `run_codebase_indexing` is run; a
    successful result is written to `dir_info["index_report_path"]`. Failures
    of the indexing workflow are caught, reported to the same file, and
    returned instead of raised.

    Args:
        dir_info: Workspace infrastructure metadata
        logger: Logger instance for intelligence tracking
        progress_callback: Optional callable invoked once as `(70, message)`

    Returns:
        dict: The indexing result, or a dict whose `status` is "skipped" or
            "error" describing why indexing did not complete
    """
    if progress_callback:
        progress_callback(70, "🧮 Orchestrating codebase intelligence analysis...")

    print(
        "Initiating intelligent codebase analysis with AI-powered relationship mapping..."
    )
    await asyncio.sleep(2)  # Brief pause before starting indexing

    report_path = dir_info["index_report_path"] if False else None  # placeholder never read
    del report_path

    # Check if code_base directory exists and has content
    repos_root = os.path.join(dir_info["paper_dir"], "code_base")
    if not os.path.exists(repos_root):
        print(f"Code base directory not found: {repos_root}")
        return {
            "status": "skipped",
            "message": "No code base directory found - skipping indexing",
        }

    # Check if there are any repositories in the code_base directory
    try:
        repo_dirs = []
        for entry in os.listdir(repos_root):
            if os.path.isdir(os.path.join(repos_root, entry)):
                if not entry.startswith("."):
                    repo_dirs.append(entry)

        if not repo_dirs:
            for line in (
                f"No repositories found in {repos_root}",
                "This might be because:",
                "1. GitHub download phase didn't complete successfully",
                "2. No relevant repositories were identified for download",
                "3. Repository download failed due to access issues",
                "Continuing with code implementation without codebase indexing...",
            ):
                print(line)

            # Save a report about the skipped indexing
            skip_report = {
                "status": "skipped",
                "reason": "no_repositories_found",
                "message": f"No repositories found in {repos_root}",
                "suggestions": [
                    "Check if GitHub download phase completed successfully",
                    "Verify if relevant repositories were identified in reference analysis",
                    "Check network connectivity and GitHub access permissions",
                ],
            }

            with open(dir_info["index_report_path"], "w", encoding="utf-8") as out:
                out.write(str(skip_report))
            print(f"Indexing skip report saved to {dir_info['index_report_path']}")

            return skip_report

    except Exception as scan_error:
        print(f"Error checking code base directory: {scan_error}")
        return {
            "status": "error",
            "message": f"Error checking code base directory: {str(scan_error)}",
        }

    try:
        from workflows.codebase_index_workflow import run_codebase_indexing

        print(f"Found {len(repo_dirs)} repositories to index: {repo_dirs}")

        # Run codebase index workflow
        index_result = await run_codebase_indexing(
            paper_dir=dir_info["paper_dir"],
            initial_plan_path=dir_info["initial_plan_path"],
            config_path="mcp_agent.secrets.yaml",
            logger=logger,
        )

        # Log indexing results
        status = index_result["status"]
        if status == "success":
            print("Code indexing completed successfully!")
            # Prefer the reported repository count; fall back to the number
            # of generated index files when no statistics are present
            if index_result.get("statistics"):
                indexed_count = index_result["statistics"]["total_repositories"]
            else:
                indexed_count = len(index_result["output_files"])
            print(f"Indexed {indexed_count} repositories")
            print(f"Generated {len(index_result['output_files'])} index files")

            # Save indexing results to file
            with open(dir_info["index_report_path"], "w", encoding="utf-8") as out:
                out.write(str(index_result))
            print(f"Indexing report saved to {dir_info['index_report_path']}")

        elif status == "warning":
            print(f"Code indexing completed with warnings: {index_result['message']}")
        else:
            print(f"Code indexing failed: {index_result['message']}")

        return index_result

    except Exception as index_error:
        print(f"Error during codebase indexing workflow: {index_error}")
        print("Continuing with code implementation despite indexing failure...")

        # Save error report
        error_report = {
            "status": "error",
            "message": str(index_error),
            "phase": "codebase_indexing",
            "recovery_action": "continuing_with_code_implementation",
        }

        with open(dir_info["index_report_path"], "w", encoding="utf-8") as out:
            out.write(str(error_report))
        print(f"Indexing error report saved to {dir_info['index_report_path']}")

        return error_report


async def synthesize_code_implementation_agent(
    dir_info: Dict[str, str],
    logger,
    progress_callback: Optional[Callable] = None,
    enable_indexing: bool = True,
) -> Dict:
    """
    Run the code implementation workflow against the saved initial plan.

    The workflow class is chosen from ``enable_indexing``; it is instantiated
    before the plan file is checked. When the plan file is missing the
    implementation is skipped and a ``warning`` result is returned. Any
    exception raised along the way is converted into an ``error`` result
    instead of propagating.

    Args:
        dir_info: Workspace metadata. Reads ``initial_plan_path``,
            ``paper_dir``, ``implementation_report_path`` and the optional
            ``use_segmentation`` flag.
        logger: Logger instance (accepted for interface parity; not used here).
        progress_callback: Optional ``callback(percent, message)`` hook.
        enable_indexing: Select the index-aware workflow when True, the
            standard workflow otherwise.

    Returns:
        dict: The workflow result, or a ``{"status", "message"}`` dict for the
        skipped / failed cases.
    """
    if progress_callback:
        progress_callback(85, "🔬 Synthesizing intelligent code implementation...")

    print(
        "Launching intelligent code synthesis with AI-driven implementation strategies..."
    )
    # Short delay before kicking off the implementation workflow.
    await asyncio.sleep(3)

    try:
        # Pick the workflow flavour first; construction happens even when the
        # plan file later turns out to be missing.
        if not enable_indexing:
            print("⚡ Using standard code implementation workflow (fast mode)...")
            workflow = CodeImplementationWorkflow()
        else:
            print(
                "🔍 Using enhanced code implementation workflow with reference indexing..."
            )
            workflow = CodeImplementationWorkflowWithIndex()

        plan_path = dir_info["initial_plan_path"]

        # Guard clause: nothing to implement without a plan.
        if not os.path.exists(plan_path):
            print(
                f"Initial plan file not found at {plan_path}, skipping code implementation"
            )
            return {
                "status": "warning",
                "message": "Initial plan not found - code implementation skipped",
            }

        print(f"Using initial plan from {plan_path}")

        # The segmentation flag is only reported here; it is not passed on.
        segmentation_enabled = dir_info.get("use_segmentation", False)
        print(f"🔧 Code implementation using segmentation: {segmentation_enabled}")

        outcome = await workflow.run_workflow(
            plan_file_path=plan_path,
            target_directory=dir_info["paper_dir"],
            pure_code_mode=True,  # Focus on code implementation, skip testing
        )

        if outcome["status"] != "success":
            print(
                f"Code implementation failed: {outcome.get('message', 'Unknown error')}"
            )
            return outcome

        print("Code implementation completed successfully!")
        print(f"Code directory: {outcome['code_directory']}")

        # Persist the raw result dict as the implementation report.
        report_path = dir_info["implementation_report_path"]
        with open(report_path, "w", encoding="utf-8") as report_file:
            report_file.write(str(outcome))
        print(f"Implementation report saved to {report_path}")

        return outcome

    except Exception as exc:
        print(f"Error during code implementation workflow: {exc}")
        return {"status": "error", "message": str(exc)}


async def run_chat_planning_agent(user_input: str, logger) -> str:
    """
    Turn free-form coding requirements into an implementation plan.

    Builds a ``ChatPlanningAgent``, attaches the preferred LLM and asks it to
    produce a plan for ``user_input``. Every failure is printed and re-raised.

    Args:
        user_input: User's coding requirements and description.
        logger: Logger instance; if it exposes ``log_response`` the raw plan
            is forwarded to it.

    Returns:
        str: The plan text returned by the LLM.

    Raises:
        ValueError: If ``user_input`` is empty/blank or the LLM returns an
            empty/blank plan.
    """
    try:
        print("💬 Starting chat-based planning agent...")
        input_length = len(user_input) if user_input else 0
        print(f"Input length: {input_length}")
        input_preview = user_input[:200] if user_input else "None"
        print(f"Input preview: {input_preview}...")

        # Reject None, empty and whitespace-only input before touching the agent.
        if not (user_input and user_input.strip() != ""):
            raise ValueError(
                "Empty or None user_input provided to run_chat_planning_agent"
            )

        agent = Agent(
            name="ChatPlanningAgent",
            instruction=CHAT_AGENT_PLANNING_PROMPT,
            server_names=get_search_server_names(),  # Dynamic search server configuration
        )

        async with agent:
            print("chat_planning: Connected to server, calling list_tools...")
            # Listing tools is diagnostic only: a failure is reported and ignored.
            try:
                available_tools = await agent.list_tools()
                if hasattr(available_tools, "model_dump"):
                    tools_repr = available_tools.model_dump()
                else:
                    tools_repr = str(available_tools)
                print("Tools available:", tools_repr)
            except Exception as tools_error:
                print(f"Failed to list tools: {tools_error}")

            # Without an LLM there is nothing to do, so this failure is fatal.
            try:
                llm = await agent.attach_llm(get_preferred_llm_class())
                print("✅ LLM attached successfully")
            except Exception as attach_error:
                print(f"❌ Failed to attach LLM: {attach_error}")
                raise

            # Larger output budget and low temperature for a structured plan.
            planning_params = RequestParams(
                maxTokens=8192,  # camelCase parameter name
                temperature=0.2,
            )

            print(
                f"🔄 Making LLM request with params: maxTokens={planning_params.maxTokens}, temperature={planning_params.temperature}"
            )

            prompt_message = f"""Please analyze the following coding requirements and generate a comprehensive implementation plan:

User Requirements:
{user_input}

Please provide a detailed implementation plan that covers all aspects needed for successful development."""

            try:
                plan_text = await llm.generate_str(
                    message=prompt_message, request_params=planning_params
                )

                print("✅ Planning request completed")
                print(f"Raw result type: {type(plan_text)}")
                plan_length = len(plan_text) if plan_text else 0
                print(f"Raw result length: {plan_length}")

                if not plan_text:
                    print("❌ CRITICAL: raw_result is empty or None!")
                    raise ValueError("Chat planning agent returned empty result")

            except Exception as generation_error:
                print(f"❌ Planning generation failed: {generation_error}")
                print(f"Exception type: {type(generation_error)}")
                raise

            # Forward the raw plan to loggers that support response logging.
            if hasattr(logger, "log_response"):
                logger.log_response(
                    plan_text, model="ChatPlanningAgent", agent="ChatPlanningAgent"
                )

            # Second check also rejects whitespace-only output.
            if not (plan_text and plan_text.strip() != ""):
                print("❌ CRITICAL: Planning result is empty!")
                raise ValueError("Chat planning agent produced empty output")

            print("🎯 Chat planning completed successfully")
            print(f"Planning result preview: {plan_text[:500]}...")

            return plan_text

    except Exception as failure:
        print(f"❌ run_chat_planning_agent failed: {failure}")
        print(f"Exception details: {type(failure).__name__}: {str(failure)}")
        raise


def _reuse_organized_paper_input(input_source: str) -> Optional[str]:
    """
    Detect an input that already lives in a ``paper_<digits>`` folder.

    The input qualifies when it is a JSON object whose ``paper_path`` sits
    directly inside a directory named ``paper_<digits>``. For such inputs the
    research analysis phase can be skipped; a ``.pdf`` paper is additionally
    converted to markdown on a best-effort basis.

    Args:
        input_source: Candidate input string (path, URL or JSON document).

    Returns:
        The download result to hand to workspace synthesis (the original JSON,
        or the JSON with ``paper_path`` rewritten to the converted markdown
        file), or ``None`` when the input is not pre-organized and must go
        through normal processing.
    """
    import json
    import re

    try:
        payload = json.loads(input_source)
    except ValueError:
        # json.JSONDecodeError subclasses ValueError; plain paths/URLs end up
        # here. Catching only this keeps KeyboardInterrupt/SystemExit intact.
        return None

    # Valid JSON that is not an object with a string paper_path is not ours.
    if not isinstance(payload, dict):
        return None
    paper_path = payload.get("paper_path")
    if not isinstance(paper_path, str):
        return None

    paper_dir = os.path.dirname(paper_path)
    if not re.match(r"paper_\d+$", os.path.basename(paper_dir)):
        return None

    print(f"✅ File already in organized folder: {paper_dir}")
    print("   Skipping research analysis phase (file already processed)")

    if not paper_path.endswith(".pdf"):
        return input_source

    # Best-effort PDF -> markdown conversion; any failure falls back to the
    # original input so the pipeline can continue.
    print("🔄 Converting PDF to markdown...")
    try:
        from tools.pdf_downloader import SimplePdfConverter

        conversion_result = SimplePdfConverter().convert_pdf_to_markdown(paper_path)
        if conversion_result["success"]:
            print(
                f"✅ PDF converted to markdown: {conversion_result['output_file']}"
            )
            # Point paper_path at the markdown file for downstream phases.
            payload["paper_path"] = conversion_result["output_file"]
            return json.dumps(payload)
        print(f"⚠️ PDF conversion failed: {conversion_result.get('error')}")
    except Exception as e:
        print(f"⚠️ PDF conversion error: {e}")
    return input_source


async def execute_multi_agent_research_pipeline(
    input_source: str,
    logger,
    progress_callback: Optional[Callable] = None,
    enable_indexing: bool = True,
) -> str:
    """
    Execute the complete multi-agent research-to-code pipeline.

    Phases, in order: workspace setup, input processing, research analysis
    (skipped for inputs already organized in a ``paper_<digits>`` folder),
    workspace infrastructure synthesis, document preprocessing, code planning,
    reference analysis, repository acquisition, codebase indexing and code
    implementation. The reference / repository / indexing phases only run when
    ``enable_indexing`` is True; otherwise placeholder files are written so
    the workspace file layout stays the same.

    Args:
        input_source: Research input source (file path, URL, or preprocessed
            analysis / JSON download result).
        logger: Logger instance passed through to the individual agents.
        progress_callback: Optional ``callback(percent, message)`` hook. On
            failure it is additionally invoked as
            ``callback(0, "Pipeline failed", error_message)``.
        enable_indexing: Whether to run the reference/indexing phases
            (default: True).

    Returns:
        str: Human-readable summary with indexing and implementation status.

    Raises:
        Exception: Any error raised by a phase is reported and re-raised.
    """
    try:
        # Phase 0: Workspace Setup (5%)
        if progress_callback:
            progress_callback(5, "🔄 Setting up workspace for file processing...")

        print("🚀 Initializing intelligent multi-agent research orchestration system")
        print("📊 Progress: 5% - Workspace Setup")

        # Setup local workspace directory
        workspace_dir = os.path.join(os.getcwd(), "deepcode_lab")
        os.makedirs(workspace_dir, exist_ok=True)

        print("📁 Working environment: local")
        print(f"📂 Workspace directory: {workspace_dir}")
        print("✅ Workspace status: ready")

        # Log intelligence functionality status
        if enable_indexing:
            print("🧠 Advanced intelligence analysis enabled - comprehensive workflow")
        else:
            print("⚡ Optimized mode - advanced intelligence analysis disabled")

        # Phase 1: Input Processing and Validation (10%)
        if progress_callback:
            progress_callback(10, "📄 Processing and validating input source...")
        print("📊 Progress: 10% - Input Processing")

        input_source = await _process_input_source(input_source, logger)

        # Phase 2: Research Analysis and Resource Processing (25%)
        if progress_callback:
            progress_callback(
                25, "🔍 Analyzing research content and downloading resources..."
            )
        print("📊 Progress: 25% - Research Analysis")

        # Inputs already organized in a paper_<digits> folder skip analysis.
        download_result = (
            _reuse_organized_paper_input(input_source)
            if isinstance(input_source, str)
            else None
        )

        if download_result is None:
            needs_analysis = isinstance(input_source, str) and (
                input_source.endswith((".pdf", ".docx", ".txt", ".html", ".md"))
                or input_source.startswith(("http", "file://"))
            )
            if needs_analysis:
                # Only the download result is consumed by later phases.
                (
                    _analysis_result,
                    download_result,
                ) = await orchestrate_research_analysis_agent(
                    input_source, logger, progress_callback
                )
            else:
                download_result = input_source  # Use input directly if already processed

        # Phase 3: Workspace Infrastructure Synthesis (40%)
        if progress_callback:
            progress_callback(
                40, "🏗️ Synthesizing intelligent workspace infrastructure..."
            )
        print("📊 Progress: 40% - Workspace Setup")

        dir_info = await synthesize_workspace_infrastructure_agent(
            download_result, logger, workspace_dir
        )
        await asyncio.sleep(5)

        # Phase 4: Document Segmentation and Preprocessing (50%)
        if progress_callback:
            progress_callback(50, "📄 Processing and segmenting document content...")
        print("📊 Progress: 50% - Document Preprocessing")

        segmentation_result = await orchestrate_document_preprocessing_agent(
            dir_info, logger
        )

        # Handle segmentation result
        if segmentation_result["status"] == "success":
            print("✅ Document preprocessing completed successfully!")
            print(
                f"   📊 Using segmentation: {dir_info.get('use_segmentation', False)}"
            )
            if dir_info.get("segments_ready", False):
                print(
                    f"   📁 Segments directory: {segmentation_result.get('segments_dir', 'N/A')}"
                )
        elif segmentation_result["status"] == "fallback_to_traditional":
            print("⚠️ Document segmentation failed, using traditional processing")
            print(
                f"   Original error: {segmentation_result.get('original_error', 'Unknown')}"
            )
        else:
            print(
                f"⚠️ Document preprocessing encountered issues: {segmentation_result.get('error_message', 'Unknown')}"
            )

        # Phase 5: Code Planning Orchestration (65%)
        if progress_callback:
            progress_callback(
                65, "📋 Generating implementation plan and code structure..."
            )
        print("📊 Progress: 65% - Code Planning")

        await orchestrate_code_planning_agent(dir_info, logger, progress_callback)

        # Phase 6: Reference Intelligence (only when indexing is enabled) (70%)
        if progress_callback:
            progress_callback(70, "🔍 Analyzing references and related work...")
        print("📊 Progress: 70% - Reference Analysis")

        if enable_indexing:
            reference_result = await orchestrate_reference_intelligence_agent(
                dir_info, logger, progress_callback
            )
        else:
            print("🔶 Skipping reference intelligence analysis (fast mode enabled)")
            # Write a placeholder so the workspace file structure stays consistent
            reference_result = "Reference intelligence analysis skipped - fast mode enabled for optimized processing"
            with open(dir_info["reference_path"], "w", encoding="utf-8") as f:
                f.write(reference_result)

        # Phase 7: Repository Acquisition Automation (optional) (75%)
        if progress_callback:
            progress_callback(75, "📦 Acquiring related repositories and codebases...")
        print("📊 Progress: 75% - Repository Acquisition")

        if enable_indexing:
            await automate_repository_acquisition_agent(
                reference_result, dir_info, logger, progress_callback
            )
        else:
            print("🔶 Skipping automated repository acquisition (fast mode enabled)")
            # Write a placeholder so the workspace file structure stays consistent
            with open(dir_info["download_path"], "w", encoding="utf-8") as f:
                f.write(
                    "Automated repository acquisition skipped - fast mode enabled for optimized processing"
                )

        # Phase 8: Codebase Intelligence Orchestration (optional) (80%)
        if progress_callback:
            progress_callback(80, "🧠 Analyzing codebase intelligence and indexing...")
        print("📊 Progress: 80% - Codebase Intelligence")

        if enable_indexing:
            index_result = await orchestrate_codebase_intelligence_agent(
                dir_info, logger, progress_callback
            )
        else:
            print("🔶 Skipping codebase intelligence orchestration (fast mode enabled)")
            # Create a skipped indexing result
            index_result = {
                "status": "skipped",
                "reason": "fast_mode_enabled",
                "message": "Codebase intelligence orchestration skipped for optimized processing",
            }
            with open(dir_info["index_report_path"], "w", encoding="utf-8") as f:
                f.write(str(index_result))

        # Phase 9: Code Implementation Synthesis (85%)
        if progress_callback:
            progress_callback(
                85, "💻 Implementing code based on analysis and planning..."
            )
        print("📊 Progress: 85% - Code Implementation")

        implementation_result = await synthesize_code_implementation_agent(
            dir_info, logger, progress_callback, enable_indexing
        )

        # Phase 10: Finalization (100%)
        if progress_callback:
            progress_callback(100, "🎉 Finalizing results and generating summary...")
        print("📊 Progress: 100% - Finalization")

        # Final Status Report
        if enable_indexing:
            pipeline_summary = (
                f"Multi-agent research pipeline completed for {dir_info['paper_dir']}"
            )
        else:
            pipeline_summary = f"Multi-agent research pipeline completed (fast mode) for {dir_info['paper_dir']}"

        # Add indexing status to summary
        if not enable_indexing:
            pipeline_summary += (
                "\n⚡ Fast mode: GitHub download and codebase indexing skipped"
            )
        elif index_result["status"] == "skipped":
            pipeline_summary += (
                f"\n🔶 Codebase indexing: {index_result.get('message', 'Unknown')}"
            )
        elif index_result["status"] == "error":
            pipeline_summary += f"\n❌ Codebase indexing failed: {index_result.get('message', 'Unknown error')}"
        elif index_result["status"] == "success":
            pipeline_summary += "\n✅ Codebase indexing completed successfully"

        # Add implementation status to summary. ``message`` is read with
        # .get() because a failed workflow result may not carry one; a
        # KeyError here would replace the real failure with "'message'".
        if implementation_result["status"] == "success":
            pipeline_summary += "\n🎉 Code implementation completed successfully!"
            pipeline_summary += (
                f"\n📁 Code generated in: {implementation_result['code_directory']}"
            )
        elif implementation_result["status"] == "warning":
            pipeline_summary += f"\n⚠️ Code implementation: {implementation_result.get('message', 'Unknown warning')}"
        else:
            pipeline_summary += f"\n❌ Code implementation failed: {implementation_result.get('message', 'Unknown error')}"

        return pipeline_summary

    except Exception as e:
        error_msg = f"Error in execute_multi_agent_research_pipeline: {e}"
        print(f"❌ {error_msg}")
        print(f"   Error type: {type(e).__name__}")
        print(f"   Error details: {str(e)}")

        # Display error in UI if progress callback available. The callback is
        # guarded so that a failing/incompatible callback cannot mask the
        # original pipeline error.
        if progress_callback:
            try:
                progress_callback(0, "Pipeline failed", error_msg)
            except Exception as callback_error:
                print(f"⚠️ Progress callback failed while reporting error: {callback_error}")

        # Ensure all resources are cleaned up on error
        import gc

        gc.collect()
        raise


# Backward compatibility alias (deprecated)
async def paper_code_preparation(
    input_source: str, logger, progress_callback: Optional[Callable] = None
) -> str:
    """
    Deprecated entry point kept for backward compatibility.

    Prints a deprecation notice and delegates to
    ``execute_multi_agent_research_pipeline`` with its default indexing
    setting.

    Args:
        input_source: Input source forwarded to the pipeline.
        logger: Logger instance forwarded to the pipeline.
        progress_callback: Optional progress callback forwarded to the pipeline.

    Returns:
        str: The pipeline result.
    """
    deprecation_notice = "paper_code_preparation is deprecated. Use execute_multi_agent_research_pipeline instead."
    print(deprecation_notice)

    # Delegate unchanged; enable_indexing keeps the pipeline's own default.
    pipeline_result = await execute_multi_agent_research_pipeline(
        input_source, logger, progress_callback
    )
    return pipeline_result


async def execute_chat_based_planning_pipeline(
    user_input: str,
    logger,
    progress_callback: Optional[Callable] = None,
    enable_indexing: bool = True,
) -> str:
    """
    Execute the chat-based planning and implementation pipeline.

    Intended for requirements supplied directly through chat: instead of
    analyzing a paper, the plan is generated from ``user_input`` and handed to
    the code implementation workflow.

    Pipeline Flow:
    - Workspace Setup: ensure ``<cwd>/deepcode_lab`` exists
    - Chat Planning: transform user input into an implementation plan
    - Workspace Synthesis: write a synthetic markdown "paper" under
      ``deepcode_lab/papers/chat_project_<timestamp>`` and build ``dir_info``
    - Plan Persistence: save the plan to ``dir_info["initial_plan_path"]``
    - Code Implementation: generate code based on the plan

    Args:
        user_input: User's coding requirements and description
        logger: Logger instance passed through to the agents
        progress_callback: Optional ``callback(percent, message)`` hook
        enable_indexing: Whether to enable code reference indexing for enhanced implementation

    Returns:
        str: Human-readable summary with the implementation status

    Raises:
        Exception: Any error raised by a phase is printed and re-raised.
    """
    try:
        print("🚀 Initializing chat-based planning and implementation pipeline")
        print("💬 Chat mode: Direct user requirements to code implementation")

        # Phase 0: Workspace Setup
        if progress_callback:
            progress_callback(5, "🔄 Setting up workspace for file processing...")

        # Setup local workspace directory
        workspace_dir = os.path.join(os.getcwd(), "deepcode_lab")
        os.makedirs(workspace_dir, exist_ok=True)

        print("📁 Working environment: local")
        print(f"📂 Workspace directory: {workspace_dir}")
        print("✅ Workspace status: ready")

        # Phase 1: Chat-Based Planning
        if progress_callback:
            progress_callback(
                30,
                "💬 Generating comprehensive implementation plan from user requirements...",
            )

        print("🧠 Running chat-based planning agent...")
        planning_result = await run_chat_planning_agent(user_input, logger)

        # Phase 2: Workspace Infrastructure Synthesis
        if progress_callback:
            progress_callback(
                50, "🏗️ Synthesizing intelligent workspace infrastructure..."
            )

        # Chat mode has no paper, so build a directory structure that mimics
        # a paper workspace around a synthetic markdown document.
        import time

        # Second-resolution timestamp used as the unique project suffix
        timestamp = str(int(time.time()))
        paper_name = f"chat_project_{timestamp}"

        chat_paper_dir = os.path.join(workspace_dir, "papers", paper_name)
        os.makedirs(chat_paper_dir, exist_ok=True)

        # Create a synthetic markdown file with user requirements
        markdown_content = f"""# User Coding Requirements

## Project Description
This is a coding project generated from user requirements via chat interface.

## User Requirements
{user_input}

## Generated Implementation Plan
The following implementation plan was generated by the AI chat planning agent:

```yaml
{planning_result}
```

## Project Metadata
- **Input Type**: Chat Input
- **Generation Method**: AI Chat Planning Agent
- **Timestamp**: {timestamp}
"""

        # Save the markdown file
        markdown_file_path = os.path.join(chat_paper_dir, f"{paper_name}.md")
        with open(markdown_file_path, "w", encoding="utf-8") as f:
            f.write(markdown_content)

        print(f"💾 Created chat project workspace: {chat_paper_dir}")
        print(f"📄 Saved requirements to: {markdown_file_path}")

        # Download-result JSON in the shape the workspace synthesis agent is
        # given elsewhere in this module (status / paper_path / paper_info).
        synthetic_download_result = json.dumps(
            {
                "status": "success",
                "paper_path": markdown_file_path,
                "input_type": "chat_input",
                "paper_info": {
                    "title": "User-Provided Coding Requirements",
                    "source": "chat_input",
                    "description": "Implementation plan generated from user requirements",
                },
            }
        )

        dir_info = await synthesize_workspace_infrastructure_agent(
            synthetic_download_result, logger, workspace_dir
        )
        await asyncio.sleep(10)  # Pause for file system operations

        # Phase 3: Save Planning Result
        if progress_callback:
            progress_callback(70, "📝 Saving implementation plan...")

        # The implementation workflow reads the plan from initial_plan_path
        initial_plan_path = dir_info["initial_plan_path"]
        with open(initial_plan_path, "w", encoding="utf-8") as f:
            f.write(planning_result)
        print(f"💾 Implementation plan saved to {initial_plan_path}")

        # Phase 4: Code Implementation Synthesis
        if progress_callback:
            progress_callback(85, "🔬 Synthesizing intelligent code implementation...")

        implementation_result = await synthesize_code_implementation_agent(
            dir_info, logger, progress_callback, enable_indexing
        )

        # Final Status Report
        pipeline_summary = f"Chat-based planning and implementation pipeline completed for {dir_info['paper_dir']}"

        # Add implementation status to summary. ``message`` is read with
        # .get() because a failed workflow result may not carry one; a
        # KeyError here would replace the real failure with "'message'".
        if implementation_result["status"] == "success":
            pipeline_summary += "\n🎉 Code implementation completed successfully!"
            pipeline_summary += (
                f"\n📁 Code generated in: {implementation_result['code_directory']}"
            )
            pipeline_summary += (
                "\n💬 Generated from user requirements via chat interface"
            )
        elif implementation_result["status"] == "warning":
            pipeline_summary += f"\n⚠️ Code implementation: {implementation_result.get('message', 'Unknown warning')}"
        else:
            pipeline_summary += f"\n❌ Code implementation failed: {implementation_result.get('message', 'Unknown error')}"

        return pipeline_summary

    except Exception as e:
        print(f"Error in execute_chat_based_planning_pipeline: {e}")
        # Bare raise re-raises the active exception unchanged.
        raise


================================================
FILE: workflows/agents/__init__.py
================================================
"""
Agents Package for Code Implementation Workflow

This package contains specialized agents for different aspects of code implementation:
- CodeImplementationAgent: Handles file-by-file code generation
- ConciseMemoryAgent: Manages memory optimization and consistency across phases
"""

from .code_implementation_agent import CodeImplementationAgent
from .memory_agent_concise import ConciseMemoryAgent as MemoryAgent

__all__ = ["CodeImplementationAgent", "MemoryAgent"]


================================================
FILE: workflows/agents/code_implementation_agent.py
================================================
"""
Code Implementation Agent for File-by-File Development

Handles systematic code implementation with progress tracking and
memory optimization for long-running development sessions.
"""

import json
import time
import logging
from typing import Dict, Any, List, Optional

# Import tiktoken for token calculation
try:
    import tiktoken

    TIKTOKEN_AVAILABLE = True
except ImportError:
    TIKTOKEN_AVAILABLE = False

# Import prompts from code_prompts
import sys
import os

sys.path.insert(
    0, os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
)
from prompts.code_prompts import (
    GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT,
)


class CodeImplementationAgent:
    """
    Code Implementation Agent for systematic file-by-file development

    Responsibilities:
    - Track file implementation progress
    - Execute MCP tool calls for code generation
    - Monitor implementation status
    - Coordinate with Summary Agent for memory optimization
    - Calculate token usage for context management
    """

    def __init__(
        self,
        mcp_agent,
        logger: Optional[logging.Logger] = None,
        enable_read_tools: bool = True,
    ):
        """
        Build a Code Implementation Agent with empty progress tracking.

        Args:
            mcp_agent: MCP agent instance that tool calls are dispatched through
            logger: Logger used for progress messages; a default logger is
                created when none is supplied
            enable_read_tools: When False, read_file and read_code_mem calls are
                answered with a "skipped" result instead of being executed
                (default: True)
        """
        # Collaborators and configuration
        self.mcp_agent = mcp_agent
        self.logger = logger or self._create_default_logger()
        self.enable_read_tools = enable_read_tools

        # Progress bookkeeping: one independent list per summary section
        self.implementation_summary = {
            section: []
            for section in (
                "completed_files",
                "technical_decisions",
                "important_constraints",
                "architecture_notes",
                "dependency_analysis",  # dependency analysis and file reads
            )
        }
        self.files_implemented_count = 0
        # Unique written paths, so repeated writes are not counted twice
        self.implemented_files_set = set()
        # Unique paths read while analysing dependencies
        self.files_read_for_dependencies = set()
        # File count recorded the last time a summary was triggered
        self.last_summary_file_count = 0

        # Token budget (default context size chosen for Claude-3.5-Sonnet)
        self.max_context_tokens = 200000
        self.token_buffer = 10000  # safety margin kept below the maximum
        self.summary_trigger_tokens = self.max_context_tokens - self.token_buffer
        # Token count recorded the last time a summary was triggered
        self.last_summary_token_count = 0

        # Tokenizer: o200k_base is used as an approximation of the Claude tokenizer
        self.tokenizer = None
        if not TIKTOKEN_AVAILABLE:
            self.logger.warning(
                "tiktoken not available, token-based summary triggering disabled"
            )
        else:
            try:
                self.tokenizer = tiktoken.get_encoding("o200k_base")
                self.logger.info("Token calculation enabled with o200k_base encoding")
            except Exception as e:
                self.tokenizer = None
                self.logger.warning(f"Failed to initialize tokenizer: {e}")

        # Analysis loop detection
        self.recent_tool_calls = []  # sliding window of recent tool names
        self.max_read_without_write = 5  # max read_file calls without write_file

        # Memory agent integration; all three are assigned later by the caller
        self.memory_agent = None
        self.llm_client = None
        self.llm_client_type = None

        # Report the read tools configuration
        read_tools_status = "DISABLED" if not self.enable_read_tools else "ENABLED"
        self.logger.info(
            f"🔧 Code Implementation Agent initialized - Read tools: {read_tools_status}"
        )
        if not self.enable_read_tools:
            self.logger.info(
                "🚫 Testing mode: read_file and read_code_mem will be skipped when called"
            )

    def _create_default_logger(self) -> logging.Logger:
        """Create default logger if none provided"""
        logger = logging.getLogger(f"{__name__}.CodeImplementationAgent")
        # Don't add handlers to child loggers - let them propagate to root
        logger.setLevel(logging.INFO)
        return logger

    def get_system_prompt(self) -> str:
        """
        Return the system prompt used for code implementation.

        Returns:
            The GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT constant imported
            from prompts.code_prompts
        """
        system_prompt = GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT
        return system_prompt

    def set_memory_agent(self, memory_agent, llm_client=None, llm_client_type=None):
        """
        Set memory agent for code summary generation

        Args:
            memory_agent: Memory agent instance
            llm_client: LLM client for summary generation
            llm_client_type: Type of LLM client ("anthropic" or "openai")
        """
        self.memory_agent = memory_agent
        self.llm_client = llm_client
        self.llm_client_type = llm_client_type
        self.logger.info("Memory agent integration configured")

    async def execute_tool_calls(self, tool_calls: List[Dict]) -> List[Dict]:
        """
        Execute MCP tool calls and track implementation progress

        Args:
            tool_calls: List of tool calls to execute

        Returns:
            List of tool execution results
        """
        results = []

        for tool_call in tool_calls:
            tool_name = tool_call["name"]
            tool_input = tool_call["input"]

            self.logger.info(f"Executing MCP tool: {tool_name}")

            try:
                # Check if read tools are disabled
                if not self.enable_read_tools and tool_name in [
                    "read_file",
                    "read_code_mem",
                ]:
                    # self.logger.info(f"🚫 SKIPPING {tool_name} - Read tools disabled for testing")
                    # Return a mock result indicating the tool was skipped
                    mock_result = json.dumps(
                        {
                            "status": "skipped",
                            "message": f"{tool_name} tool disabled for testing",
                            "tool_disabled": True,
                            "original_input": tool_input,
                        },
                        ensure_ascii=False,
                    )

                    results.append(
                        {
                            "tool_id": tool_call["id"],
                            "tool_name": tool_name,
                            "result": mock_result,
                        }
                    )
                    continue

                # read_code_mem is now a proper MCP tool, no special handling needed

                # INTERCEPT read_file calls - redirect to read_code_mem first if memory agent is available
                if tool_name == "read_file":
                    file_path = tool_call["input"].get("file_path", "unknown")
                    self.logger.info(f"🔍 READ_FILE CALL DETECTED: {file_path}")
                    self.logger.info(
                        f"📊 Files implemented count: {self.files_implemented_count}"
                    )
                    self.logger.info(
                        f"🧠 Memory agent available: {self.memory_agent is not None}"
                    )

                    # Enable optimization if memory agent is available (more aggressive approach)
                    if self.memory_agent is not None:
                        self.logger.info(
                            f"🔄 INTERCEPTING read_file call for {file_path} (memory agent available)"
                        )
                        result = await self._handle_read_file_with_memory_optimization(
                            tool_call
                        )
                        results.append(result)
                        continue
                    else:
                        self.logger.info(
                            "📁 NO INTERCEPTION: no memory agent available"
                        )

                if self.mcp_agent:
                    # Execute tool call through MCP protocol
                    result = await self.mcp_agent.call_tool(tool_name, tool_input)

                    # Track file implementation progress
                    if tool_name == "write_file":
                        await self._track_file_implementation_with_summary(
                            tool_call, result
                        )
                    elif tool_name == "read_file":
                        self._track_dependency_analysis(tool_call, result)

                    # Track tool calls for analysis loop detection
                    self._track_tool_call_for_loop_detection(tool_name)

                    results.append(
                        {
                            "tool_id": tool_call["id"],
                            "tool_name": tool_name,
                            "result": result,
                        }
                    )
                else:
                    results.append(
                        {
                            "tool_id": tool_call["id"],
                            "tool_name": tool_name,
                            "result": json.dumps(
                                {
                                    "status": "error",
                                    "message": "MCP agent not initialized",
                                },
                                ensure_ascii=False,
                            ),
                        }
                    )

            except Exception as e:
                self.logger.error(f"MCP tool execution failed: {e}")
                results.append(
                    {
                        "tool_id": tool_call["id"],
                        "tool_name": tool_name,
                        "result": json.dumps(
                            {"status": "error", "message": str(e)}, ensure_ascii=False
                        ),
                    }
                )

        return results

    # _handle_read_code_mem method removed - read_code_mem is now a proper MCP tool

    async def _handle_read_file_with_memory_optimization(self, tool_call: Dict) -> Dict:
        """
        Intercept read_file calls and redirect to read_code_mem if a summary exists.
        This prevents unnecessary file reads if the summary is already available.
        """
        file_path = tool_call["input"].get("file_path")
        if not file_path:
            return {
                "tool_id": tool_call["id"],
                "tool_name": "read_file",
                "result": json.dumps(
                    {"status": "error", "message": "file_path parameter is required"},
                    ensure_ascii=False,
                ),
            }

        # Check if a summary exists for this file using read_code_mem MCP tool
        should_use_summary = False
        if self.memory_agent and self.mcp_agent:
            try:
                # Use read_code_mem MCP tool to check if summary exists (pass file path as list)
                read_code_mem_result = await self.mcp_agent.call_tool(
                    "read_code_mem", {"file_paths": [file_path]}
                )

                # Parse the result to check if summary was found
                import json

                if isinstance(read_code_mem_result, str):
                    try:
                        result_data = json.loads(read_code_mem_result)
                        # Check if any summaries were found in the results
                        should_use_summary = (
                            result_data.get("status")
                            in ["all_summaries_found", "partial_summaries_found"]
                            and result_data.get("summaries_found", 0) > 0
                        )
                    except json.JSONDecodeError:
                        should_use_summary = False
            except Exception as e:
                self.logger.debug(f"read_code_mem check failed for {file_path}: {e}")
                should_use_summary = False

        if should_use_summary:
            self.logger.info(f"🔄 READ_FILE INTERCEPTED: Using summary for {file_path}")

            # Use the MCP agent to call read_code_mem tool
            if self.mcp_agent:
                result = await self.mcp_agent.call_tool(
                    "read_code_mem", {"file_paths": [file_path]}
                )

                # Modify the result to indicate it was originally a read_file call
                import json

                try:
                    result_data = (
                        json.loads(result) if isinstance(result, str) else result
                    )
                    if isinstance(result_data, dict):
                        # Extract the specific file result for the single file we requested
                        file_results = result_data.get("results", [])
                        if file_results and len(file_results) > 0:
                            specific_result = file_results[
                                0
                            ]  # Get the first (and only) result
                            # Transform to match the old single-file format for backward compatibility
                            transformed_result = {
                                "status": specific_result.get("status", "no_summary"),
                                "file_path": specific_result.get(
                                    "file_path", file_path
                                ),
                                "summary_content": specific_result.get(
                                    "summary_content"
                                ),
                                "message": specific_result.get("message", ""),
                                "original_tool": "read_file",
                                "optimization": "redirected_to_read_code_mem",
                            }
                            final_result = json.dumps(
                                transformed_result, ensure_ascii=False
                            )
                        else:
                            # Fallback if no results
                            result_data["original_tool"] = "read_file"
                            result_data["optimization"] = "redirected_to_read_code_mem"
                            final_result = json.dumps(result_data, ensure_ascii=False)
                    else:
                        final_result = result
                except (json.JSONDecodeError, TypeError):
                    final_result = result

                return {
                    "tool_id": tool_call["id"],
                    "tool_name": "read_file",  # Keep original tool name for tracking
                    "result": final_result,
                }
            else:
                self.logger.warning(
                    "MCP agent not available for read_code_mem optimization"
                )
        else:
            self.logger.info(
                f"📁 READ_FILE: No summary for {file_path}, using actual file"
            )

            # Execute the original read_file call
            if self.mcp_agent:
                result = await self.mcp_agent.call_tool("read_file", tool_call["input"])

                # Track dependency analysis for the actual file read
                self._track_dependency_analysis(tool_call, result)

                # Track tool calls for analysis loop detection
                self._track_tool_call_for_loop_detection("read_file")

                return {
                    "tool_id": tool_call["id"],
                    "tool_name": "read_file",
                    "result": result,
                }
            else:
                return {
                    "tool_id": tool_call["id"],
                    "tool_name": "read_file",
                    "result": json.dumps(
                        {"status": "error", "message": "MCP agent not initialized"},
                        ensure_ascii=False,
                    ),
                }

    async def _track_file_implementation_with_summary(
        self, tool_call: Dict, result: Any
    ):
        """
        Track file implementation and create code summary

        Args:
            tool_call: The write_file tool call
            result: Result of the tool execution
        """
        # First do the regular tracking
        self._track_file_implementation(tool_call, result)

        # Then create and save code summary if memory agent is available
        if self.memory_agent and self.llm_client and self.llm_client_type:
            try:
                file_path = tool_call["input"].get("file_path")
                file_content = tool_call["input"].get("content", "")

                if file_path and file_content:
                    # Create code implementation summary
                    summary = await self.memory_agent.create_code_implementation_summary(
                        self.llm_client,
                        self.llm_client_type,
                        file_path,
                        file_content,
                        self.get_files_implemented_count(),  # Pass the current file count
                    )

                    self.logger.info(
                        f"Created code summary for implemented file: {file_path}, summary: {summary[:100]}..."
                    )
                else:
                    self.logger.warning(
                        "Missing file path or content for summary generation"
                    )

            except Exception as e:
                self.logger.error(f"Failed to create code summary: {e}")

    def _track_file_implementation(self, tool_call: Dict, result: Any):
        """
        Track file implementation progress
        """
        try:
            # Handle different result types from MCP
            result_data = None

            # Check if result is a CallToolResult object
            if hasattr(result, "content"):
                # Extract content from CallToolResult
                if hasattr(result.content, "text"):
                    result_content = result.content.text
                else:
                    result_content = str(result.content)

                # Try to parse as JSON
                try:
                    result_data = json.loads(result_content)
                except json.JSONDecodeError:
                    # If not JSON, create a structure
                    result_data = {
                        "status": "success",
                        "file_path": tool_call["input"].get("file_path", "unknown"),
                    }
            elif isinstance(result, str):
                # Try to parse string result
                try:
                    result_data = json.loads(result)
                except json.JSONDecodeError:
                    result_data = {
                        "status": "success",
                        "file_path": tool_call["input"].get("file_path", "unknown"),
                    }
            elif isinstance(result, dict):
                # Direct dictionary result
                result_data = result
            else:
                # Fallback: assume success and extract file path from input
                result_data = {
                    "status": "success",
                    "file_path": tool_call["input"].get("file_path", "unknown"),
                }

            # Extract file path for tracking
            file_path = None
            if result_data and result_data.get("status") == "success":
                file_path = result_data.get(
                    "file_path", tool_call["input"].get("file_path", "unknown")
                )
            else:
                file_path = tool_call["input"].get("file_path")

            # Only count unique files, not repeated tool calls on same file
            if file_path and file_path not in self.implemented_files_set:
                # This is a new file implementation
                self.implemented_files_set.add(file_path)
                self.files_implemented_count += 1
                # self.logger.info(f"New file implementation tracked: count={self.files_implemented_count}, file={file_path}")
                # print(f"New file implementation tracked: count={self.files_implemented_count}, file={file_path}")

                # Add to completed files list
                self.implementation_summary["completed_files"].append(
                    {
                        "file": file_path,
                        "iteration": self.files_implemented_count,
                        "timestamp": time.time(),
                        "size": result_data.get("size", 0) if result_data else 0,
                    }
                )

                # self.logger.info(
                #     f"New file implementation tracked: count={self.files_implemented_count}, file={file_path}"
                # )
                # print(f"📝 NEW FILE IMPLEMENTED: count={self.files_implemented_count}, file={file_path}")
                # print(f"🔧 OPTIMIZATION NOW ENABLED: files_implemented_count > 0 = {self.files_implemented_count > 0}")
            elif file_path and file_path in self.implemented_files_set:
                # This file was already implemented (duplicate tool call)
                self.logger.debug(
                    f"File already tracked, skipping duplicate count: {file_path}"
                )
            else:
                # No valid file path found
                self.logger.warning("No valid file path found for tracking")

        except Exception as e:
            self.logger.warning(f"Failed to track file implementation: {e}")
            # Even if tracking fails, try to count based on tool input (but check for duplicates)

            file_path = tool_call["input"].get("file_path")
            if file_path and file_path not in self.implemented_files_set:
                self.implemented_files_set.add(file_path)
                self.files_implemented_count += 1
                self.logger.info(
                    f"File implementation counted (emergency fallback): count={self.files_implemented_count}, file={file_path}"
                )

    def _track_dependency_analysis(self, tool_call: Dict, result: Any):
        """
        Track dependency analysis through read_file calls
        """
        try:
            file_path = tool_call["input"].get("file_path")
            if file_path:
                # Track unique files read for dependency analysis
                if file_path not in self.files_read_for_dependencies:
                    self.files_read_for_dependencies.add(file_path)

                    # Add to dependency analysis summary
                    self.implementation_summary["dependency_analysis"].append(
                        {
                            "file_read": file_path,
                            "timestamp": time.time(),
                            "purpose": "dependency_analysis",
                        }
                    )

                    self.logger.info(
                        f"Dependency analysis tracked: file_read={file_path}"
                    )

        except Exception as e:
            self.logger.warning(f"Failed to track dependency analysis: {e}")

    def calculate_messages_token_count(self, messages: List[Dict]) -> int:
        """
        Calculate total token count for a list of messages

        Args:
            messages: List of chat messages with 'role' and 'content' keys

        Returns:
            Total token count
        """
        if not self.tokenizer:
            # Fallback: rough estimation based on character count
            total_chars = sum(len(str(msg.get("content", ""))) for msg in messages)
            # Rough approximation: 1 token ≈ 4 characters
            return total_chars // 4

        try:
            total_tokens = 0
            for message in messages:
                content = str(message.get("content", ""))
                role = message.get("role", "")

                # Count tokens for content
                if content:
                    content_tokens = len(
                        self.tokenizer.encode(content, disallowed_special=())
                    )
                    total_tokens += content_tokens

                # Add tokens for role and message structure
                role_tokens = len(self.tokenizer.encode(role, disallowed_special=()))
                total_tokens += role_tokens + 4  # Extra tokens for message formatting

            return total_tokens

        except Exception as e:
            self.logger.warning(f"Token calculation failed: {e}")
            # Fallback estimation
            total_chars = sum(len(str(msg.get("content", ""))) for msg in messages)
            return total_chars // 4

    def should_trigger_summary_by_tokens(self, messages: List[Dict]) -> bool:
        """
        Check if summary should be triggered based on token count

        Args:
            messages: Current conversation messages

        Returns:
            True if summary should be triggered based on token count
        """
        if not messages:
            return False

        # Calculate current token count / 计算当前token数
        current_token_count = self.calculate_messages_token_count(messages)

        # Check if we should trigger summary / 检查是否应触发总结
        should_trigger = (
            current_token_count > self.summary_trigger_tokens
            and current_token_count
            > self.last_summary_token_count
            + 10000  # Minimum 10k tokens between summaries / 总结间最少10k tokens
        )

        if should_trigger:
            self.logger.info(
                f"Token-based summary trigger: current={current_token_count:,}, "
                f"threshold={self.summary_trigger_tokens:,}, "
                f"last_summary={self.last_summary_token_count:,}"
            )

        return should_trigger

    def should_trigger_summary(
        self, summary_trigger: int = 5, messages: List[Dict] = None
    ) -> bool:
        """
        Check if summary should be triggered based on token count (preferred) or file count (fallback)
        根据token数（首选）或文件数（回退）检查是否应触发总结

        Args:
            summary_trigger: Number of files after which to trigger summary (fallback)
            messages: Current conversation messages for token calculation

        Returns:
            True if summary should be triggered
        """
        # Primary: Token-based triggering / 主要：基于token的触发
        if messages and self.tokenizer:
            return self.should_trigger_summary_by_tokens(messages)

        # Fallback: File-based triggering (original logic) / 回退：基于文件的触发（原始逻辑）
        self.logger.info("Using fallback file-based summary triggering")
        should_trigger = (
            self.files_implemented_count > 0
            and self.files_implemented_count % summary_trigger == 0
            and self.files_implemented_count > self.last_summary_file_count
        )

        return should_trigger

    def mark_summary_triggered(self, messages: List[Dict] = None):
        """
        Mark that summary has been triggered for current state
        标记当前状态的总结已被触发

        Args:
            messages: Current conversation messages for token tracking
        """
        # Update file-based tracking / 更新基于文件的跟踪
        self.last_summary_file_count = self.files_implemented_count

        # Update token-based tracking / 更新基于token的跟踪
        if messages and self.tokenizer:
            self.last_summary_token_count = self.calculate_messages_token_count(
                messages
            )
            self.logger.info(
                f"Summary marked as triggered - file_count: {self.files_implemented_count}, "
                f"token_count: {self.last_summary_token_count:,}"
            )
        else:
            self.logger.info(
                f"Summary marked as triggered for file count: {self.files_implemented_count}"
            )

    def get_implementation_summary(self) -> Dict[str, Any]:
        """
        Get current implementation summary
        获取当前实现总结
        """
        return self.implementation_summary.copy()

    def get_files_implemented_count(self) -> int:
        """
        Get the number of files implemented so far
        获取到目前为止实现的文件数量
        """
        return self.files_implemented_count

    def get_read_tools_status(self) -> Dict[str, Any]:
        """
        Get read tools configuration status
        获取读取工具配置状态

        Returns:
            Dictionary with read tools status information
        """
        return {
            "read_tools_enabled": self.enable_read_tools,
            "status": "ENABLED" if self.enable_read_tools else "DISABLED",
            "tools_affected": ["read_file", "read_code_mem"],
            "description": "Read tools configuration for testing purposes",
        }

    def add_technical_decision(self, decision: str, context: str = ""):
        """
        Add a technical decision to the implementation summary
        向实现总结添加技术决策

        Args:
            decision: Description of the technical decision
            context: Additional context for the decision
        """
        self.implementation_summary["technical_decisions"].append(
            {"decision": decision, "context": context, "timestamp": time.time()}
        )
        self.logger.info(f"Technical decision recorded: {decision}")

    def add_constraint(self, constraint: str, impact: str = ""):
        """
        Add an important constraint to the implementation summary
        向实现总结添加重要约束

        Args:
            constraint: Description of the constraint
            impact: Impact of the constraint on implementation
        """
        self.implementation_summary["important_constraints"].append(
            {"constraint": constraint, "impact": impact, "timestamp": time.time()}
        )
        self.logger.info(f"Constraint recorded: {constraint}")

    def add_architecture_note(self, note: str, component: str = ""):
        """
        Add an architecture note to the implementation summary
        向实现总结添加架构注释

        Args:
            note: Architecture note description
            component: Related component or module
        """
        self.implementation_summary["architecture_notes"].append(
            {"note": note, "component": component, "timestamp": time.time()}
        )
        self.logger.info(f"Architecture note recorded: {note}")

    def get_implementation_statistics(self) -> Dict[str, Any]:
        """
        Get comprehensive implementation statistics
        获取全面的实现统计信息
        """
        return {
            "total_files_implemented": self.files_implemented_count,
            "files_implemented_count": self.files_implemented_count,
            "technical_decisions_count": len(
                self.implementation_summary["technical_decisions"]
            ),
            "constraints_count": len(
                self.implementation_summary["important_constraints"]
            ),
            "architecture_notes_count": len(
                self.implementation_summary["architecture_notes"]
            ),
            "dependency_analysis_count": len(
                self.implementation_summary["dependency_analysis"]
            ),
            "files_read_for_dependencies": len(self.files_read_for_dependencies),
            "unique_files_implemented": len(self.implemented_files_set),
            "completed_files_list": [
                f["file"] for f in self.implementation_summary["completed_files"]
            ],
            "dependency_files_read": list(self.files_read_for_dependencies),
            "last_summary_file_count": self.last_summary_file_count,
            "read_tools_status": self.get_read_tools_status(),  # Include read tools configuration
        }

    def force_enable_optimization(self):
        """
        Force enable optimization for testing purposes.

        Sets files_implemented_count to 1 and reports the new value through
        the logger and on stdout.
        """
        self.files_implemented_count = 1
        # Same text goes to the log and to stdout.
        notice = (
            "🔧 OPTIMIZATION FORCE ENABLED: files_implemented_count set to "
            f"{self.files_implemented_count}"
        )
        self.logger.info(notice)
        print(notice)

    def reset_implementation_tracking(self):
        """
        Reset implementation tracking (useful for new sessions).

        Empties every implementation_summary section, zeroes the file and
        token counters, clears the implemented/dependency file sets and the
        recent tool-call window used for analysis loop detection.
        """
        summary_sections = (
            "completed_files",
            "technical_decisions",
            "important_constraints",
            "architecture_notes",
            "dependency_analysis",
        )
        # Each section gets its own fresh list.
        self.implementation_summary = {section: [] for section in summary_sections}

        # Counters: implemented files, and the file/token counts recorded
        # when the last summary was triggered.
        self.files_implemented_count = 0
        self.last_summary_file_count = 0
        self.last_summary_token_count = 0

        # Unique implemented files and files read for dependency analysis.
        self.implemented_files_set = set()
        self.files_read_for_dependencies = set()
        self.logger.info("Implementation tracking reset")

        # Reset analysis loop detection
        self.recent_tool_calls = []
        self.logger.info("Analysis loop detection reset")

    def _track_tool_call_for_loop_detection(self, tool_name: str):
        """
        Track tool calls for analysis loop detection.

        Appends the tool name to recent_tool_calls and trims the list so it
        holds at most max_read_without_write entries. A warning is logged only
        when that window is full and consists of a single read-only analysis
        tool repeated. Previously the warning fired whenever the window held
        one distinct tool, which includes the very first tracked call and
        runs of write_file calls.

        Args:
            tool_name: Name of the tool called
        """
        # Same read-only tool names that is_in_analysis_loop() treats as analysis.
        analysis_tools = (
            "read_file",
            "search_reference_code",
            "get_all_available_references",
        )

        window = self.recent_tool_calls
        window.append(tool_name)
        if len(window) > self.max_read_without_write:
            # Drop the oldest entry to keep the sliding window bounded.
            window.pop(0)

        window_full = len(window) >= self.max_read_without_write
        same_tool_repeated = len(set(window)) == 1
        if window_full and same_tool_repeated and tool_name in analysis_tools:
            self.logger.warning("Analysis loop detected")

    def is_in_analysis_loop(self) -> bool:
        """
        Check if the agent is in an analysis loop (only reading files, not writing).

        The answer is False until recent_tool_calls holds at least
        max_read_without_write entries. After that it is True when the window
        is non-empty and every entry is one of the read/search tools listed
        below; a warning with the recent calls is logged in that case.

        Returns:
            True if in analysis loop
        """
        history = self.recent_tool_calls
        if len(history) < self.max_read_without_write:
            return False

        # Tools that only read or search and never write code.
        read_only_tools = frozenset(
            ("read_file", "search_reference_code", "get_all_available_references")
        )
        distinct_calls = set(history)

        # Non-empty window made up exclusively of analysis tools.
        stuck = len(distinct_calls) >= 1 and distinct_calls <= read_only_tools
        if not stuck:
            return stuck

        self.logger.warning(f"Analysis loop detected! Recent calls: {history}")
        return stuck

    def get_analysis_loop_guidance(self) -> str:
        """
        Get guidance to break out of analysis loop.

        The message reports how many calls are in recent_tool_calls, lists
        them in order, and states the current files_implemented_count.

        Returns:
            Guidance message to encourage implementation
        """
        call_window = self.recent_tool_calls
        call_count = len(call_window)
        call_chain = " → ".join(call_window)
        files_done = self.files_implemented_count

        # One entry per output line; empty strings are the blank separator lines.
        guidance_lines = [
            "🚨 **ANALYSIS LOOP DETECTED - IMMEDIATE ACTION REQUIRED**",
            "",
            f"**Problem**: You've been reading/analyzing files for {call_count} consecutive calls without writing code.",
            f"**Recent tool calls**: {call_chain}",
            "",
            "**SOLUTION - IMPLEMENT CODE NOW**:",
            "1. **STOP ANALYZING** - You have enough information",
            "2. **Use write_file** to create the next code file according to the implementation plan",
            "3. **Choose ANY file** from the plan that hasn't been implemented yet",
            "4. **Write complete, working code** - don't ask for permission or clarification",
            "",
            f"**Files implemented so far**: {files_done}",
            "**Your goal**: Implement MORE files, not analyze existing ones!",
            "",
            "**CRITICAL**: Your next response MUST use write_file to create a new code file!",
        ]
        return "\n".join(guidance_lines)

    async def test_summary_functionality(self, test_file_path: str = None):
        """
        Test if the code summary functionality is working correctly
        测试代码总结功能是否正常工作

        Args:
            test_file_path: Specific file to test, if None will test all implemented files
        """
        if not self.memory_agent:
            self.logger.warning("No memory agent available for testing")
            return

        if test_file_path:
            files_to_test = [test_file_path]
        else:
            # Use implemented files from tracking
            files_to_test = list(self.implemented_files_set)[
                :3
            ]  # Limit to first 3 files

        if not files_to_test:
            self.logger.warning("No implemented files to test")
            return

        # Test each file silently
        summary_files_found = 0

        for file_path in files_to_test:
            if self.mcp_agent:
                try:
                    result = await self.mcp_agent.call_tool(
                        "read_code_mem", {"file_paths": [file_path]}
                    )

                    # Parse the result to check if summary was found
                    import json

                    result_data = (
                        json.loads(result) if isinstance(result, str) else result
                    )

                    if (
                        result_data.get("status")
                        in ["all_summaries_found", "partial_summaries_found"]
                        and result_data.get("summaries_found", 0) > 0
                    ):
                        summary_files_found += 1
                except Exception as e:
                    self.logger.warning(
                        f"Failed to test read_code_mem for {file_path}: {e}"
                    )
            else:
                self.logger.warning("MCP agent not available for testing")

        self.logger.info(
            f"📋 Summary testing: {summary_files_found}/{len(files_to_test)} files have summaries"
        )

    async def test_automatic_read_file_optimization(self):
        """
        Test the automatic read_file optimization that redirects to read_code_mem.

        Sets files_implemented_count to 1, runs a simulated read_file call for
        "config.py" through execute_tool_calls, and prints whether the first
        result reports a redirect to read_code_mem or a found summary.
        """
        import json

        rule = "=" * 80
        print(rule)
        print("🔄 TESTING AUTOMATIC READ_FILE OPTIMIZATION")
        print(rule)

        # Simulate that at least one file has been implemented (to trigger optimization)
        self.files_implemented_count = 1

        # Generic config file that should have a summary
        target_file = "config.py"
        optimization_state = (
            "ENABLED" if self.files_implemented_count > 0 else "DISABLED"
        )

        print(f"📁 Testing automatic optimization for: {target_file}")
        print(f"📊 Files implemented count: {self.files_implemented_count}")
        print(f"🔧 Optimization should be: {optimization_state}")

        # Simulated read_file tool call
        fake_call = {
            "id": "test_read_file_optimization",
            "name": "read_file",
            "input": {"file_path": target_file},
        }

        print("\n🔄 Simulating read_file call:")
        print(f"   Tool: {fake_call['name']}")
        print(f"   File: {fake_call['input']['file_path']}")

        # Executing the call is what should trigger the automatic optimization
        outcomes = await self.execute_tool_calls([fake_call])

        if not outcomes:
            print("❌ ERROR: No results returned from tool execution")
        else:
            first = outcomes[0]
            print("\n✅ Tool execution completed:")
            print(f"   Tool name: {first.get('tool_name', 'N/A')}")
            print(f"   Tool ID: {first.get('tool_id', 'N/A')}")

            # Inspect the JSON payload to see whether the call was redirected
            try:
                parsed = json.loads(first.get("result", "{}"))
                redirected = (
                    parsed.get("optimization") == "redirected_to_read_code_mem"
                )
                if redirected:
                    print("🎉 SUCCESS: read_file was automatically optimized!")
                    print(f"   Original tool: {parsed.get('original_tool', 'N/A')}")
                    print(f"   Status: {parsed.get('status', 'N/A')}")
                elif parsed.get("status") == "summary_found":
                    print("🎉 SUCCESS: Summary was found and returned!")
                else:
                    print("ℹ️  INFO: No optimization occurred (no summary available)")
            except json.JSONDecodeError:
                print("⚠️  WARNING: Could not parse result as JSON")

        print("\n" + rule)
        print("🔄 AUTOMATIC READ_FILE OPTIMIZATION TEST COMPLETE")
        print(rule)

    async def test_summary_optimization(self, test_file_path: str = "config.py"):
        """
        Test the summary optimization functionality with a specific file
        测试特定文件的总结优化功能

        Args:
            test_file_path: File path to test (default: config.py which should be in summary)
        """
        if not self.mcp_agent:
            return False

        try:
            # Use MCP agent to call read_code_mem tool
            result = await self.mcp_agent.call_tool(
                "read_code_mem", {"file_paths": [test_file_path]}
            )

            # Parse the result to check if summary was found
            import json

            result_data = json.loads(result) if isinstance(result, str) else result

            return (
                result_data.get("status")
                in ["all_summaries_found", "partial_summaries_found"]
                and result_data.get("summaries_found", 0) > 0
            )
        except Exception as e:
            self.logger.warning(f"Failed to test read_code_mem optimization: {e}")
            return False

    async def test_read_tools_configuration(self):
        """
        Test the read tools configuration to verify enabling/disabling works correctly.

        Prints the current read-tools status and, for three mock tool calls,
        whether each would be executed or skipped given enable_read_tools.
        No tool is actually executed.

        Returns:
            The dict obtained from get_read_tools_status().
        """
        rule = "=" * 60
        # Tools that are skipped when read tools are disabled.
        gated_tools = ("read_file", "read_code_mem")

        print(rule)
        print("🧪 TESTING READ TOOLS CONFIGURATION")
        print(rule)

        status = self.get_read_tools_status()
        status_fields = (
            ("Read tools enabled", "read_tools_enabled"),
            ("Status", "status"),
            ("Tools affected", "tools_affected"),
        )
        for label, key in status_fields:
            print(f"{label}: {status[key]}")

        # Mock tool calls; only their names are inspected below.
        mock_calls = [
            {
                "id": "test_read_file",
                "name": "read_file",
                "input": {"file_path": "test.py"},
            },
            {
                "id": "test_read_code_mem",
                "name": "read_code_mem",
                "input": {"file_path": "test.py"},
            },
            {
                "id": "test_write_file",
                "name": "write_file",
                "input": {"file_path": "test.py", "content": "# test"},
            },
        ]

        print(
            f"\n🔄 Testing tool execution with read_tools_enabled={self.enable_read_tools}"
        )

        for mock_call in mock_calls:
            name = mock_call["name"]
            skipped = not self.enable_read_tools and name in gated_tools
            if skipped:
                print(f"🚫 {name}: Would be SKIPPED (disabled)")
            else:
                print(f"✅ {name}: Would be EXECUTED")

        print(rule)
        print("🧪 READ TOOLS CONFIGURATION TEST COMPLETE")
        print(rule)

        return status


================================================
FILE: workflows/agents/document_segmentation_agent.py
================================================
"""
Document Segmentation Agent

A lightweight agent that coordinates with the document segmentation MCP server
to analyze document structure and prepare segments for other agents.
"""

import os
import logging
from typing import Dict, Any, Optional

from mcp_agent.agents.agent import Agent
from utils.llm_utils import get_preferred_llm_class


class DocumentSegmentationAgent:
    """
    Coordinator that drives document segmentation through an LLM.

    The agent creates an MCP ``Agent`` bound to the ``document-segmentation``
    server, attaches the preferred LLM to it, and sends that LLM prompts that
    ask it to use the server's tools (``analyze_and_segment_document``,
    ``get_document_overview``) and to assess the resulting segmentation.

    Lifecycle:
        Use it as an async context manager, or call ``initialize()`` and
        ``cleanup()`` explicitly. Until ``initialize()`` has succeeded,
        ``mcp_agent`` and ``llm`` are ``None`` and the analysis methods return
        an error payload instead of a result.

    All public analysis methods report failures as a dict with
    ``"status": "error"`` and an ``"error_message"`` rather than raising.
    """

    def __init__(self, logger: Optional[logging.Logger] = None):
        """
        Args:
            logger: Logger to use; a default INFO-level logger is created
                when omitted.
        """
        self.logger = logger or self._create_default_logger()
        self.mcp_agent = None
        # Set by initialize(); None means no LLM has been attached yet.
        self.llm = None

    def _create_default_logger(self) -> logging.Logger:
        """Create default logger if none provided"""
        logger = logging.getLogger(f"{__name__}.DocumentSegmentationAgent")
        logger.setLevel(logging.INFO)
        return logger

    async def __aenter__(self):
        """Async context manager entry"""
        await self.initialize()
        return self

    async def __aexit__(self, exc_type, exc_val, exc_tb):
        """Async context manager exit"""
        await self.cleanup()

    def _require_llm(self):
        """Return the attached LLM or raise RuntimeError if not initialized."""
        llm = getattr(self, "llm", None)
        if llm is None:
            raise RuntimeError(
                "DocumentSegmentationAgent is not initialized; "
                "call initialize() or use 'async with' first"
            )
        return llm

    async def initialize(self):
        """
        Initialize the MCP agent connection and attach the LLM.

        Raises:
            Exception: Any error from creating the agent, entering its context
                or attaching the LLM is logged and re-raised. An agent context
                that was already entered is exited before re-raising.
        """
        try:
            agent = Agent(
                name="DocumentSegmentationCoordinator",
                instruction="""You are an intelligent document segmentation coordinator that leverages advanced semantic analysis for optimal document processing.

Your enhanced capabilities include:
1. **Semantic Content Analysis**: Coordinate intelligent document type classification based on content semantics rather than structural patterns
2. **Algorithm Integrity Protection**: Ensure algorithm blocks, formulas, and related content maintain logical coherence
3. **Adaptive Segmentation Strategy**: Select optimal segmentation approaches (semantic_research_focused, algorithm_preserve_integrity, concept_implementation_hybrid, etc.)
4. **Quality Intelligence Validation**: Assess segmentation quality using enhanced metrics for completeness, relevance, and technical accuracy
5. **Planning Agent Optimization**: Ensure segments are specifically optimized for ConceptAnalysisAgent, AlgorithmAnalysisAgent, and CodePlannerAgent needs

**Key Principles**:
- Prioritize content semantics over mechanical structure
- Preserve algorithm and formula completeness
- Optimize for downstream agent token efficiency
- Ensure technical content integrity
- Provide actionable quality assessments

Use the enhanced document-segmentation tools to deliver superior segmentation results that significantly improve planning agent performance.""",
                server_names=["document-segmentation"],
            )

            # Initialize the agent context
            await agent.__aenter__()

            # Publish the agent only once its context is live, so cleanup()
            # never tries to exit a context that was not entered.
            self.mcp_agent = agent

            # Attach LLM
            self.llm = await agent.attach_llm(get_preferred_llm_class())

            self.logger.info("DocumentSegmentationAgent initialized successfully")

        except Exception as e:
            self.logger.error(f"Failed to initialize DocumentSegmentationAgent: {e}")
            # When initialize() is reached through `async with`, a failure here
            # means __aexit__ is never called, so release the agent ourselves.
            await self.cleanup()
            raise

    async def cleanup(self):
        """
        Cleanup resources.

        Exits the MCP agent context if one is held and clears ``mcp_agent``
        and ``llm``. Safe to call repeatedly; errors raised while exiting are
        logged as warnings and not propagated.
        """
        # Detach first so a second call (or a failure below) cannot exit twice.
        agent, self.mcp_agent, self.llm = self.mcp_agent, None, None
        if not agent:
            return

        try:
            await agent.__aexit__(None, None, None)
        except Exception as e:
            self.logger.warning(f"Error during cleanup: {e}")

    async def analyze_and_prepare_document(
        self, paper_dir: str, force_refresh: bool = False
    ) -> Dict[str, Any]:
        """
        Ask the LLM to analyze and segment the document in ``paper_dir``.

        The directory must contain at least one ``.md`` file. The prompt
        instructs the LLM to call the ``analyze_and_segment_document`` tool
        with ``paper_dir`` and ``force_refresh`` and then report on the
        segmentation.

        Args:
            paper_dir: Path to the paper directory
            force_refresh: Value forwarded in the prompt as the tool's
                ``force_refresh`` parameter

        Returns:
            On success: ``status`` "success", ``paper_dir``, the LLM's text in
            ``analysis_result`` and ``segments_available`` True.
            On any failure (missing directory, no markdown file, agent not
            initialized, LLM error): ``status`` "error", ``paper_dir``,
            ``error_message`` and ``segments_available`` False.
        """
        try:
            self.logger.info(f"Starting document analysis for: {paper_dir}")

            # Check if markdown file exists
            md_files = [f for f in os.listdir(paper_dir) if f.endswith(".md")]
            if not md_files:
                raise ValueError(f"No markdown file found in {paper_dir}")

            llm = self._require_llm()

            # Use the enhanced document segmentation tool
            message = f"""Please perform intelligent semantic analysis and segmentation for the document in directory: {paper_dir}

Use the analyze_and_segment_document tool with these parameters:
- paper_dir: {paper_dir}
- force_refresh: {force_refresh}

**Focus on these enhanced objectives**:
1. **Semantic Document Classification**: Identify document type using content semantics (research_paper, algorithm_focused, technical_doc, etc.)
2. **Intelligent Segmentation Strategy**: Select the optimal strategy based on content analysis:
   - `semantic_research_focused` for research papers with high algorithm density
   - `algorithm_preserve_integrity` for algorithm-heavy documents
   - `concept_implementation_hybrid` for mixed concept/implementation content
3. **Algorithm Completeness**: Ensure algorithm blocks, formulas, and related descriptions remain logically connected
4. **Planning Agent Optimization**: Create segments that maximize effectiveness for ConceptAnalysisAgent, AlgorithmAnalysisAgent, and CodePlannerAgent

After segmentation, get a document overview and provide:
- Quality assessment of semantic segmentation approach
- Algorithm/formula integrity verification
- Recommendations for planning agent optimization
- Technical content completeness evaluation"""

            result = await llm.generate_str(message=message)

            self.logger.info("Document analysis completed successfully")

            # The LLM's answer is passed through as free text.
            return {
                "status": "success",
                "paper_dir": paper_dir,
                "analysis_result": result,
                "segments_available": True,
            }

        except Exception as e:
            self.logger.error(f"Error in document analysis: {e}")
            return {
                "status": "error",
                "paper_dir": paper_dir,
                "error_message": str(e),
                "segments_available": False,
            }

    async def get_document_overview(self, paper_dir: str) -> Dict[str, Any]:
        """
        Get overview of document structure and segments.

        Args:
            paper_dir: Path to the paper directory

        Returns:
            On success: ``status`` "success", ``paper_dir`` and the LLM's text
            in ``overview_result``. On failure (including an uninitialized
            agent): ``status`` "error", ``paper_dir`` and ``error_message``.
        """
        try:
            llm = self._require_llm()

            message = f"""Please provide an intelligent overview of the enhanced document segmentation for: {paper_dir}

Use the get_document_overview tool to retrieve:
- **Semantic Document Classification**: Document type and confidence score
- **Adaptive Segmentation Strategy**: Strategy used and reasoning
- **Segment Intelligence**: Total segments with enhanced metadata
- **Content Type Distribution**: Breakdown by algorithm, concept, formula, implementation content
- **Quality Intelligence Assessment**: Completeness, coherence, and planning agent optimization

Provide a comprehensive analysis focusing on:
1. Semantic vs structural segmentation quality
2. Algorithm and formula integrity preservation
3. Segment relevance for downstream planning agents
4. Technical content distribution and completeness"""

            result = await llm.generate_str(message=message)

            return {
                "status": "success",
                "paper_dir": paper_dir,
                "overview_result": result,
            }

        except Exception as e:
            self.logger.error(f"Error getting document overview: {e}")
            return {"status": "error", "paper_dir": paper_dir, "error_message": str(e)}

    async def validate_segmentation_quality(self, paper_dir: str) -> Dict[str, Any]:
        """
        Validate the quality of document segmentation.

        Requests a document overview first; if that fails its error payload is
        returned unchanged. Otherwise the LLM is asked to evaluate the
        segmentation against a fixed list of quality factors.

        Args:
            paper_dir: Path to the paper directory

        Returns:
            On success: ``status`` "success", ``paper_dir``, the LLM's text in
            ``validation_result`` and the overview payload in
            ``overview_data``. On failure: ``status`` "error", ``paper_dir``
            and ``error_message``.
        """
        try:
            # Get overview first
            overview_result = await self.get_document_overview(paper_dir)

            if overview_result["status"] != "success":
                return overview_result

            llm = self._require_llm()

            # Analyze enhanced segmentation quality
            message = f"""Based on the intelligent document overview for {paper_dir}, please evaluate the enhanced segmentation quality using advanced criteria.

**Enhanced Quality Assessment Factors**:
1. **Semantic Coherence**: Do segments maintain logical content boundaries vs mechanical structural splits?
2. **Algorithm Integrity**: Are algorithm blocks, formulas, and related explanations kept together?
3. **Content Type Optimization**: Are different content types (algorithm, concept, formula, implementation) properly identified and scored?
4. **Planning Agent Effectiveness**: Will ConceptAnalysisAgent, AlgorithmAnalysisAgent, and CodePlannerAgent receive optimal information?
5. **Dynamic Sizing**: Are segments adaptively sized based on content complexity rather than fixed limits?
6. **Technical Completeness**: Are critical technical details preserved without fragmentation?

**Provide specific recommendations for**:
- Semantic segmentation improvements
- Algorithm/formula integrity enhancements
- Planning agent optimization opportunities
- Content distribution balance adjustments"""

            validation_result = await llm.generate_str(message=message)

            return {
                "status": "success",
                "paper_dir": paper_dir,
                "validation_result": validation_result,
                "overview_data": overview_result,
            }

        except Exception as e:
            self.logger.error(f"Error validating segmentation quality: {e}")
            return {"status": "error", "paper_dir": paper_dir, "error_message": str(e)}


async def run_document_segmentation_analysis(
    paper_dir: str, logger: Optional[logging.Logger] = None, force_refresh: bool = False
) -> Dict[str, Any]:
    """
    Run segmentation analysis and, if it succeeds, a quality validation.

    A DocumentSegmentationAgent is opened for the duration of the call. The
    validation payload is stored under the "validation" key of the analysis
    result; when the analysis itself fails, its error payload is returned
    without a validation step.

    Args:
        paper_dir: Path to the paper directory
        logger: Optional logger instance
        force_refresh: Whether to force re-analysis

    Returns:
        Dict containing analysis results
    """
    async with DocumentSegmentationAgent(logger=logger) as agent:
        outcome = await agent.analyze_and_prepare_document(
            paper_dir, force_refresh=force_refresh
        )

        # Nothing to validate when the analysis did not succeed.
        if outcome["status"] != "success":
            return outcome

        outcome["validation"] = await agent.validate_segmentation_quality(paper_dir)
        return outcome


# Utility function for integration with existing workflow
async def prepare_document_segments(
    paper_dir: str, logger: Optional[logging.Logger] = None
) -> Dict[str, Any]:
    """
    Prepare document segments for ``paper_dir`` and summarize the outcome.

    Runs run_document_segmentation_analysis() with force_refresh disabled and
    converts its result into a flat status payload. Failures of any kind are
    logged and returned as an error payload; nothing is raised.

    Args:
        paper_dir: Path to the paper directory containing markdown file
        logger: Optional logger instance for tracking

    Returns:
        On success: ``status`` "success", ``paper_dir``, ``segments_dir``
        (``paper_dir``/document_segments), ``segments_ready`` True,
        ``analysis_summary`` and ``validation_summary``.
        On failure: ``status`` "error", ``paper_dir``, ``segments_ready``
        False and ``error_message``.
    """
    try:
        logger = logger or logging.getLogger(__name__)
        logger.info(f"Preparing document segments for: {paper_dir}")

        analysis = await run_document_segmentation_analysis(
            paper_dir=paper_dir,
            logger=logger,
            force_refresh=False,  # Use cached analysis if available
        )

        if analysis["status"] != "success":
            logger.error(
                f"Document segmentation failed: {analysis.get('error_message', 'Unknown error')}"
            )
            failure = {
                "status": "error",
                "paper_dir": paper_dir,
                "segments_ready": False,
            }
            failure["error_message"] = analysis.get(
                "error_message", "Document segmentation failed"
            )
            return failure

        logger.info("Document segments prepared successfully")

        # Metadata for downstream agents
        validation = analysis.get("validation", {})
        return {
            "status": "success",
            "paper_dir": paper_dir,
            "segments_dir": os.path.join(paper_dir, "document_segments"),
            "segments_ready": True,
            "analysis_summary": analysis.get("analysis_result", ""),
            "validation_summary": validation.get("validation_result", ""),
        }

    except Exception as e:
        logger.error(f"Error preparing document segments: {e}")
        return {
            "status": "error",
            "paper_dir": paper_dir,
            "segments_ready": False,
            "error_message": str(e),
        }


================================================
FILE: workflows/agents/memory_agent_concise.py
================================================
"""
Concise Memory Agent for Code Implementation Workflow

This memory agent implements a focused approach:
1. Before first file: Normal conversation flow
2. After first file: Keep only system_prompt + initial_plan + current round tool results
3. Clean slate for each new code file generation

Key Features:
- Preserves system prompt and initial plan always
- After first file generation, discards previous conversation history
- Keeps only current round tool results from essential tools:
  * read_code_mem, read_file, write_file
  * execute_python, execute_bash
  * search_code, search_reference_code, get_file_structure
- Provides clean, focused input for next write_file operation
"""

import json
import logging
import os
import time
from datetime import datetime
from typing import Dict, Any, List, Optional


class ConciseMemoryAgent:
    """
    Concise Memory Agent - Focused Information Retention

    Core Philosophy:
    - Preserve essential context (system prompt + initial plan)
    - After first file generation, use clean slate approach
    - Keep only current round tool results from all essential MCP tools
    - Remove conversational clutter and previous tool calls

    Essential Tools Tracked:
    - File Operations: read_code_mem, read_file, write_file
    - Code Analysis: search_code, search_reference_code, get_file_structure
    - Execution: execute_python, execute_bash
    """

    def __init__(
        self,
        initial_plan_content: str,
        logger: Optional[logging.Logger] = None,
        target_directory: Optional[str] = None,
        default_models: Optional[Dict[str, str]] = None,
        code_directory: Optional[str] = None,
    ):
        """
        Initialize Concise Memory Agent

        Args:
            initial_plan_content: Content of initial_plan.txt
            logger: Logger instance
            target_directory: Target directory for saving summaries
            default_models: Default models configuration from workflow
            code_directory: Generated code directory path (e.g., target_directory/generate_code)
        """
        self.logger = logger or self._create_default_logger()
        self.initial_plan = initial_plan_content

        # Store default models configuration
        self.default_models = default_models or {
            "anthropic": "claude-sonnet-4-20250514",
            "openai": "o3-mini",
            "google": "gemini-2.0-flash",
        }

        # Memory state tracking - new logic: trigger after each write_file
        self.last_write_file_detected = (
            False  # Track if write_file was called in current iteration
        )
        self.should_clear_memory_next = False  # Flag to clear memory in next round
        self.current_round = 0

        # Parse phase structure from initial plan
        self.phase_structure = self._parse_phase_structure()

        # Memory configuration
        if target_directory:
            self.save_path = target_directory
        else:
            self.save_path = "./deepcode_lab/papers/1/"

        # Store code directory for file extraction
        self.code_directory = code_directory or os.path.join(
            self.save_path, "generate_code"
        )

        # Extract all files - prioritize generated directory over plan parsing
        self.all_files_list = self._extract_all_files()

        # Code summary file path
        self.code_summary_path = os.path.join(
            self.save_path, "implement_code_summary.md"
        )

        # Current round tool results storage
        self.current_round_tool_results = []

        # Track all implemented files
        self.implemented_files = []

        # Store Next Steps information temporarily (not saved to file)
        self.current_next_steps = ""

        self.logger.info(
            f"Concise Memory Agent initialized with target directory: {self.save_path}"
        )
        self.logger.info(f"Code directory: {self.code_directory}")
        self.logger.info(f"Code summary will be saved to: {self.code_summary_path}")
        # self.logger.info(f"🤖 Using models - Anthropic: {self.default_models['anthropic']}, OpenAI: {self.default_models['openai']}")
        self.logger.info(
            "📝 NEW LOGIC: Memory clearing triggered after each write_file call"
        )

    def _create_default_logger(self) -> logging.Logger:
        """Create default logger"""
        logger = logging.getLogger(f"{__name__}.ConciseMemoryAgent")
        logger.setLevel(logging.INFO)
        return logger

    def _parse_phase_structure(self) -> Dict[str, List[str]]:
        """Parse implementation phases from initial plan"""
        try:
            phases = {}
            lines = self.initial_plan.split("\n")
            current_phase = None

            for line in lines:
                if "Phase" in line and ":" in line:
                    # Extract phase name
                    phase_parts = line.split(":")
                    if len(phase_parts) >= 2:
                        current_phase = phase_parts[0].strip()
                        phases[current_phase] = []
                elif current_phase and line.strip().startswith("-"):
                    # This is a file in the current phase
                    file_line = line.strip()[1:].strip()
                    if file_line.startswith("`") and file_line.endswith("`"):
                        file_name = file_line[1:-1]
                        phases[current_phase].append(file_name)
                elif current_phase and not line.strip():
                    # Empty line might indicate end of phase
                    continue
                elif current_phase and line.strip().startswith("###"):
                    # New section, end current phase
                    current_phase = None

            return phases

        except Exception as e:
            self.logger.warning(f"Failed to parse phase structure: {e}")
            return {}

    def _extract_all_files(self) -> List[str]:
        """
        Extract all code files - prioritizes generated directory over plan parsing

        Strategy:
        1. First try to extract from the generated code directory (reliable)
        2. Fall back to plan parsing if directory doesn't exist yet

        Returns:
            List of all file paths that should be implemented
        """
        # Try extracting from generated directory first (more reliable)
        if os.path.exists(self.code_directory):
            files_from_dir = self._extract_files_from_generated_directory()
            if files_from_dir:
                self.logger.info(
                    f"📁 Extracted {len(files_from_dir)} files from generated directory"
                )
                return files_from_dir

        # Fall back to plan parsing
        self.logger.info(
            "📁 Generated directory not found, extracting from plan (less reliable)"
        )
        return self._extract_all_files_from_plan()

    def _extract_files_from_generated_directory(self) -> List[str]:
        """
        Extract all code files from the generated code directory
        This is more reliable than parsing the LLM-generated plan

        Returns:
            List of relative file paths within the code directory
        """
        code_files = []

        # Define code file extensions to track
        code_extensions = {
            ".py",
            ".js",
            ".ts",
            ".jsx",
            ".tsx",
            ".vue",
            ".html",
            ".css",
            ".scss",
            ".sass",
            ".less",
            ".json",
            ".yaml",
            ".yml",
            ".toml",
            ".xml",
            ".ini",
            ".cfg",
            ".md",
            ".rst",
            ".txt",
            ".sh",
            ".bash",
            ".zsh",
            ".bat",
            ".ps1",
            ".cmd",
            ".c",
            ".cpp",
            ".h",
            ".hpp",
            ".cc",
            ".cxx",
            ".java",
            ".kt",
            ".scala",
            ".go",
            ".rs",
            ".php",
            ".rb",
            ".pl",
            ".lua",
            ".r",
            ".sql",
        }

        # Files and directories to exclude
        exclude_patterns = {
            "__pycache__",
            ".pyc",
            "node_modules",
            ".git",
            ".vscode",
            ".idea",
            "dist",
            "build",
            "output",
            ".egg-info",
            "venv",
            ".venv",
            "env",
            ".env",
        }

        try:
            for root, dirs, files in os.walk(self.code_directory):
                # Filter out excluded directories
                dirs[:] = [
                    d
                    for d in dirs
                    if d not in exclude_patterns and not d.startswith(".")
                ]

                for file in files:
                    # Skip hidden files and excluded patterns
                    if file.startswith("."):
                        continue

                    # Check if file has a code extension
                    has_code_ext = any(
                        file.lower().endswith(ext) for ext in code_extensions
                    )
                    if not has_code_ext:
                        continue

                    # Get full path and convert to relative path
                    full_path = os.path.join(root, file)
                    relative_path = os.path.relpath(full_path, self.code_directory)

                    # Normalize path separators
                    relative_path = relative_path.replace(os.sep, "/")

                    code_files.append(relative_path)

            # Sort for consistency
            code_files = sorted(code_files)

            if code_files:
                self.logger.info(f"📄 Found {len(code_files)} code files in directory")
                self.logger.info(f"📄 Sample files: {code_files[:3]}...")

            return code_files

        except Exception as e:
            self.logger.error(f"Failed to extract files from directory: {e}")
            return []

    def _extract_all_files_from_plan(self) -> List[str]:
        """
        Extract all file paths from the file_structure section in initial plan
        Handles multiple formats: tree structure, YAML, and simple lists

        Returns:
            List of all file paths that should be implemented
        """
        try:
            lines = self.initial_plan.split("\n")
            files = []

            # Method 1: Try to extract from tree structure in file_structure section
            files.extend(self._extract_from_tree_structure(lines))

            # Method 2: If no files found, try to extract from simple list format
            if not files:
                files.extend(self._extract_from_simple_list(lines))

            # Method 3: If still no files, try to extract from anywhere in the plan
            if not files:
                files.extend(self._extract_from_plan_content(lines))

            # Clean and validate file paths
            cleaned_files = self._clean_and_validate_files(files)

            # Log the extracted files
            self.logger.info(
                f"📁 Extracted {len(cleaned_files)} files from initial plan"
            )
            if cleaned_files:
                self.logger.info(f"📁 Sample files: {cleaned_files[:3]}...")

            return cleaned_files

        except Exception as e:
            self.logger.error(f"Failed to extract files from initial plan: {e}")
            return []

    def _extract_from_tree_structure(self, lines: List[str]) -> List[str]:
        """
        Extract files from tree structure format - Advanced algorithm with multi-strategy approach

        Strategy:
        1. Precise indentation-based depth calculation
        2. Smart directory vs file detection using multiple heuristics
        3. Robust path stack management with depth tracking
        4. Fallback to regex pattern matching if tree parsing fails
        """
        files = []
        in_file_structure = False

        # Enhanced path tracking: store (depth, name) pairs
        path_stack = []  # [(depth, dir_name), ...]
        root_dir = None

        # Track the base indentation of tree structure
        base_indent = None

        for line_num, line in enumerate(lines):
            # === Section Boundary Detection ===
            if "file_structure:" in line or "file_structure |" in line:
                in_file_structure = True
                continue

            # End of file_structure section (next YAML key without indentation)
            if (
                in_file_structure
                and line.strip()
                and not line.startswith(" ")
                and ":" in line
            ):
                break

            if not in_file_structure:
                continue

            if not line.strip():
                continue

            # Skip YAML comments and keys that are clearly not files
            stripped = line.strip()
            if stripped.startswith("#") or (
                stripped.endswith(":") and "/" not in stripped
            ):
                continue

            # === Root Directory Detection ===
            # Pattern: "project-name/" at minimal indentation, no tree chars
            if stripped.endswith("/") and not any(
                c in line for c in ["├", "└", "│", "─"]
            ):
                indent = len(line) - len(line.lstrip())
                if indent <= 4:  # Root level
                    root_dir = stripped.rstrip("/")
                    path_stack = []
                    base_indent = None
                    self.logger.debug(f"🌳 Detected root directory: {root_dir}")
                    continue

            # === Tree Structure Line Detection ===
            has_tree_chars = any(c in line for c in ["├", "└", "│", "─"])
            if not has_tree_chars:
                continue

            # === Calculate Precise Depth ===
            # Method: Count the actual tree structure symbols to determine hierarchy
            indent = len(line) - len(line.lstrip())

            # Set base indent on first tree line
            if base_indent is None:
                base_indent = indent

            # Count tree depth indicators
            # Each "│   " or "    " block represents one level
            # "├── " or "└── " marks the current item
            tree_prefix = line[
                : line.find("├")
                if "├" in line
                else line.find("└")
                if "└" in line
                else len(line)
            ]

            # Count depth by analyzing tree prefix structure
            # Pattern: "    │   │   ├── filename" -> depth 3
            # Pattern: "    ├── filename" -> depth 1
            # Pattern: "    │   ├── filename" -> depth 2

            depth = 0
            i = 0
            while i < len(tree_prefix):
                # Look for pipe or tree junction
                if i + 4 <= len(tree_prefix):
                    chunk = tree_prefix[i : i + 4]
                    if "│" in chunk or all(c == " " for c in chunk):
                        depth += 1
                        i += 4
                    else:
                        i += 1
                else:
                    break

            # Fallback: use relative indentation
            if depth == 0:
                depth = max(1, (indent - base_indent) // 4 + 1)

            # === Clean and Extract Item Name ===
            item_name = line
            # Remove all tree characters
            for pattern in ["├──", "└──", "│", "├", "└", "─"]:
                item_name = item_name.replace(pattern, "")
            item_name = item_name.strip()

            # Remove inline comments
            if "#" in item_name:
                item_name = item_name.split("#")[0].strip()

            if not item_name or ":" in item_name:
                continue

            # === Smart Directory vs File Detection ===
            is_directory = self._is_directory(item_name)

            # === Update Path Stack ===
            # Remove items deeper than current depth
            path_stack = [(d, n) for d, n in path_stack if d < depth]

            if is_directory:
                dir_name = item_name.rstrip("/")
                path_stack.append((depth, dir_name))
                self.logger.debug(f"  {'  ' * depth}📁 {dir_name} (depth={depth})")
            else:
                # Construct full file path
                path_parts = [root_dir] if root_dir else []
                path_parts.extend([name for _, name in path_stack])
                path_parts.append(item_name)

                full_path = "/".join(path_parts)
                files.append(full_path)
                self.logger.debug(f"  {'  ' * depth}📄 {full_path}")

        return files

    def _is_directory(self, name: str) -> bool:
        """
        Advanced directory detection using multiple heuristics

        Returns True if the name represents a directory, False if it's a file
        """
        # Rule 1: Explicit directory marker
        if name.endswith("/"):
            return True

        # Rule 2: Has file extension -> definitely a file
        basename = name.split("/")[-1]
        if "." in basename:
            # Check if it's a known file extension
            known_extensions = [
                ".py",
                ".js",
                ".ts",
                ".jsx",
                ".tsx",
                ".vue",
                ".html",
                ".css",
                ".scss",
                ".sass",
                ".json",
                ".yaml",
                ".yml",
                ".xml",
                ".toml",
                ".md",
                ".txt",
                ".rst",
                ".sh",
                ".bat",
                ".ps1",
                ".c",
                ".cpp",
                ".h",
                ".hpp",
                ".java",
                ".go",
                ".rs",
                ".sql",
                ".db",
                ".env",
                ".gitignore",
                ".dockerignore",
                ".lock",
                ".sum",
                ".mod",
            ]
            if any(basename.lower().endswith(ext) for ext in known_extensions):
                return False

            # Has extension but not recognized -> might be config file, treat as file
            if basename.count(".") == 1:
                return False

        # Rule 3: Known special files without extensions
        special_files = [
            "README",
            "LICENSE",
            "CHANGELOG",
            "CONTRIBUTING",
            "Makefile",
            "Dockerfile",
            "Vagrantfile",
            "requirements.txt",
            "setup.py",
            "setup.cfg",
            "package.json",
            "package-lock.json",
            "Cargo.toml",
            "go.mod",
        ]
        if basename in special_files or basename.upper() in special_files:
            return False

        # Rule 4: Common directory names (even without trailing /)
        common_dirs = [
            "src",
            "lib",
            "app",
            "core",
            "api",
            "web",
            "client",
            "server",
            "config",
            "configs",
            "settings",
            "data",
            "datasets",
            "models",
            "model",
            "utils",
            "helpers",
            "common",
            "shared",
            "tests",
            "test",
            "testing",
            "__tests__",
            "docs",
            "documentation",
            "scripts",
            "bin",
            "tools",
            "assets",
            "static",
            "public",
            "resources",
            "components",
            "views",
            "pages",
            "routes",
            "services",
            "controllers",
            "handlers",
            "middleware",
            "middlewares",
            "types",
            "interfaces",
            "schemas",
            "experiments",
            "notebooks",
            "dist",
            "build",
            "output",
            "node_modules",
            "vendor",
            "packages",
            "__pycache__",
            ".git",
            ".vscode",
            "training",
            "evaluation",
            "inference",
        ]
        if basename.lower() in common_dirs:
            return True

        # Rule 5: Plural forms often indicate directories
        if basename.endswith("s") and len(basename) > 3:
            singular = basename[:-1]
            if singular in common_dirs:
                return True

        # Rule 6: Python package indicators
        if basename == "__init__.py":
            return False  # This is a file

        # Default: if no extension and not a known file, likely a directory
        return "." not in basename

    def _extract_from_simple_list(self, lines: List[str]) -> List[str]:
        """Extract files from simple list format (- filename)"""
        files = []

        for line in lines:
            line = line.strip()
            if line.startswith("- ") and not line.startswith('- "'):
                # Remove leading "- " and clean up
                filename = line[2:].strip()

                # Remove quotes if present
                if filename.startswith('"') and filename.endswith('"'):
                    filename = filename[1:-1]

                # Check if it looks like a file (has extension)
                if "." in filename and "/" in filename:
                    files.append(filename)

        return files

    def _extract_from_plan_content(self, lines: List[str]) -> List[str]:
        """
        Advanced fallback extraction: Extract files from anywhere in the plan content
        Uses multiple regex patterns and intelligent filtering
        """
        files = []
        import re

        # === Pattern 1: Standard file paths ===
        # Matches: path/to/file.py, src/model/apt_layer.py
        pattern1 = r"([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.[a-zA-Z0-9]+)"

        # === Pattern 2: Quoted file paths ===
        # Matches: "path/to/file.py", 'src/utils.py'
        pattern2 = r'["\']([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.[a-zA-Z0-9]+)["\']'

        # === Pattern 3: File paths with special characters ===
        # Matches: data/data_loader.py, __init__.py paths
        pattern3 = r"([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)*/__init__\.py)"
        pattern4 = r"([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.(?:py|js|ts|jsx|tsx|html|css|md|txt|json|yaml|yml|xml|sql|sh|bat))"

        # === Pattern 5: Backtick-wrapped paths (in code blocks) ===
        pattern5 = r"`([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.[a-zA-Z0-9]+)`"

        all_patterns = [pattern1, pattern2, pattern3, pattern4, pattern5]

        # Collect all potential matches
        potential_files = set()

        for line in lines:
            # Skip comment-only lines
            stripped = line.strip()
            if stripped.startswith("#") and not ("/" in stripped and "." in stripped):
                continue

            # Apply all patterns
            for pattern in all_patterns:
                matches = re.findall(pattern, line)
                potential_files.update(matches)

        # === Filter and validate matches ===
        code_extensions = {
            ".py",
            ".js",
            ".ts",
            ".jsx",
            ".tsx",
            ".vue",
            ".html",
            ".css",
            ".scss",
            ".sass",
            ".less",
            ".json",
            ".yaml",
            ".yml",
            ".toml",
            ".xml",
            ".ini",
            ".cfg",
            ".md",
            ".rst",
            ".txt",
            ".sh",
            ".bash",
            ".zsh",
            ".bat",
            ".ps1",
            ".cmd",
            ".c",
            ".cpp",
            ".h",
            ".hpp",
            ".cc",
            ".cxx",
            ".java",
            ".kt",
            ".scala",
            ".go",
            ".rs",
            ".php",
            ".rb",
            ".pl",
            ".lua",
            ".r",
            ".sql",
            ".db",
            ".dockerfile",
            ".env",
            ".gitignore",
            ".lock",
            ".sum",
            ".mod",
        }

        for file_path in potential_files:
            # Must have path separator
            if "/" not in file_path:
                continue

            # Must have valid extension
            has_valid_ext = any(
                file_path.lower().endswith(ext) for ext in code_extensions
            )
            if not has_valid_ext:
                continue

            # Filter out obvious non-files
            if any(
                bad in file_path.lower()
                for bad in [
                    "http://",
                    "https://",
                    ".png",
                    ".jpg",
                    ".jpeg",
                    ".gif",
                    ".svg",
                    ".ico",
                ]
            ):
                continue

            # Must not be too short (avoid false positives)
            if len(file_path) < 5:
                continue

            # Path components should be reasonable
            parts = file_path.split("/")
            if any(len(part) == 0 for part in parts):
                continue

            files.append(file_path)

        # Sort for consistency
        files = sorted(list(set(files)))

        return files

    def _clean_and_validate_files(self, files: List[str]) -> List[str]:
        """
        Clean and validate extracted file paths - advanced filtering and deduplication

        Features:
        1. Remove duplicates while preserving order
        2. Normalize paths (handle ../,  ./, double slashes)
        3. Filter out non-code files
        4. Smart deduplication (recognize same file with different path prefixes)
        """
        cleaned_files = []
        seen_normalized = set()

        # Define code file extensions we want to track
        code_extensions = {
            ".py",
            ".js",
            ".ts",
            ".jsx",
            ".tsx",
            ".vue",
            ".html",
            ".css",
            ".scss",
            ".sass",
            ".less",
            ".json",
            ".yaml",
            ".yml",
            ".toml",
            ".xml",
            ".ini",
            ".cfg",
            ".md",
            ".rst",
            ".txt",
            ".sh",
            ".bash",
            ".zsh",
            ".bat",
            ".ps1",
            ".cmd",
            ".c",
            ".cpp",
            ".h",
            ".hpp",
            ".cc",
            ".cxx",
            ".java",
            ".kt",
            ".scala",
            ".go",
            ".rs",
            ".php",
            ".rb",
            ".pl",
            ".lua",
            ".r",
            ".sql",
            ".db",
            ".dockerfile",
            ".env",
            ".gitignore",
            ".lock",
            ".sum",
            ".mod",
        }

        for file_path in files:
            # === Step 1: Basic Cleaning ===
            cleaned_path = file_path.strip().strip('"').strip("'").strip("`")

            if not cleaned_path:
                continue

            # Remove leading/trailing slashes
            cleaned_path = cleaned_path.strip("/")

            # === Step 2: Path Normalization ===
            # Remove double slashes
            while "//" in cleaned_path:
                cleaned_path = cleaned_path.replace("//", "/")

            # Handle relative paths (remove ./ prefix)
            if cleaned_path.startswith("./"):
                cleaned_path = cleaned_path[2:]

            # === Step 3: Validate File Structure ===
            # Must have filename (not just directory)
            if not cleaned_path or "/" not in cleaned_path:
                # Single file without path - only accept if it has extension
                if "." not in cleaned_path:
                    continue

            # Extract basename
            basename = cleaned_path.split("/")[-1]

            # Skip directories (no file extension in basename)
            if "." not in basename:
                continue

            # === Step 4: Extension Validation ===
            # Only include files with code extensions
            has_code_extension = any(
                cleaned_path.lower().endswith(ext) for ext in code_extensions
            )
            if not has_code_extension:
                continue

            # === Step 5: Filter Invalid Patterns ===
            # Skip files that look like YAML keys or config entries
            if ":" in cleaned_path and not any(
                cleaned_path.endswith(ext) for ext in [".yaml", ".yml"]
            ):
                continue

            # Skip paths with invalid characters
            if any(
                char in cleaned_path for char in ['"', "'", "|", "<", ">", "*", "?"]
            ):
                continue

            # Skip obvious build/temp artifacts
            if any(
                part in cleaned_path
                for part in [
                    "__pycache__",
                    ".pyc",
                    "node_modules",
                    ".git/",
                    "dist/build",
                ]
            ):
                continue

            # === Step 6: Smart Deduplication ===
            # Normalize for comparison (lowercase, remove common prefixes)
            normalized_for_comparison = cleaned_path.lower()

            # Check if we've already seen this file (exact match)
            if normalized_for_comparison in seen_normalized:
                continue

            # Check for duplicate with different path (e.g., "src/model/apt_layer.py" vs "model/apt_layer.py")
            # Keep the longer (more specific) path
            is_duplicate = False
            paths_to_remove = []

            for existing_normalized in seen_normalized:
                # If current path is suffix of existing, it's a shorter version - skip it
                if existing_normalized.endswith("/" + normalized_for_comparison):
                    is_duplicate = True
                    break

                # If existing path is suffix of current, current is longer - replace existing
                if normalized_for_comparison.endswith("/" + existing_normalized):
                    paths_to_remove.append(existing_normalized)

            if is_duplicate:
                continue

            # Remove shorter versions
            for path_to_remove in paths_to_remove:
                seen_normalized.discard(path_to_remove)
                # Also remove from cleaned_files list
                cleaned_files = [
                    f for f in cleaned_files if f.lower() != path_to_remove
                ]

            # === Step 7: Add to Results ===
            seen_normalized.add(normalized_for_comparison)
            cleaned_files.append(cleaned_path)

        return sorted(cleaned_files)

    def record_file_implementation(
        self, file_path: str, implementation_content: str = ""
    ):
        """
        Record a newly implemented file (simplified version)
        NEW LOGIC: File implementation is tracked via write_file tool detection

        Args:
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
        """
        # Add file to implemented files list if not already present
        if file_path not in self.implemented_files:
            self.implemented_files.append(file_path)

        self.logger.info(f"📝 File implementation recorded: {file_path}")

    async def create_code_implementation_summary(
        self,
        client,
        client_type: str,
        file_path: str,
        implementation_content: str,
        files_implemented: int,
    ) -> str:
        """
        Produce, persist and return an LLM-written summary for a freshly
        implemented file.

        Steps: record the file, build the summary prompt, call the LLM, split
        the reply into sections, keep the "next_steps" section only in
        ``self.current_next_steps``, format the remaining sections and append
        them to the summary file. Any exception along the way is logged and a
        fallback summary is returned instead (nothing is saved in that case).

        Args:
            client: LLM client instance
            client_type: Type of LLM client (forwarded to _call_llm_for_summary)
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
            files_implemented: Number of files implemented so far

        Returns:
            The formatted summary that was saved, or the fallback summary on failure
        """
        # Sections written to the summary file, in output order.
        # "next_steps" is deliberately absent: it is only held in memory.
        persisted_keys = (
            "core_purpose",
            "public_interface",
            "internal_dependencies",
            "external_dependencies",
            "implementation_notes",
        )

        try:
            self.record_file_implementation(file_path, implementation_content)

            prompt_text = self._create_code_summary_prompt(
                file_path, implementation_content, files_implemented
            )
            llm_reply = await self._call_llm_for_summary(
                client, client_type, [{"role": "user", "content": prompt_text}]
            )
            parsed = self._extract_summary_sections(llm_reply.get("content", ""))

            # Next Steps live only on the instance, never in the file.
            self.current_next_steps = parsed.get("next_steps", "")
            if self.current_next_steps:
                self.logger.info("📝 Next Steps stored temporarily (not saved to file)")

            # Non-empty sections separated by a blank line, outer whitespace removed.
            summary_body = "\n\n".join(
                parsed[key] for key in persisted_keys if parsed.get(key)
            ).strip()

            formatted_summary = self._format_code_implementation_summary(
                file_path, summary_body, files_implemented
            )
            await self._save_code_summary_to_file(formatted_summary, file_path)

            self.logger.info(f"Created and saved code summary for: {file_path}")
            return formatted_summary

        except Exception as e:
            self.logger.error(
                f"Failed to create LLM-based code implementation summary: {e}"
            )
            return self._create_fallback_code_summary(
                file_path, implementation_content, files_implemented
            )

    def _create_code_summary_prompt(
        self, file_path: str, implementation_content: str, files_implemented: int
    ) -> str:
        """
        Create prompt for LLM to generate code implementation summary

        Args:
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
            files_implemented: Number of files implemented so far

        Returns:
            Prompt for LLM summarization
        """
        current_round = self.current_round

        # Get formatted file lists
        file_lists = self.get_formatted_files_lists()
        implemented_files_list = file_lists["implemented"]
        unimplemented_files_list = file_lists["unimplemented"]

        prompt = f"""You are an expert code implementation summarizer. Analyze the implemented code file and create a structured summary.

**🚨 CRITICAL: The files listed below are ALREADY IMPLEMENTED - DO NOT suggest them in Next Steps! 🚨**

**All Previously Implemented Files:**
{implemented_files_list}

**Remaining Unimplemented Files (choose ONLY from these for Next Steps):**
{unimplemented_files_list}

**Current Implementation Context:**
- **File Implemented**: {file_path}
- **Current Round**: {current_round}
- **Total Files Implemented**: {files_implemented}


**Initial Plan Reference:**
{self.initial_plan[:]}

**Implemented Code Content:**
```
{implementation_content[:]}
```

**Required Summary Format:**

**Core Purpose** (provide a general overview of the file's main responsibility):
- {{1-2 sentence description of file's main responsibility}}

**Public Interface** (what other files can use, if any):
- Class {{ClassName}}: {{purpose}} | Key methods: {{method_names}} | Constructor params: {{params}}
- Function {{function_name}}({{params}}): {{purpose}} -> {{return_type}}: {{purpose}}
- Constants/Types: {{name}}: {{value/description}}

**Internal Dependencies** (what this file imports/requires, if any):
- From {{module/file}}: {{specific_imports}}
- External packages: {{package_name}} - {{usage_context}}

**External Dependencies** (what depends on this file, if any):
- Expected to be imported by: {{likely_consumer_files}}
- Key exports used elsewhere: {{main_interfaces}}

**Implementation Notes**: (if any)
- Architecture decisions: {{key_choices_made}}
- Cross-File Relationships: {{how_files_work_together}}

**Next Steps**: List the code file (ONLY ONE) that will be implemented in the next round (MUST choose from "Remaining Unimplemented Files" above)
  Format: Code will be implemented: {{file_path}}
  **NEVER suggest any file from the "All Previously Implemented Files" list!**

**Instructions:**
- Be precise and concise
- Focus on function interfaces that other files will need
- Extract actual function signatures from the code
- **CRITICAL: For Next Steps, ONLY choose ONE file from the "Remaining Unimplemented Files" list above**
- **NEVER suggest implementing a file that is already in the implemented files list**
- Choose the next file based on logical dependencies and implementation order
- Use the exact format specified above

**Summary:**"""

        return prompt

    # TODO: The prompt is not good enough and needs to be improved.
    # **Implementation Progress**: List the code file completed in current round and core implementation ideas
    #   Format: {{file_path}}: {{core implementation ideas}}

    # **Dependencies**: According to the File Structure and initial plan, list functions that may be called by other files
    #   Format: {{file_path}}: Function {{function_name}}: core ideas--{{ideas}}; Required parameters--{{params}}; Return parameters--{{returns}}
    #   Required packages: {{packages}}

    def _extract_summary_sections(self, llm_summary: str) -> Dict[str, str]:
        """
        Extract different sections from LLM-generated summary

        Args:
            llm_summary: Raw LLM-generated summary text

        Returns:
            Dictionary with extracted sections: core_purpose, public_interface, internal_dependencies,
            external_dependencies, implementation_notes, next_steps
        """
        sections = {
            "core_purpose": "",
            "public_interface": "",
            "internal_dependencies": "",
            "external_dependencies": "",
            "implementation_notes": "",
            "next_steps": "",
        }

        try:
            lines = llm_summary.split("\n")
            current_section = None
            current_content = []

            for line in lines:
                line_lower = line.lower().strip()

                # Check for section headers
                if "core purpose" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "core_purpose"
                    current_content = [line]  # Include the header
                elif "public interface" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "public_interface"
                    current_content = [line]  # Include the header
                elif "internal dependencies" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "internal_dependencies"
                    current_content = [line]  # Include the header
                elif "external dependencies" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "external_dependencies"
                    current_content = [line]  # Include the header
                elif "implementation notes" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "implementation_notes"
                    current_content = [line]  # Include the header
                elif "next steps" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "next_steps"
                    current_content = [line]  # Include the header
                else:
                    # Add content to current section
                    if current_section:
                        current_content.append(line)

            # Don't forget the last section
            if current_section and current_content:
                sections[current_section] = "\n".join(current_content).strip()

            self.logger.info(f"📋 Extracted sections: {list(sections.keys())}")

        except Exception as e:
            self.logger.error(f"Failed to extract summary sections: {e}")
            # Fallback: put everything in core_purpose
            sections["core_purpose"] = llm_summary

        return sections

    def _format_code_implementation_summary(
        self, file_path: str, llm_summary: str, files_implemented: int
    ) -> str:
        """
        Format the LLM-generated summary into the final structure

        Args:
            file_path: Path of the implemented file
            llm_summary: LLM-generated summary content
            files_implemented: Number of files implemented so far

        Returns:
            Formatted summary
        """
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # # Create formatted list of implemented files
        # implemented_files_list = (
        #     "\n".join([f"- {file}" for file in self.implemented_files])
        #     if self.implemented_files
        #     else "- None yet"
        # )

        #         formatted_summary = f"""# Code Implementation Summary
        # **All Previously Implemented Files:**
        # {implemented_files_list}
        # **Generated**: {timestamp}
        # **File Implemented**: {file_path}
        # **Total Files Implemented**: {files_implemented}

        # {llm_summary}

        # ---
        # *Auto-generated by Memory Agent*
        # """
        formatted_summary = f"""# Code Implementation Summary
**Generated**: {timestamp}
**File Implemented**: {file_path}

{llm_summary}

---
*Auto-generated by Memory Agent*
"""
        return formatted_summary

    def _create_fallback_code_summary(
        self, file_path: str, implementation_content: str, files_implemented: int
    ) -> str:
        """
        Create fallback summary when LLM is unavailable

        Args:
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
            files_implemented: Number of files implemented so far

        Returns:
            Fallback summary
        """
        # Create formatted list of implemented files
        implemented_files_list = (
            "\n".join([f"- {file}" for file in self.implemented_files])
            if self.implemented_files
            else "- None yet"
        )

        summary = f"""# Code Implementation Summary
**All Previously Implemented Files:**
{implemented_files_list}
**Generated**: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}
**File Implemented**: {file_path}
**Total Files Implemented**: {files_implemented}
**Summary failed to generate.**

---
*Auto-generated by Concise Memory Agent (Fallback Mode)*
"""
        return summary

    async def _save_code_summary_to_file(self, new_summary: str, file_path: str):
        """
        Append code implementation summary to implement_code_summary.md
        Accumulates all implementations with clear separators

        Args:
            new_summary: New summary content to append
            file_path: Path of the file for which the summary was generated
        """
        try:
            # Create directory if it doesn't exist
            os.makedirs(os.path.dirname(self.code_summary_path), exist_ok=True)

            # Check if file exists to determine if we need header
            file_exists = os.path.exists(self.code_summary_path)

            # Open in append mode to accumulate all implementations
            with open(self.code_summary_path, "a", encoding="utf-8") as f:
                if not file_exists:
                    # Write header for new file
                    f.write("# Code Implementation Progress Summary\n")
                    f.write("*Accumulated implementation progress for all files*\n\n")

                # Add clear separator between implementations
                f.write("\n" + "=" * 80 + "\n")
                f.write(
                    f"## IMPLEMENTATION File {file_path}; ROUND {self.current_round} \n"
                )
                f.write("=" * 80 + "\n\n")

                # Write the new summary
                f.write(new_summary)
                f.write("\n\n")

            self.logger.info(
                f"Appended LLM-based code implementation summary to: {self.code_summary_path}"
            )

        except Exception as e:
            self.logger.error(f"Failed to save code implementation summary: {e}")

    async def _call_llm_for_summary(
        self, client, client_type: str, summary_messages: List[Dict]
    ) -> Dict[str, Any]:
        """
        Call LLM for code implementation summary generation ONLY

        This method is used only for creating code implementation summaries,
        NOT for conversation summarization which has been removed.
        """
        if client_type == "anthropic":
            response = await client.messages.create(
                model=self.default_models["anthropic"],
                system="You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches.",
                messages=summary_messages,
                max_tokens=5000,
                temperature=0.2,
            )

            content = ""
            if response and hasattr(response, "content") and response.content:
                for block in response.content:
                    if block.type == "text":
                        content += block.text
            else:
                self.logger.warning("Anthropic response is empty or malformed")

            return {"content": content}

        elif client_type == "openai":
            openai_messages = [
                {
                    "role": "system",
                    "content": "You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches.",
                }
            ]
            openai_messages.extend(summary_messages)

            # Try max_tokens and temperature first, fallback to max_completion_tokens without temperature if unsupported
            try:
                response = await client.chat.completions.create(
                    model=self.default_models["openai"],
                    messages=openai_messages,
                    max_tokens=5000,
                    temperature=0.2,
                )
            except Exception as e:
                if "max_tokens" in str(e) and "max_completion_tokens" in str(e):
                    # Retry with max_completion_tokens and no temperature for models that require it
                    response = await client.chat.completions.create(
                        model=self.default_models["openai"],
                        messages=openai_messages,
                        max_completion_tokens=5000,
                    )
                else:
                    raise

            # Safely extract content from response
            if response and hasattr(response, "choices") and response.choices:
                return {"content": response.choices[0].message.content or ""}
            else:
                self.logger.warning("OpenAI response is empty or malformed")
                return {"content": ""}

        elif client_type == "google":
            from google.genai import types

            # Convert messages to Gemini format
            system_instruction = "You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches."

            gemini_messages = []
            for msg in summary_messages:
                role = msg.get("role", "user")
                content = msg.get("content", "")

                # Convert role names: "assistant" -> "model"
                if role == "assistant":
                    role = "model"
                elif role not in ["user", "model"]:
                    role = "user"

                gemini_messages.append(
                    types.Content(role=role, parts=[types.Part.from_text(text=content)])
                )

            config = types.GenerateContentConfig(
                max_output_tokens=5000,
                temperature=0.2,
                system_instruction=system_instruction,
            )

            response = await client.aio.models.generate_content(
                model=self.default_models.get("google", "gemini-2.0-flash"),
                contents=gemini_messages,
                config=config,
            )

            # Extract content from Gemini response
            content = ""
            if response and hasattr(response, "candidates") and response.candidates:
                candidate = response.candidates[0]
                if hasattr(candidate, "content") and candidate.content:
                    if hasattr(candidate.content, "parts") and candidate.content.parts:
                        for part in candidate.content.parts:
                            if hasattr(part, "text") and part.text:
                                content += part.text

            if not content:
                self.logger.warning("Google response is empty or malformed")

            return {"content": content}

        else:
            raise ValueError(f"Unsupported client type: {client_type}")

    def start_new_round(self, iteration: Optional[int] = None):
        """Begin a new dialogue round and clear the per-round tool results.

        Without ``iteration`` the round counter is incremented by one and the
        new round number is logged. With ``iteration`` the counter is set to
        that value (no log message).

        Args:
            iteration: Optional iteration number from workflow to sync with current_round
        """
        if iteration is None:
            # No workflow iteration supplied: advance our own counter.
            self.current_round += 1
            self.logger.info(f"🔄 Started new round {self.current_round}")
        else:
            # Mirror the workflow's iteration number.
            self.current_round = iteration

        # Only the tool results are reset here; last_write_file_detected and
        # should_clear_memory_next are left untouched by this method.
        self.current_round_tool_results = []

    def record_tool_result(
        self, tool_name: str, tool_input: Dict[str, Any], tool_result: Any
    ):
        """
        Store a tool call for the current round and flag write_file calls.

        A "write_file" call sets both ``last_write_file_detected`` and
        ``should_clear_memory_next`` to True. Only tools in the tracked list
        below are appended to ``self.current_round_tool_results``; each record
        holds the tool name, input, result and a ``time.time()`` timestamp.
        Calls to any other tool are ignored.

        Args:
            tool_name: Name of the tool called
            tool_input: Input parameters for the tool
            tool_result: Result returned by the tool
        """
        if tool_name == "write_file":
            self.last_write_file_detected = True
            self.should_clear_memory_next = True

        tracked_tools = (
            "read_code_mem",  # Read code summary from implement_code_summary.md
            "read_file",  # Read file contents
            "write_file",  # Write file contents
            "execute_python",  # Execute Python code
            "execute_bash",  # Execute bash commands
            "search_code",  # Search code patterns
            "search_reference_code",  # Search reference code
            "get_file_structure",  # Get file structure
        )
        if tool_name not in tracked_tools:
            return

        self.current_round_tool_results.append(
            {
                "tool_name": tool_name,
                "tool_input": tool_input,
                "tool_result": tool_result,
                "timestamp": time.time(),
            }
        )

    def should_use_concise_mode(self) -> bool:
        """
        Report whether concise memory mode is active.

        Returns:
            The current value of ``self.last_write_file_detected``, which
            record_tool_result sets to True on a "write_file" call
        """
        concise_mode_active = self.last_write_file_detected
        return concise_mode_active

    def create_concise_messages(
        self,
        system_prompt: str,
        messages: List[Dict[str, Any]],
        files_implemented: int,
    ) -> List[Dict[str, Any]]:
        """
        Create concise message list for LLM input
        NEW LOGIC: Always clear after write_file, keep system_prompt + initial_plan + current round tools

        Args:
            system_prompt: Current system prompt
            messages: Original message list
            files_implemented: Number of files implemented so far

        Returns:
            Concise message list containing only essential information
        """
        if not self.last_write_file_detected:
            # Before any write_file, use normal flow
            self.logger.info(
                "🔄 Using normal conversation flow (before any write_file)"
            )
            return messages

        # After write_file detection, use concise approach with clean slate
        self.logger.info(
            f"🎯 Using CONCISE memory mode - Clear slate after write_file, Round {self.current_round}"
        )

        concise_messages = []

        # Get formatted file lists
        file_lists = self.get_formatted_files_lists()
        implemented_files_list = file_lists["implemented"]
        unimplemented_files_list = file_lists["unimplemented"]

        # Debug output for unimplemented files (clean format without dashes)
        unimplemented_files = self.get_unimplemented_files()
        print("✅ Unimplemented Files:")
        for file_path in unimplemented_files:
            print(f"{file_path}")
        if self.current_next_steps.strip():
            print(f"\n📋 {self.current_next_steps}")

        # 1. Add initial plan message (always preserved)
        initial_plan_message = {
            "role": "user",
            "content": f"""**Task: Implement code based on the following reproduction plan**

**Code Reproduction Plan:**
{self.initial_plan}

**Working Directory:** Current workspace

**All Previously Implemented Files:**
{implemented_files_list}

**Current Status:** {files_implemented} files implemented

**Remaining Files to Implement:**
{unimplemented_files_list}

**IMPORTANT:** If the remaining files list shows "All files implemented!", you MUST reply with "All files implemented" to complete the task. Do NOT continue calling tools.

**Objective:** {"Reply 'All files implemented' to finish" if not unimplemented_files else "Continue implementation by analyzing dependencies and implementing the next required file according to the plan's priority order."}""",
        }

        # Append Next Steps information if available
        # if self.current_next_steps.strip():
        #     initial_plan_message["content"] += (
        #         f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"
        #     )

        concise_messages.append(initial_plan_message)

        # 2. Add Knowledge Base
        knowledge_base_message = {
            "role": "user",
            "content": f"""**Below is the Knowledge Base of the LATEST implemented code file:**
{self._read_code_knowledge_base()}

**Development Cycle - START HERE:**

**FIRST - Check completion status:**
- If "Remaining Files to Implement" above shows "All files implemented!", reply "All files implemented" immediately

**For NEW file implementation (if remaining files exist):**
Write_file can be used to implement the new component

**Remember:** Stop and declare completion when all files are done!""",
        }
        if self.current_next_steps.strip():
            knowledge_base_message["content"] += (
                f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"
            )
        concise_messages.append(knowledge_base_message)

        #         # 3. Add current tool results (essential information for next file generation)
        #         if self.current_round_tool_results:
        #             tool_results_content = self._format_tool_results()

        #             # # Append Next Steps information if available
        #             # if self.current_next_steps.strip():
        #             #     tool_results_content += f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"

        #             tool_results_message = {
        #                 "role": "user",
        #                 "content": f"""**Current Tool Results:**
        # {tool_results_content}""",
        #             }
        #             concise_messages.append(tool_results_message)
        #         else:
        #             # If no tool results yet, add guidance for next steps
        #             guidance_content = f"""**Current Round:** {self.current_round}

        # **Development Cycle - START HERE:**

        # **For NEW file implementation:**
        # Write_file can be used to implement the new component"""

        #             # # Append Next Steps information if available (even when no tool results)
        #             # if self.current_next_steps.strip():
        #             #     guidance_content += f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"

        #             guidance_message = {
        #                 "role": "user",
        #                 "content": guidance_content,
        #             }
        #             concise_messages.append(guidance_message)
        #         # **Available Essential Tools:** read_code_mem, write_file, execute_python, execute_bash
        #         # **Remember:** Start with read_code_mem when implementing NEW files to understand existing code. When all files are implemented, focus on testing and completion. Implement according to the original paper's specifications - any reference code is for inspiration only."""
        #         # self.logger.info(f"✅ Concise messages created: {len(concise_messages)} messages (original: {len(messages)})")
        return concise_messages

    def _read_code_knowledge_base(self) -> Optional[str]:
        """
        Read the implement_code_summary.md file as code knowledge base
        Returns all content from the file

        Returns:
            Full content of the file if it exists, None otherwise
        """
        try:
            if os.path.exists(self.code_summary_path):
                with open(self.code_summary_path, "r", encoding="utf-8") as f:
                    content = f.read().strip()

                if content:
                    # Return all content instead of just the latest entry
                    return content
                else:
                    return None
            else:
                return None

        except Exception as e:
            self.logger.error(f"Failed to read code knowledge base: {e}")
            return None

    def _extract_latest_implementation_entry(self, content: str) -> Optional[str]:
        """
        Extract the latest/final implementation entry from the implement_code_summary.md content
        Uses a simpler approach to find the last implementation section

        Args:
            content: Full content of implement_code_summary.md

        Returns:
            Latest implementation entry content, or None if not found
        """
        try:
            import re

            # Pattern to match the start of implementation sections
            section_pattern = (
                r"={80}\s*\n## IMPLEMENTATION File .+?; ROUND \d+\s*\n={80}"
            )

            # Find all implementation section starts
            matches = list(re.finditer(section_pattern, content))

            if not matches:
                # No implementation sections found
                lines = content.split("\n")
                fallback_content = (
                    "\n".join(lines[:10]) + "\n... (truncated for brevity)"
                    if len(lines) > 10
                    else content
                )
                self.logger.info(
                    "📖 No implementation sections found, using fallback content"
                )
                return fallback_content

            # Get the start position of the last implementation section
            last_match = matches[-1]
            start_pos = last_match.start()

            # Take everything from the last section start to the end of content
            latest_entry = content[start_pos:].strip()

            # self.logger.info(f"📖 Extracted latest implementation entry from knowledge base")
            # print(f"DEBUG: Extracted content length: {len(latest_entry)}")
            # print(f"DEBUG: First 200 chars: {latest_entry[:]}")

            return latest_entry

        except Exception as e:
            self.logger.error(f"Failed to extract latest implementation entry: {e}")
            # Return last 1000 characters as fallback
            return content[-500:] if len(content) > 500 else content

    def _format_tool_results(self) -> str:
        """
        Format current round tool results for LLM input

        Returns:
            Formatted string of tool results
        """
        if not self.current_round_tool_results:
            return "No tool results in current round."

        formatted_results = []

        for result in self.current_round_tool_results:
            tool_name = result["tool_name"]
            tool_input = result["tool_input"]
            tool_result = result["tool_result"]

            # Format based on tool type
            if tool_name == "read_code_mem":
                file_path = tool_input.get("file_path", "unknown")
                formatted_results.append(f"""
**read_code_mem Result for {file_path}:**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "read_file":
                file_path = tool_input.get("file_path", "unknown")
                formatted_results.append(f"""
**read_file Result for {file_path}:**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "write_file":
                file_path = tool_input.get("file_path", "unknown")
                formatted_results.append(f"""
**write_file Result for {file_path}:**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "execute_python":
                code_snippet = (
                    tool_input.get("code", "")[:50] + "..."
                    if len(tool_input.get("code", "")) > 50
                    else tool_input.get("code", "")
                )
                formatted_results.append(f"""
**execute_python Result (code: {code_snippet}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "execute_bash":
                command = tool_input.get("command", "unknown")
                formatted_results.append(f"""
**execute_bash Result (command: {command}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "search_code":
                pattern = tool_input.get("pattern", "unknown")
                file_pattern = tool_input.get("file_pattern", "")
                formatted_results.append(f"""
**search_code Result (pattern: {pattern}, files: {file_pattern}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "search_reference_code":
                target_file = tool_input.get("target_file", "unknown")
                keywords = tool_input.get("keywords", "")
                formatted_results.append(f"""
**search_reference_code Result for {target_file} (keywords: {keywords}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "get_file_structure":
                directory = tool_input.get(
                    "directory_path", tool_input.get("path", "current")
                )
                formatted_results.append(f"""
**get_file_structure Result for {directory}:**
{self._format_tool_result_content(tool_result)}
""")

        return "\n".join(formatted_results)

    def _format_tool_result_content(self, tool_result: Any) -> str:
        """
        Format tool result content for display

        Args:
            tool_result: Tool result to format

        Returns:
            Formatted string representation
        """
        if isinstance(tool_result, str):
            # Try to parse as JSON for better formatting
            try:
                result_data = json.loads(tool_result)
                if isinstance(result_data, dict):
                    # Format key information
                    if result_data.get("status") == "summary_found":
                        return (
                            f"Summary found:\n{result_data.get('summary_content', '')}"
                        )
                    elif result_data.get("status") == "no_summary":
                        return "No summary available"
                    else:
                        return json.dumps(result_data, indent=2)
                else:
                    return str(result_data)
            except json.JSONDecodeError:
                return tool_result
        else:
            return str(tool_result)

    def get_memory_statistics(self, files_implemented: int = 0) -> Dict[str, Any]:
        """
        Build a snapshot of the agent's memory and file-tracking state.

        Args:
            files_implemented: Caller-supplied count, echoed back under
                "implemented_files_tracked".

        Returns:
            Dictionary with round/flag state, the current round's tool usage,
            Next Steps availability, and planned/implemented/remaining file
            lists together with a completion percentage.
        """
        pending_files = self.get_unimplemented_files()
        round_results = self.current_round_tool_results
        next_steps = self.current_next_steps
        planned_files = self.all_files_list
        finished_files = self.implemented_files

        stats: Dict[str, Any] = {
            "last_write_file_detected": self.last_write_file_detected,
            "should_clear_memory_next": self.should_clear_memory_next,
            "current_round": self.current_round,
            "concise_mode_active": self.should_use_concise_mode(),
            "current_round_tool_results": len(round_results),
            "essential_tools_recorded": [r["tool_name"] for r in round_results],
            "implemented_files_tracked": files_implemented,
            "implemented_files_list": finished_files.copy(),
            "phases_parsed": len(self.phase_structure),
            "next_steps_available": bool(next_steps.strip()),
            "next_steps_length": len(next_steps.strip()) if next_steps else 0,
        }

        # File tracking statistics; the percentage is 0 when no files are planned.
        if planned_files:
            progress = len(finished_files) / len(planned_files) * 100
        else:
            progress = 0

        stats["total_files_in_plan"] = len(planned_files)
        stats["files_implemented_count"] = len(finished_files)
        stats["files_remaining_count"] = len(pending_files)
        stats["all_files_list"] = planned_files.copy()
        stats["unimplemented_files_list"] = pending_files
        stats["implementation_progress_percent"] = progress
        return stats

    def get_implemented_files(self) -> List[str]:
        """Return a shallow copy of the implemented-files list."""
        return list(self.implemented_files)

    def get_all_files_list(self) -> List[str]:
        """Return a shallow copy of the list of all files tracked for implementation."""
        return list(self.all_files_list)

    def refresh_files_list_from_directory(self) -> bool:
        """
        Rebuild the tracked file list by scanning the generated code directory.

        Useful when the directory structure changed after initialization.

        Returns:
            True if the list was replaced with the files found on disk.
            False if the directory is missing or the scan found no files; the
            current list is then left untouched and a warning is logged.
        """
        scanned = (
            self._extract_files_from_generated_directory()
            if os.path.exists(self.code_directory)
            else None
        )

        if not scanned:
            self.logger.warning("Cannot refresh from directory, keeping current list")
            return False

        previous_total = len(self.all_files_list)
        self.all_files_list = scanned
        current_total = len(self.all_files_list)
        self.logger.info(
            f"🔄 Files list refreshed from directory: {previous_total} → {current_total} files"
        )
        return True

    def get_unimplemented_files(self) -> List[str]:
        """
        List the planned files that have no matching implemented file yet.

        Paths are compared after converting backslashes to "/" and stripping
        leading/trailing slashes. A planned file counts as implemented when an
        implemented path is identical to it, or when one of the two paths is a
        trailing portion of the other starting at a "/" boundary (so
        "src/a.py" matches "project/src/a.py" but "xa.py" does not match
        "a.py").

        Returns:
            Entries of ``self.all_files_list`` (original spelling and order)
            that still need to be implemented.
        """

        def normalize(path: str) -> str:
            return path.replace("\\", "/").strip("/")

        # Normalise the implemented paths once rather than once per planned file.
        implemented_paths = [normalize(path) for path in self.implemented_files]

        def is_implemented(plan_file: str) -> bool:
            plan_path = normalize(plan_file)
            # Requiring the "/" prefix keeps a match from starting in the
            # middle of a file or directory name.
            return any(
                plan_path == impl_path
                or plan_path.endswith("/" + impl_path)
                or impl_path.endswith("/" + plan_path)
                for impl_path in implemented_paths
            )

        return [f for f in self.all_files_list if not is_implemented(f)]

    def get_formatted_files_lists(self) -> Dict[str, str]:
        """
        Render the implemented and unimplemented files as bullet lists.

        Returns:
            Dictionary with keys 'implemented' and 'unimplemented'; each value
            is one "- <path>" line per file, or a placeholder line when the
            corresponding list is empty.
        """

        def as_bullets(paths, placeholder: str) -> str:
            if not paths:
                return placeholder
            return "\n".join(f"- {path}" for path in paths)

        return {
            "implemented": as_bullets(self.implemented_files, "- None yet"),
            "unimplemented": as_bullets(
                self.get_unimplemented_files(), "- All files implemented!"
            ),
        }

    def get_current_next_steps(self) -> str:
        """Return the Next Steps text currently held by the agent."""
        return self.current_next_steps

    def clear_next_steps(self):
        """Reset the stored Next Steps text to an empty string.

        An info message is logged only when there was non-whitespace content
        to discard.
        """
        had_content = bool(self.current_next_steps.strip())
        if had_content:
            self.logger.info("🧹 Next Steps information cleared")
        self.current_next_steps = ""

    def set_next_steps(self, next_steps: str):
        """Store ``next_steps`` as the current Next Steps text and log its stripped length."""
        self.current_next_steps = next_steps
        char_count = len(next_steps.strip())
        self.logger.info(f"📝 Next Steps manually set ({char_count} chars)")

    def should_trigger_memory_optimization(
        self, messages: List[Dict[str, Any]], files_implemented: int = 0
    ) -> bool:
        """
        Report whether the concise memory optimization should run now.

        The decision depends only on the ``should_clear_memory_next`` flag;
        both arguments are accepted but not consulted.

        Args:
            messages: Current message list (unused)
            files_implemented: Number of files implemented so far (unused)

        Returns:
            True if the clear-memory flag is set, otherwise False
        """
        return bool(self.should_clear_memory_next)

    def apply_memory_optimization(
        self, system_prompt: str, messages: List[Dict[str, Any]], files_implemented: int
    ) -> List[Dict[str, Any]]:
        """
        Replace the message history with its concise form when the clear flag is set.

        If ``should_clear_memory_next`` is not set, the input list is returned
        unchanged. Otherwise the concise messages are built via
        ``create_concise_messages``, the flag is reset, and a one-line
        compression summary is printed.

        Args:
            system_prompt: Current system prompt
            messages: Original message list
            files_implemented: Number of files implemented so far

        Returns:
            The original list, or the concise replacement
        """
        if not self.should_clear_memory_next:
            return messages

        optimized_messages = self.create_concise_messages(
            system_prompt, messages, files_implemented
        )

        # The flag is one-shot: consume it so the next round is left alone.
        self.should_clear_memory_next = False

        before = len(messages)
        after = len(optimized_messages)
        compression_ratio = (before - after) / before * 100 if messages else 0
        print(
            f"🎯 CONCISE optimization applied: {before} → {after} messages ({compression_ratio:.1f}% compression)"
        )

        return optimized_messages

    def clear_current_round_tool_results(self):
        """Discard the tool results recorded for the current round and log the reset."""
        # Rebind to a fresh list rather than emptying the old one in place.
        self.current_round_tool_results = []
        self.logger.info("🧹 Current round tool results cleared")

    def debug_concise_state(self, files_implemented: int = 0):
        """
        Print a human-readable dump of the agent's current state to stdout.

        The report covers the flags and counters from
        ``get_memory_statistics``, the implemented-files list, whether the
        code summary file exists, the Next Steps text, file-tracking progress,
        and how often each essential tool appears in the current round.

        Args:
            files_implemented: Passed through to ``get_memory_statistics``
        """
        stats = self.get_memory_statistics(files_implemented)
        rule = "=" * 60

        print(rule)
        print("🎯 CONCISE MEMORY AGENT STATE (Write-File-Based)")
        print(rule)

        # Simple "label: value" lines taken straight from the statistics.
        for label, key in (
            ("Last write_file detected", "last_write_file_detected"),
            ("Should clear memory next", "should_clear_memory_next"),
            ("Files implemented", "implemented_files_tracked"),
            ("Current round", "current_round"),
            ("Concise mode active", "concise_mode_active"),
            ("Current round tool results", "current_round_tool_results"),
            ("Essential tools recorded", "essential_tools_recorded"),
        ):
            print(f"{label}: {stats[key]}")

        print(f"Implemented files tracked: {len(self.implemented_files)}")
        print(f"Implemented files list: {self.implemented_files}")
        print(f"Code summary file exists: {os.path.exists(self.code_summary_path)}")
        print(f"Next Steps available: {stats['next_steps_available']}")
        print(f"Next Steps length: {stats['next_steps_length']} chars")
        if self.current_next_steps.strip():
            print(f"Next Steps preview: {self.current_next_steps[:100]}...")

        print("")
        print("📋 FILE TRACKING:")
        print(f"  Total files in plan: {stats['total_files_in_plan']}")
        print(f"  Files implemented: {stats['files_implemented_count']}")
        print(f"  Files remaining: {stats['files_remaining_count']}")
        print(f"  Progress: {stats['implementation_progress_percent']:.1f}%")
        remaining = stats["unimplemented_files_list"]
        if remaining:
            print(f"  Next possible files: {remaining[:3]}...")

        print("")
        print(
            "📊 NEW LOGIC: write_file → clear memory → accumulate tools → next write_file"
        )
        print("📊 NEXT STEPS: Stored separately from file, included in tool results")
        print(
            "📊 FILE TRACKING: All files extracted from plan, unimplemented files guide LLM decisions"
        )
        print("📊 Essential Tools Tracked:")
        for tool in (
            "read_code_mem",
            "read_file",
            "write_file",
            "execute_python",
            "execute_bash",
            "search_code",
            "search_reference_code",
            "get_file_structure",
        ):
            matching = [
                r for r in self.current_round_tool_results if r["tool_name"] == tool
            ]
            print(f"  - {tool}: {len(matching)} calls")
        print(rule)


================================================
FILE: workflows/agents/memory_agent_concise_index.py
================================================
"""
Concise Memory Agent for Code Implementation Workflow

This memory agent implements a focused approach:
1. Before first file: Normal conversation flow
2. After first file: Keep only system_prompt + initial_plan + current round tool results
3. Clean slate for each new code file generation

Key Features:
- Preserves system prompt and initial plan always
- After first file generation, discards previous conversation history
- Keeps only current round tool results from essential tools:
  * read_code_mem, read_file, write_file
  * execute_python, execute_bash
  * search_code, search_reference_code, get_file_structure
- Provides clean, focused input for next write_file operation
"""

import json
import logging
import os
import time
from datetime import datetime
from typing import Dict, Any, List, Optional


class ConciseMemoryAgent:
    """
    Concise Memory Agent - Focused Information Retention

    Core Philosophy:
    - Preserve essential context (system prompt + initial plan)
    - After first file generation, use clean slate approach
    - Keep only current round tool results from all essential MCP tools
    - Remove conversational clutter and previous tool calls

    Essential Tools Tracked:
    - File Operations: read_code_mem, read_file, write_file
    - Code Analysis: search_code, search_reference_code, get_file_structure
    - Execution: execute_python, execute_bash
    """

    def __init__(
        self,
        initial_plan_content: str,
        logger: Optional[logging.Logger] = None,
        target_directory: Optional[str] = None,
        default_models: Optional[Dict[str, str]] = None,
        code_directory: Optional[str] = None,
    ):
        """
        Initialize Concise Memory Agent

        Args:
            initial_plan_content: Content of initial_plan.txt
            logger: Logger instance
            target_directory: Target directory for saving summaries
            default_models: Default models configuration from workflow
            code_directory: Generated code directory path (e.g., target_directory/generate_code)
        """
        self.logger = logger or self._create_default_logger()
        self.initial_plan = initial_plan_content

        # Store default models configuration
        self.default_models = default_models or {
            "anthropic": "claude-sonnet-4-20250514",
            "openai": "o3-mini",
            "google": "gemini-2.0-flash",
        }

        # Memory state tracking - new logic: trigger after each write_file
        self.last_write_file_detected = (
            False  # Track if write_file was called in current iteration
        )
        self.should_clear_memory_next = False  # Flag to clear memory in next round
        self.current_round = 0

        # Parse phase structure from initial plan
        self.phase_structure = self._parse_phase_structure()

        # Memory configuration
        if target_directory:
            self.save_path = target_directory
        else:
            self.save_path = "./deepcode_lab/papers/1/"

        # Store code directory for file extraction
        self.code_directory = code_directory or os.path.join(
            self.save_path, "generate_code"
        )

        # Extract all files - prioritize generated directory over plan parsing
        self.all_files_list = self._extract_all_files()

        # Code summary file path
        self.code_summary_path = os.path.join(
            self.save_path, "implement_code_summary.md"
        )

        # Current round tool results storage
        self.current_round_tool_results = []

        # Track all implemented files
        self.implemented_files = []

        # Store Next Steps information temporarily (not saved to file)
        self.current_next_steps = ""

        self.logger.info(
            f"Concise Memory Agent initialized with target directory: {self.save_path}"
        )
        self.logger.info(f"Code directory: {self.code_directory}")
        self.logger.info(f"Code summary will be saved to: {self.code_summary_path}")
        # self.logger.info(f"🤖 Using models - Anthropic: {self.default_models['anthropic']}, OpenAI: {self.default_models['openai']}")
        self.logger.info(
            "📝 NEW LOGIC: Memory clearing triggered after each write_file call"
        )

    def _create_default_logger(self) -> logging.Logger:
        """Create default logger"""
        logger = logging.getLogger(f"{__name__}.ConciseMemoryAgent")
        logger.setLevel(logging.INFO)
        return logger

    def _parse_phase_structure(self) -> Dict[str, List[str]]:
        """Parse implementation phases from initial plan"""
        try:
            phases = {}
            lines = self.initial_plan.split("\n")
            current_phase = None

            for line in lines:
                if "Phase" in line and ":" in line:
                    # Extract phase name
                    phase_parts = line.split(":")
                    if len(phase_parts) >= 2:
                        current_phase = phase_parts[0].strip()
                        phases[current_phase] = []
                elif current_phase and line.strip().startswith("-"):
                    # This is a file in the current phase
                    file_line = line.strip()[1:].strip()
                    if file_line.startswith("`") and file_line.endswith("`"):
                        file_name = file_line[1:-1]
                        phases[current_phase].append(file_name)
                elif current_phase and not line.strip():
                    # Empty line might indicate end of phase
                    continue
                elif current_phase and line.strip().startswith("###"):
                    # New section, end current phase
                    current_phase = None

            return phases

        except Exception as e:
            self.logger.warning(f"Failed to parse phase structure: {e}")
            return {}

    def _extract_all_files(self) -> List[str]:
        """
        Extract all code files - prioritizes generated directory over plan parsing

        Strategy:
        1. First try to extract from the generated code directory (reliable)
        2. Fall back to plan parsing if directory doesn't exist yet

        Returns:
            List of all file paths that should be implemented
        """
        # Try extracting from generated directory first (more reliable)
        if os.path.exists(self.code_directory):
            files_from_dir = self._extract_files_from_generated_directory()
            if files_from_dir:
                self.logger.info(
                    f"📁 Extracted {len(files_from_dir)} files from generated directory"
                )
                return files_from_dir

        # Fall back to plan parsing
        self.logger.info(
            "📁 Generated directory not found, extracting from plan (less reliable)"
        )
        return self._extract_all_files_from_plan()

    def _extract_files_from_generated_directory(self) -> List[str]:
        """
        Extract all code files from the generated code directory
        This is more reliable than parsing the LLM-generated plan

        Returns:
            List of relative file paths within the code directory
        """
        code_files = []

        # Define code file extensions to track
        code_extensions = {
            ".py",
            ".js",
            ".ts",
            ".jsx",
            ".tsx",
            ".vue",
            ".html",
            ".css",
            ".scss",
            ".sass",
            ".less",
            ".json",
            ".yaml",
            ".yml",
            ".toml",
            ".xml",
            ".ini",
            ".cfg",
            ".md",
            ".rst",
            ".txt",
            ".sh",
            ".bash",
            ".zsh",
            ".bat",
            ".ps1",
            ".cmd",
            ".c",
            ".cpp",
            ".h",
            ".hpp",
            ".cc",
            ".cxx",
            ".java",
            ".kt",
            ".scala",
            ".go",
            ".rs",
            ".php",
            ".rb",
            ".pl",
            ".lua",
            ".r",
            ".sql",
        }

        # Files and directories to exclude
        exclude_patterns = {
            "__pycache__",
            ".pyc",
            "node_modules",
            ".git",
            ".vscode",
            ".idea",
            "dist",
            "build",
            "output",
            ".egg-info",
            "venv",
            ".venv",
            "env",
            ".env",
        }

        try:
            for root, dirs, files in os.walk(self.code_directory):
                # Filter out excluded directories
                dirs[:] = [
                    d
                    for d in dirs
                    if d not in exclude_patterns and not d.startswith(".")
                ]

                for file in files:
                    # Skip hidden files and excluded patterns
                    if file.startswith("."):
                        continue

                    # Check if file has a code extension
                    has_code_ext = any(
                        file.lower().endswith(ext) for ext in code_extensions
                    )
                    if not has_code_ext:
                        continue

                    # Get full path and convert to relative path
                    full_path = os.path.join(root, file)
                    relative_path = os.path.relpath(full_path, self.code_directory)

                    # Normalize path separators
                    relative_path = relative_path.replace(os.sep, "/")

                    code_files.append(relative_path)

            # Sort for consistency
            code_files = sorted(code_files)

            if code_files:
                self.logger.info(f"📄 Found {len(code_files)} code files in directory")
                self.logger.info(f"📄 Sample files: {code_files[:3]}...")

            return code_files

        except Exception as e:
            self.logger.error(f"Failed to extract files from directory: {e}")
            return []

    def _extract_all_files_from_plan(self) -> List[str]:
        """
        Extract all file paths from the file_structure section in initial plan
        Handles multiple formats: tree structure, YAML, and simple lists

        Returns:
            List of all file paths that should be implemented
        """
        try:
            lines = self.initial_plan.split("\n")
            files = []

            # Method 1: Try to extract from tree structure in file_structure section
            files.extend(self._extract_from_tree_structure(lines))

            # Method 2: If no files found, try to extract from simple list format
            if not files:
                files.extend(self._extract_from_simple_list(lines))

            # Method 3: If still no files, try to extract from anywhere in the plan
            if not files:
                files.extend(self._extract_from_plan_content(lines))

            # Clean and validate file paths
            cleaned_files = self._clean_and_validate_files(files)

            # Log the extracted files
            self.logger.info(
                f"📁 Extracted {len(cleaned_files)} files from initial plan"
            )
            if cleaned_files:
                self.logger.info(f"📁 Sample files: {cleaned_files[:3]}...")

            return cleaned_files

        except Exception as e:
            self.logger.error(f"Failed to extract files from initial plan: {e}")
            return []

    def _extract_from_tree_structure(self, lines: List[str]) -> List[str]:
        """
        Extract files from tree structure format - Advanced algorithm with multi-strategy approach

        Strategy:
        1. Precise indentation-based depth calculation
        2. Smart directory vs file detection using multiple heuristics
        3. Robust path stack management with depth tracking
        4. Fallback to regex pattern matching if tree parsing fails
        """
        files = []
        in_file_structure = False

        # Enhanced path tracking: store (depth, name) pairs
        path_stack = []  # [(depth, dir_name), ...]
        root_dir = None

        # Track the base indentation of tree structure
        base_indent = None

        for line_num, line in enumerate(lines):
            # === Section Boundary Detection ===
            if "file_structure:" in line or "file_structure |" in line:
                in_file_structure = True
                continue

            # End of file_structure section (next YAML key without indentation)
            if (
                in_file_structure
                and line.strip()
                and not line.startswith(" ")
                and ":" in line
            ):
                break

            if not in_file_structure:
                continue

            if not line.strip():
                continue

            # Skip YAML comments and keys that are clearly not files
            stripped = line.strip()
            if stripped.startswith("#") or (
                stripped.endswith(":") and "/" not in stripped
            ):
                continue

            # === Root Directory Detection ===
            # Pattern: "project-name/" at minimal indentation, no tree chars
            if stripped.endswith("/") and not any(
                c in line for c in ["├", "└", "│", "─"]
            ):
                indent = len(line) - len(line.lstrip())
                if indent <= 4:  # Root level
                    root_dir = stripped.rstrip("/")
                    path_stack = []
                    base_indent = None
                    self.logger.debug(f"🌳 Detected root directory: {root_dir}")
                    continue

            # === Tree Structure Line Detection ===
            has_tree_chars = any(c in line for c in ["├", "└", "│", "─"])
            if not has_tree_chars:
                continue

            # === Calculate Precise Depth ===
            # Method: Count the actual tree structure symbols to determine hierarchy
            indent = len(line) - len(line.lstrip())

            # Set base indent on first tree line
            if base_indent is None:
                base_indent = indent

            # Count tree depth indicators
            # Each "│   " or "    " block represents one level
            # "├── " or "└── " marks the current item
            tree_prefix = line[
                : line.find("├")
                if "├" in line
                else line.find("└")
                if "└" in line
                else len(line)
            ]

            # Count depth by analyzing tree prefix structure
            # Pattern: "    │   │   ├── filename" -> depth 3
            # Pattern: "    ├── filename" -> depth 1
            # Pattern: "    │   ├── filename" -> depth 2

            depth = 0
            i = 0
            while i < len(tree_prefix):
                # Look for pipe or tree junction
                if i + 4 <= len(tree_prefix):
                    chunk = tree_prefix[i : i + 4]
                    if "│" in chunk or all(c == " " for c in chunk):
                        depth += 1
                        i += 4
                    else:
                        i += 1
                else:
                    break

            # Fallback: use relative indentation
            if depth == 0:
                depth = max(1, (indent - base_indent) // 4 + 1)

            # === Clean and Extract Item Name ===
            item_name = line
            # Remove all tree characters
            for pattern in ["├──", "└──", "│", "├", "└", "─"]:
                item_name = item_name.replace(pattern, "")
            item_name = item_name.strip()

            # Remove inline comments
            if "#" in item_name:
                item_name = item_name.split("#")[0].strip()

            if not item_name or ":" in item_name:
                continue

            # === Smart Directory vs File Detection ===
            is_directory = self._is_directory(item_name)

            # === Update Path Stack ===
            # Remove items deeper than current depth
            path_stack = [(d, n) for d, n in path_stack if d < depth]

            if is_directory:
                dir_name = item_name.rstrip("/")
                path_stack.append((depth, dir_name))
                self.logger.debug(f"  {'  ' * depth}📁 {dir_name} (depth={depth})")
            else:
                # Construct full file path
                path_parts = [root_dir] if root_dir else []
                path_parts.extend([name for _, name in path_stack])
                path_parts.append(item_name)

                full_path = "/".join(path_parts)
                files.append(full_path)
                self.logger.debug(f"  {'  ' * depth}📄 {full_path}")

        return files

    def _is_directory(self, name: str) -> bool:
        """
        Advanced directory detection using multiple heuristics

        Returns True if the name represents a directory, False if it's a file
        """
        # Rule 1: Explicit directory marker
        if name.endswith("/"):
            return True

        # Rule 2: Has file extension -> definitely a file
        basename = name.split("/")[-1]
        if "." in basename:
            # Check if it's a known file extension
            known_extensions = [
                ".py",
                ".js",
                ".ts",
                ".jsx",
                ".tsx",
                ".vue",
                ".html",
                ".css",
                ".scss",
                ".sass",
                ".json",
                ".yaml",
                ".yml",
                ".xml",
                ".toml",
                ".md",
                ".txt",
                ".rst",
                ".sh",
                ".bat",
                ".ps1",
                ".c",
                ".cpp",
                ".h",
                ".hpp",
                ".java",
                ".go",
                ".rs",
                ".sql",
                ".db",
                ".env",
                ".gitignore",
                ".dockerignore",
                ".lock",
                ".sum",
                ".mod",
            ]
            if any(basename.lower().endswith(ext) for ext in known_extensions):
                return False

            # Has extension but not recognized -> might be config file, treat as file
            if basename.count(".") == 1:
                return False

        # Rule 3: Known special files without extensions
        special_files = [
            "README",
            "LICENSE",
            "CHANGELOG",
            "CONTRIBUTING",
            "Makefile",
            "Dockerfile",
            "Vagrantfile",
            "requirements.txt",
            "setup.py",
            "setup.cfg",
            "package.json",
            "package-lock.json",
            "Cargo.toml",
            "go.mod",
        ]
        if basename in special_files or basename.upper() in special_files:
            return False

        # Rule 4: Common directory names (even without trailing /)
        common_dirs = [
            "src",
            "lib",
            "app",
            "core",
            "api",
            "web",
            "client",
            "server",
            "config",
            "configs",
            "settings",
            "data",
            "datasets",
            "models",
            "model",
            "utils",
            "helpers",
            "common",
            "shared",
            "tests",
            "test",
            "testing",
            "__tests__",
            "docs",
            "documentation",
            "scripts",
            "bin",
            "tools",
            "assets",
            "static",
            "public",
            "resources",
            "components",
            "views",
            "pages",
            "routes",
            "services",
            "controllers",
            "handlers",
            "middleware",
            "middlewares",
            "types",
            "interfaces",
            "schemas",
            "experiments",
            "notebooks",
            "dist",
            "build",
            "output",
            "node_modules",
            "vendor",
            "packages",
            "__pycache__",
            ".git",
            ".vscode",
            "training",
            "evaluation",
            "inference",
        ]
        if basename.lower() in common_dirs:
            return True

        # Rule 5: Plural forms often indicate directories
        if basename.endswith("s") and len(basename) > 3:
            singular = basename[:-1]
            if singular in common_dirs:
                return True

        # Rule 6: Python package indicators
        if basename == "__init__.py":
            return False  # This is a file

        # Default: if no extension and not a known file, likely a directory
        return "." not in basename

    def _extract_from_simple_list(self, lines: List[str]) -> List[str]:
        """Extract files from simple list format (- filename)"""
        files = []

        for line in lines:
            line = line.strip()
            if line.startswith("- ") and not line.startswith('- "'):
                # Remove leading "- " and clean up
                filename = line[2:].strip()

                # Remove quotes if present
                if filename.startswith('"') and filename.endswith('"'):
                    filename = filename[1:-1]

                # Check if it looks like a file (has extension)
                if "." in filename and "/" in filename:
                    files.append(filename)

        return files

    def _extract_from_plan_content(self, lines: List[str]) -> List[str]:
        """
        Advanced fallback extraction: Extract files from anywhere in the plan content
        Uses multiple regex patterns and intelligent filtering
        """
        files = []
        import re

        # === Pattern 1: Standard file paths ===
        # Matches: path/to/file.py, src/model/apt_layer.py
        pattern1 = r"([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.[a-zA-Z0-9]+)"

        # === Pattern 2: Quoted file paths ===
        # Matches: "path/to/file.py", 'src/utils.py'
        pattern2 = r'["\']([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.[a-zA-Z0-9]+)["\']'

        # === Pattern 3: File paths with special characters ===
        # Matches: data/data_loader.py, __init__.py paths
        pattern3 = r"([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)*/__init__\.py)"
        pattern4 = r"([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.(?:py|js|ts|jsx|tsx|html|css|md|txt|json|yaml|yml|xml|sql|sh|bat))"

        # === Pattern 5: Backtick-wrapped paths (in code blocks) ===
        pattern5 = r"`([a-zA-Z0-9_\-]+(?:/[a-zA-Z0-9_\-]+)+\.[a-zA-Z0-9]+)`"

        all_patterns = [pattern1, pattern2, pattern3, pattern4, pattern5]

        # Collect all potential matches
        potential_files = set()

        for line in lines:
            # Skip comment-only lines
            stripped = line.strip()
            if stripped.startswith("#") and not ("/" in stripped and "." in stripped):
                continue

            # Apply all patterns
            for pattern in all_patterns:
                matches = re.findall(pattern, line)
                potential_files.update(matches)

        # === Filter and validate matches ===
        code_extensions = {
            ".py",
            ".js",
            ".ts",
            ".jsx",
            ".tsx",
            ".vue",
            ".html",
            ".css",
            ".scss",
            ".sass",
            ".less",
            ".json",
            ".yaml",
            ".yml",
            ".toml",
            ".xml",
            ".ini",
            ".cfg",
            ".md",
            ".rst",
            ".txt",
            ".sh",
            ".bash",
            ".zsh",
            ".bat",
            ".ps1",
            ".cmd",
            ".c",
            ".cpp",
            ".h",
            ".hpp",
            ".cc",
            ".cxx",
            ".java",
            ".kt",
            ".scala",
            ".go",
            ".rs",
            ".php",
            ".rb",
            ".pl",
            ".lua",
            ".r",
            ".sql",
            ".db",
            ".dockerfile",
            ".env",
            ".gitignore",
            ".lock",
            ".sum",
            ".mod",
        }

        for file_path in potential_files:
            # Must have path separator
            if "/" not in file_path:
                continue

            # Must have valid extension
            has_valid_ext = any(
                file_path.lower().endswith(ext) for ext in code_extensions
            )
            if not has_valid_ext:
                continue

            # Filter out obvious non-files
            if any(
                bad in file_path.lower()
                for bad in [
                    "http://",
                    "https://",
                    ".png",
                    ".jpg",
                    ".jpeg",
                    ".gif",
                    ".svg",
                    ".ico",
                ]
            ):
                continue

            # Must not be too short (avoid false positives)
            if len(file_path) < 5:
                continue

            # Path components should be reasonable
            parts = file_path.split("/")
            if any(len(part) == 0 for part in parts):
                continue

            files.append(file_path)

        # Sort for consistency
        files = sorted(list(set(files)))

        return files

    def _clean_and_validate_files(self, files: List[str]) -> List[str]:
        """
        Clean and validate extracted file paths - advanced filtering and deduplication

        Features:
        1. Remove duplicates while preserving order
        2. Normalize paths (handle ../,  ./, double slashes)
        3. Filter out non-code files
        4. Smart deduplication (recognize same file with different path prefixes)
        """
        cleaned_files = []
        seen_normalized = set()

        # Define code file extensions we want to track
        code_extensions = {
            ".py",
            ".js",
            ".ts",
            ".jsx",
            ".tsx",
            ".vue",
            ".html",
            ".css",
            ".scss",
            ".sass",
            ".less",
            ".json",
            ".yaml",
            ".yml",
            ".toml",
            ".xml",
            ".ini",
            ".cfg",
            ".md",
            ".rst",
            ".txt",
            ".sh",
            ".bash",
            ".zsh",
            ".bat",
            ".ps1",
            ".cmd",
            ".c",
            ".cpp",
            ".h",
            ".hpp",
            ".cc",
            ".cxx",
            ".java",
            ".kt",
            ".scala",
            ".go",
            ".rs",
            ".php",
            ".rb",
            ".pl",
            ".lua",
            ".r",
            ".sql",
            ".db",
            ".dockerfile",
            ".env",
            ".gitignore",
            ".lock",
            ".sum",
            ".mod",
        }

        for file_path in files:
            # === Step 1: Basic Cleaning ===
            cleaned_path = file_path.strip().strip('"').strip("'").strip("`")

            if not cleaned_path:
                continue

            # Remove leading/trailing slashes
            cleaned_path = cleaned_path.strip("/")

            # === Step 2: Path Normalization ===
            # Remove double slashes
            while "//" in cleaned_path:
                cleaned_path = cleaned_path.replace("//", "/")

            # Handle relative paths (remove ./ prefix)
            if cleaned_path.startswith("./"):
                cleaned_path = cleaned_path[2:]

            # === Step 3: Validate File Structure ===
            # Must have filename (not just directory)
            if not cleaned_path or "/" not in cleaned_path:
                # Single file without path - only accept if it has extension
                if "." not in cleaned_path:
                    continue

            # Extract basename
            basename = cleaned_path.split("/")[-1]

            # Skip directories (no file extension in basename)
            if "." not in basename:
                continue

            # === Step 4: Extension Validation ===
            # Only include files with code extensions
            has_code_extension = any(
                cleaned_path.lower().endswith(ext) for ext in code_extensions
            )
            if not has_code_extension:
                continue

            # === Step 5: Filter Invalid Patterns ===
            # Skip files that look like YAML keys or config entries
            if ":" in cleaned_path and not any(
                cleaned_path.endswith(ext) for ext in [".yaml", ".yml"]
            ):
                continue

            # Skip paths with invalid characters
            if any(
                char in cleaned_path for char in ['"', "'", "|", "<", ">", "*", "?"]
            ):
                continue

            # Skip obvious build/temp artifacts
            if any(
                part in cleaned_path
                for part in [
                    "__pycache__",
                    ".pyc",
                    "node_modules",
                    ".git/",
                    "dist/build",
                ]
            ):
                continue

            # === Step 6: Smart Deduplication ===
            # Normalize for comparison (lowercase, remove common prefixes)
            normalized_for_comparison = cleaned_path.lower()

            # Check if we've already seen this file (exact match)
            if normalized_for_comparison in seen_normalized:
                continue

            # Check for duplicate with different path (e.g., "src/model/apt_layer.py" vs "model/apt_layer.py")
            # Keep the longer (more specific) path
            is_duplicate = False
            paths_to_remove = []

            for existing_normalized in seen_normalized:
                # If current path is suffix of existing, it's a shorter version - skip it
                if existing_normalized.endswith("/" + normalized_for_comparison):
                    is_duplicate = True
                    break

                # If existing path is suffix of current, current is longer - replace existing
                if normalized_for_comparison.endswith("/" + existing_normalized):
                    paths_to_remove.append(existing_normalized)

            if is_duplicate:
                continue

            # Remove shorter versions
            for path_to_remove in paths_to_remove:
                seen_normalized.discard(path_to_remove)
                # Also remove from cleaned_files list
                cleaned_files = [
                    f for f in cleaned_files if f.lower() != path_to_remove
                ]

            # === Step 7: Add to Results ===
            seen_normalized.add(normalized_for_comparison)
            cleaned_files.append(cleaned_path)

        return sorted(cleaned_files)

    def record_file_implementation(
        self, file_path: str, implementation_content: str = ""
    ):
        """
        Register a file as implemented.

        The path is appended to ``self.implemented_files`` unless it is already
        listed; an info message is logged in either case.

        Args:
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file (accepted
                for interface compatibility; not used here)
        """
        already_tracked = file_path in self.implemented_files
        if not already_tracked:
            self.implemented_files.append(file_path)

        self.logger.info(f"📝 File implementation recorded: {file_path}")

    async def create_code_implementation_summary(
        self,
        client,
        client_type: str,
        file_path: str,
        implementation_content: str,
        files_implemented: int,
    ) -> str:
        """
        Produce and persist an LLM-written summary for a freshly written file.

        The file is first recorded as implemented, then the LLM is asked for a
        structured summary. The "next_steps" section of the reply is kept only
        in ``self.current_next_steps``; the remaining sections are formatted
        and appended to the summary file.

        Args:
            client: LLM client instance
            client_type: Type of LLM client ("anthropic" or "openai")
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
            files_implemented: Number of files implemented so far

        Returns:
            The formatted summary that was saved, or a fallback summary if any
            step raised an exception.
        """
        # Sections written to the summary file, in output order
        # ("next_steps" is intentionally not among them)
        persisted_keys = (
            "core_purpose",
            "public_interface",
            "internal_dependencies",
            "external_dependencies",
            "implementation_notes",
        )

        try:
            self.record_file_implementation(file_path, implementation_content)

            # Ask the LLM for a structured summary
            prompt_text = self._create_code_summary_prompt(
                file_path, implementation_content, files_implemented
            )
            reply = await self._call_llm_for_summary(
                client, client_type, [{"role": "user", "content": prompt_text}]
            )
            parsed = self._extract_summary_sections(reply.get("content", ""))

            # Next Steps live in memory only
            self.current_next_steps = parsed.get("next_steps", "")
            if self.current_next_steps:
                self.logger.info("📝 Next Steps stored temporarily (not saved to file)")

            # Concatenate the non-empty persisted sections
            persisted_body = "".join(
                parsed[key] + "\n\n" for key in persisted_keys if parsed.get(key)
            )

            formatted = self._format_code_implementation_summary(
                file_path, persisted_body.strip(), files_implemented
            )

            # Append to the accumulated summary file
            await self._save_code_summary_to_file(formatted, file_path)

            self.logger.info(f"Created and saved code summary for: {file_path}")
            return formatted

        except Exception as e:
            self.logger.error(
                f"Failed to create LLM-based code implementation summary: {e}"
            )
            # Fallback to simple summary
            return self._create_fallback_code_summary(
                file_path, implementation_content, files_implemented
            )

    def _create_code_summary_prompt(
        self, file_path: str, implementation_content: str, files_implemented: int
    ) -> str:
        """
        Create prompt for LLM to generate code implementation summary

        Args:
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
            files_implemented: Number of files implemented so far

        Returns:
            Prompt for LLM summarization
        """
        current_round = self.current_round

        # Get formatted file lists
        file_lists = self.get_formatted_files_lists()
        implemented_files_list = file_lists["implemented"]
        unimplemented_files_list = file_lists["unimplemented"]

        prompt = f"""You are an expert code implementation summarizer. Analyze the implemented code file and create a structured summary.

**🚨 CRITICAL: The files listed below are ALREADY IMPLEMENTED - DO NOT suggest them in Next Steps! 🚨**

**All Previously Implemented Files:**
{implemented_files_list}

**Remaining Unimplemented Files (choose ONLY from these for Next Steps):**
{unimplemented_files_list}

**Current Implementation Context:**
- **File Implemented**: {file_path}
- **Current Round**: {current_round}
- **Total Files Implemented**: {files_implemented}


**Initial Plan Reference:**
{self.initial_plan[:]}

**Implemented Code Content:**
```
{implementation_content[:]}
```

**Required Summary Format:**

**Core Purpose** (provide a general overview of the file's main responsibility):
- {{1-2 sentence description of file's main responsibility}}

**Public Interface** (what other files can use, if any):
- Class {{ClassName}}: {{purpose}} | Key methods: {{method_names}} | Constructor params: {{params}}
- Function {{function_name}}({{params}}): {{purpose}} -> {{return_type}}: {{purpose}}
- Constants/Types: {{name}}: {{value/description}}

**Internal Dependencies** (what this file imports/requires, if any):
- From {{module/file}}: {{specific_imports}}
- External packages: {{package_name}} - {{usage_context}}

**External Dependencies** (what depends on this file, if any):
- Expected to be imported by: {{likely_consumer_files}}
- Key exports used elsewhere: {{main_interfaces}}

**Implementation Notes**: (if any)
- Architecture decisions: {{key_choices_made}}
- Cross-File Relationships: {{how_files_work_together}}

**Next Steps**: List the code file (ONLY ONE) that will be implemented in the next round (MUST choose from "Remaining Unimplemented Files" above)
  Format: Code will be implemented: {{file_path}}
  **NEVER suggest any file from the "All Previously Implemented Files" list!**

**Instructions:**
- Be precise and concise
- Focus on function interfaces that other files will need
- Extract actual function signatures from the code
- **CRITICAL: For Next Steps, ONLY choose ONE file from the "Remaining Unimplemented Files" list above**
- **NEVER suggest implementing a file that is already in the implemented files list**
- Choose the next file based on logical dependencies and implementation order
- Use the exact format specified above

**Summary:**"""

        return prompt

    # TODO: The prompt is not good enough and needs to be improved
    # **Implementation Progress**: List the code file completed in current round and core implementation ideas
    #   Format: {{file_path}}: {{core implementation ideas}}

    # **Dependencies**: According to the File Structure and initial plan, list functions that may be called by other files
    #   Format: {{file_path}}: Function {{function_name}}: core ideas--{{ideas}}; Required parameters--{{params}}; Return parameters--{{returns}}
    #   Required packages: {{packages}}

    def _extract_summary_sections(self, llm_summary: str) -> Dict[str, str]:
        """
        Extract different sections from LLM-generated summary

        Args:
            llm_summary: Raw LLM-generated summary text

        Returns:
            Dictionary with extracted sections: core_purpose, public_interface, internal_dependencies,
            external_dependencies, implementation_notes, next_steps
        """
        sections = {
            "core_purpose": "",
            "public_interface": "",
            "internal_dependencies": "",
            "external_dependencies": "",
            "implementation_notes": "",
            "next_steps": "",
        }

        try:
            lines = llm_summary.split("\n")
            current_section = None
            current_content = []

            for line in lines:
                line_lower = line.lower().strip()

                # Check for section headers
                if "core purpose" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "core_purpose"
                    current_content = [line]  # Include the header
                elif "public interface" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "public_interface"
                    current_content = [line]  # Include the header
                elif "internal dependencies" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "internal_dependencies"
                    current_content = [line]  # Include the header
                elif "external dependencies" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "external_dependencies"
                    current_content = [line]  # Include the header
                elif "implementation notes" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "implementation_notes"
                    current_content = [line]  # Include the header
                elif "next steps" in line_lower:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "next_steps"
                    current_content = [line]  # Include the header
                else:
                    # Add content to current section
                    if current_section:
                        current_content.append(line)

            # Don't forget the last section
            if current_section and current_content:
                sections[current_section] = "\n".join(current_content).strip()

            self.logger.info(f"📋 Extracted sections: {list(sections.keys())}")

        except Exception as e:
            self.logger.error(f"Failed to extract summary sections: {e}")
            # Fallback: put everything in core_purpose
            sections["core_purpose"] = llm_summary

        return sections

    def _format_code_implementation_summary(
        self, file_path: str, llm_summary: str, files_implemented: int
    ) -> str:
        """
        Format the LLM-generated summary into the final structure

        Args:
            file_path: Path of the implemented file
            llm_summary: LLM-generated summary content
            files_implemented: Number of files implemented so far

        Returns:
            Formatted summary
        """
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # # Create formatted list of implemented files
        # implemented_files_list = (
        #     "\n".join([f"- {file}" for file in self.implemented_files])
        #     if self.implemented_files
        #     else "- None yet"
        # )

        #         formatted_summary = f"""# Code Implementation Summary
        # **All Previously Implemented Files:**
        # {implemented_files_list}
        # **Generated**: {timestamp}
        # **File Implemented**: {file_path}
        # **Total Files Implemented**: {files_implemented}

        # {llm_summary}

        # ---
        # *Auto-generated by Memory Agent*
        # """
        formatted_summary = f"""# Code Implementation Summary
**Generated**: {timestamp}
**File Implemented**: {file_path}

{llm_summary}

---
*Auto-generated by Memory Agent*
"""
        return formatted_summary

    def _create_fallback_code_summary(
        self, file_path: str, implementation_content: str, files_implemented: int
    ) -> str:
        """
        Create fallback summary when LLM is unavailable

        Args:
            file_path: Path of the implemented file
            implementation_content: Content of the implemented file
            files_implemented: Number of files implemented so far

        Returns:
            Fallback summary
        """
        # Create formatted list of implemented files
        implemented_files_list = (
            "\n".join([f"- {file}" for file in self.implemented_files])
            if self.implemented_files
            else "- None yet"
        )

        summary = f"""# Code Implementation Summary
**All Previously Implemented Files:**
{implemented_files_list}
**Generated**: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}
**File Implemented**: {file_path}
**Total Files Implemented**: {files_implemented}
**Summary failed to generate.**

---
*Auto-generated by Concise Memory Agent (Fallback Mode)*
"""
        return summary

    async def _save_code_summary_to_file(self, new_summary: str, file_path: str):
        """
        Append code implementation summary to implement_code_summary.md
        Accumulates all implementations with clear separators

        Args:
            new_summary: New summary content to append
            file_path: Path of the file for which the summary was generated
        """
        try:
            # Create directory if it doesn't exist
            os.makedirs(os.path.dirname(self.code_summary_path), exist_ok=True)

            # Check if file exists to determine if we need header
            file_exists = os.path.exists(self.code_summary_path)

            # Open in append mode to accumulate all implementations
            with open(self.code_summary_path, "a", encoding="utf-8") as f:
                if not file_exists:
                    # Write header for new file
                    f.write("# Code Implementation Progress Summary\n")
                    f.write("*Accumulated implementation progress for all files*\n\n")

                # Add clear separator between implementations
                f.write("\n" + "=" * 80 + "\n")
                f.write(
                    f"## IMPLEMENTATION File {file_path}; ROUND {self.current_round} \n"
                )
                f.write("=" * 80 + "\n\n")

                # Write the new summary
                f.write(new_summary)
                f.write("\n\n")

            self.logger.info(
                f"Appended LLM-based code implementation summary to: {self.code_summary_path}"
            )

        except Exception as e:
            self.logger.error(f"Failed to save code implementation summary: {e}")

    async def _call_llm_for_summary(
        self, client, client_type: str, summary_messages: List[Dict]
    ) -> Dict[str, Any]:
        """
        Request a code implementation summary from the selected LLM provider.

        This is used only for code implementation summaries, not for
        conversation summarization.

        Args:
            client: Provider client object; the attributes accessed on it
                depend on ``client_type``
            client_type: "anthropic", "openai" or "google"
            summary_messages: Role/content message dicts to send

        Returns:
            Dict with one key, "content", holding the text extracted from the
            response (empty string when no text could be extracted)

        Raises:
            ValueError: If ``client_type`` is none of the supported values
        """
        # Every provider receives the same instruction text
        summarizer_instruction = "You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches."

        if client_type == "anthropic":
            response = await client.messages.create(
                model=self.default_models["anthropic"],
                system=summarizer_instruction,
                messages=summary_messages,
                max_tokens=5000,
                temperature=0.2,
            )

            if not (response and hasattr(response, "content") and response.content):
                self.logger.warning("Anthropic response is empty or malformed")
                return {"content": ""}

            # Only text blocks contribute to the summary
            text = "".join(
                block.text for block in response.content if block.type == "text"
            )
            return {"content": text}

        if client_type == "openai":
            openai_messages = [
                {"role": "system", "content": summarizer_instruction},
                *summary_messages,
            ]

            # First attempt uses max_tokens + temperature; some models reject
            # max_tokens and ask for max_completion_tokens instead
            try:
                response = await client.chat.completions.create(
                    model=self.default_models["openai"],
                    messages=openai_messages,
                    max_tokens=5000,
                    temperature=0.2,
                )
            except Exception as e:
                error_text = str(e)
                if (
                    "max_tokens" not in error_text
                    or "max_completion_tokens" not in error_text
                ):
                    raise
                # Retry with max_completion_tokens and without temperature
                response = await client.chat.completions.create(
                    model=self.default_models["openai"],
                    messages=openai_messages,
                    max_completion_tokens=5000,
                )

            if not (response and hasattr(response, "choices") and response.choices):
                self.logger.warning("OpenAI response is empty or malformed")
                return {"content": ""}
            return {"content": response.choices[0].message.content or ""}

        if client_type == "google":
            from google.genai import types

            # Translate the chat messages into Gemini Content objects
            gemini_messages = []
            for msg in summary_messages:
                raw_role = msg.get("role", "user")
                text_part = msg.get("content", "")

                # Gemini only knows "user" and "model"; "assistant" maps to
                # "model" and anything else is sent as "user"
                if raw_role == "assistant":
                    gemini_role = "model"
                elif raw_role in ["user", "model"]:
                    gemini_role = raw_role
                else:
                    gemini_role = "user"

                gemini_messages.append(
                    types.Content(
                        role=gemini_role,
                        parts=[types.Part.from_text(text=text_part)],
                    )
                )

            response = await client.aio.models.generate_content(
                model=self.default_models.get("google", "gemini-2.0-flash"),
                contents=gemini_messages,
                config=types.GenerateContentConfig(
                    max_output_tokens=5000,
                    temperature=0.2,
                    system_instruction=summarizer_instruction,
                ),
            )

            # Walk response -> first candidate -> content -> parts, tolerating
            # any missing or empty level
            candidates = getattr(response, "candidates", None) if response else None
            candidate_content = (
                getattr(candidates[0], "content", None) if candidates else None
            )
            parts = (
                getattr(candidate_content, "parts", None)
                if candidate_content
                else None
            )

            text = ""
            for part in parts or []:
                if hasattr(part, "text") and part.text:
                    text += part.text

            if not text:
                self.logger.warning("Google response is empty or malformed")

            return {"content": text}

        raise ValueError(f"Unsupported client type: {client_type}")

    def start_new_round(self, iteration: Optional[int] = None):
        """Begin a new dialogue round and drop the recorded tool results.

        Args:
            iteration: Workflow iteration number to adopt as the current round.
                When omitted, the round counter is incremented by one instead.
        """
        if iteration is None:
            # No workflow iteration supplied: advance our own counter
            self.current_round += 1
            self.logger.info(f"🔄 Started new round {self.current_round}")
        else:
            # Mirror the workflow's iteration number
            self.current_round = iteration

        # Tool results belong to a single round only.
        # last_write_file_detected and should_clear_memory_next are left
        # untouched here, so they carry over into the new round.
        self.current_round_tool_results = []

    def record_tool_result(
        self, tool_name: str, tool_input: Dict[str, Any], tool_result: Any
    ):
        """
        Store a tool result for the current round and flag write_file calls.

        Args:
            tool_name: Name of the tool called
            tool_input: Input parameters for the tool
            tool_result: Result returned by the tool
        """
        # A write_file call arms both memory-clearing flags
        if tool_name == "write_file":
            self.last_write_file_detected = True
            self.should_clear_memory_next = True

        # Only these tools are kept; results of any other tool are ignored
        recorded_tools = (
            "write_file",  # Write file contents
            "execute_bash",  # Execute bash commands
            "search_reference_code",  # Search reference code
        )
        if tool_name not in recorded_tools:
            return

        self.current_round_tool_results.append(
            {
                "tool_name": tool_name,
                "tool_input": tool_input,
                "tool_result": tool_result,
                "timestamp": time.time(),
            }
        )

    def should_use_concise_mode(self) -> bool:
        """
        Report whether concise memory mode applies.

        Returns:
            The value of ``last_write_file_detected``, which is set once a
            write_file call has been recorded
        """
        write_seen = self.last_write_file_detected
        return write_seen

    def create_concise_messages(
        self,
        system_prompt: str,
        messages: List[Dict[str, Any]],
        files_implemented: int,
    ) -> List[Dict[str, Any]]:
        """
        Create concise message list for LLM input
        NEW LOGIC: Always clear after write_file, keep system_prompt + initial_plan + current round tools

        Args:
            system_prompt: Current system prompt
            messages: Original message list
            files_implemented: Number of files implemented so far

        Returns:
            Concise message list containing only essential information
        """
        if not self.last_write_file_detected:
            # Before any write_file, use normal flow
            self.logger.info(
                "🔄 Using normal conversation flow (before any write_file)"
            )
            return messages

        # After write_file detection, use concise approach with clean slate
        self.logger.info(
            f"🎯 Using CONCISE memory mode - Clear slate after write_file, Round {self.current_round}"
        )

        concise_messages = []

        # Get formatted file lists
        file_lists = self.get_formatted_files_lists()
        implemented_files_list = file_lists["implemented"]
        unimplemented_files_list = file_lists["unimplemented"]

        # Debug output for unimplemented files (clean format without dashes)
        unimplemented_files = self.get_unimplemented_files()
        print("✅ Unimplemented Files:")
        for file_path in unimplemented_files:
            print(f"{file_path}")
        if self.current_next_steps.strip():
            print(f"\n📋 {self.current_next_steps}")

        # 1. Add initial plan message (always preserved)
        initial_plan_message = {
            "role": "user",
            "content": f"""**Task: Implement code based on the following reproduction plan**

**Code Reproduction Plan:**
{self.initial_plan}

**Working Directory:** Current workspace

**All Previously Implemented Files:**
{implemented_files_list}

**Current Status:** {files_implemented} files implemented

**Remaining Files to Implement:**
{unimplemented_files_list}

**IMPORTANT:** If the remaining files list shows "All files implemented!", you MUST reply with "All files implemented" to complete the task. Do NOT continue calling tools.

**Objective:** {"Reply 'All files implemented' to finish" if not unimplemented_files else "Continue implementation by analyzing dependencies and implementing the next required file according to the plan's priority order."}""",
        }

        # Append Next Steps information if available
        # if self.current_next_steps.strip():
        #     initial_plan_message["content"] += (
        #         f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"
        #     )

        concise_messages.append(initial_plan_message)

        # 2. Add Knowledge Base
        knowledge_base_message = {
            "role": "user",
            "content": f"""**Below is the Knowledge Base of the LATEST implemented code file:**
{self._read_code_knowledge_base()}

**Development Cycle - START HERE:**

**FIRST - Check completion status:**
- If "Remaining Files to Implement" above shows "All files implemented!", reply "All files implemented" immediately

**For NEW file implementation (if remaining files exist):**
1. `search_code_references` → OPTIONALLY search reference patterns for inspiration (use for reference only, original paper specs take priority)
2. Write_file can be used to implement the new component

**Remember:** Stop and declare completion when all files are done!""",
        }
        if self.current_next_steps.strip():
            knowledge_base_message["content"] += (
                f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"
            )
        concise_messages.append(knowledge_base_message)

        # 3. Add current tool results (essential information for next file generation)
        if self.current_round_tool_results:
            tool_results_content = self._format_tool_results()

            # # Append Next Steps information if available
            # if self.current_next_steps.strip():
            #     tool_results_content += f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"

            tool_results_message = {
                "role": "user",
                "content": f"""**Current Tool Results:**
{tool_results_content}""",
            }
            concise_messages.append(tool_results_message)
        else:
            # If no tool results yet, add guidance for next steps
            guidance_content = f"""**Current Round:** {self.current_round}

**Development Cycle - START HERE:**

**For NEW file implementation:**
1. `search_code_references` → OPTIONALLY search reference patterns for inspiration (use for reference only, original paper specs take priority)
2. Write_file can be used to implement the new component"""

            # # Append Next Steps information if available (even when no tool results)
            # if self.current_next_steps.strip():
            #     guidance_content += f"\n\n**Next Steps (from previous analysis):**\n{self.current_next_steps}"

            guidance_message = {
                "role": "user",
                "content": guidance_content,
            }
            concise_messages.append(guidance_message)
        # **Available Essential Tools:** read_code_mem, write_file, execute_python, execute_bash
        # **Remember:** Start with read_code_mem when implementing NEW files to understand existing code. When all files are implemented, focus on testing and completion. Implement according to the original paper's specifications - any reference code is for inspiration only.
        # self.logger.info(f"✅ Concise messages created: {len(concise_messages)} messages (original: {len(messages)})")
        return concise_messages

    def _read_code_knowledge_base(self) -> Optional[str]:
        """
        Load the code summary file (``self.code_summary_path``) as the code
        knowledge base.

        Returns:
            The whole file content with surrounding whitespace stripped, or
            None when the file is missing, empty, or cannot be read
        """
        try:
            if not os.path.exists(self.code_summary_path):
                return None

            with open(self.code_summary_path, "r", encoding="utf-8") as summary_file:
                knowledge = summary_file.read().strip()

            # The complete file is returned; an empty file counts as "nothing"
            return knowledge or None

        except Exception as e:
            self.logger.error(f"Failed to read code knowledge base: {e}")
            return None

    def _extract_latest_implementation_entry(self, content: str) -> Optional[str]:
        """
        Return the last implementation section found in the summary content.

        A section starts at a header made of an 80-character "=" rule, a
        "## IMPLEMENTATION File ...; ROUND n" line and another "=" rule.

        Args:
            content: Full content of implement_code_summary.md

        Returns:
            Text from the last section header to the end of ``content``
            (stripped). When no header is present, the first 10 lines plus a
            truncation marker, or ``content`` itself if it has at most 10 lines.
        """
        try:
            import re

            header_regex = r"={80}\s*\n## IMPLEMENTATION File .+?; ROUND \d+\s*\n={80}"
            headers = list(re.finditer(header_regex, content))

            if headers:
                # Everything from the final header onward is the latest entry
                return content[headers[-1].start() :].strip()

            # No section header at all: fall back to the head of the content
            all_lines = content.split("\n")
            if len(all_lines) > 10:
                fallback_content = (
                    "\n".join(all_lines[:10]) + "\n... (truncated for brevity)"
                )
            else:
                fallback_content = content
            self.logger.info(
                "📖 No implementation sections found, using fallback content"
            )
            return fallback_content

        except Exception as e:
            self.logger.error(f"Failed to extract latest implementation entry: {e}")
            # Fall back to the last 500 characters
            if len(content) > 500:
                return content[-500:]
            return content

    def _format_tool_results(self) -> str:
        """
        Render the current round's tool results as text for the LLM.

        Each known tool gets a bold heading naming the tool and its key input,
        followed by the formatted result. Records of unknown tools are skipped.

        Returns:
            The rendered sections joined by newlines, or a fixed notice when no
            results were recorded this round
        """
        records = self.current_round_tool_results
        if not records:
            return "No tool results in current round."

        sections = []

        for record in records:
            name = record["tool_name"]
            args = record["tool_input"]
            outcome = record["tool_result"]

            # Build the heading text; it differs per tool type
            if name == "read_code_mem":
                target = args.get("file_path", "unknown")
                heading = f"read_code_mem Result for {target}"
            elif name == "read_file":
                target = args.get("file_path", "unknown")
                heading = f"read_file Result for {target}"
            elif name == "write_file":
                target = args.get("file_path", "unknown")
                heading = f"write_file Result for {target}"
            elif name == "execute_python":
                # Show at most the first 50 characters of the executed code
                source = args.get("code", "")
                preview = source[:50] + "..." if len(source) > 50 else source
                heading = f"execute_python Result (code: {preview})"
            elif name == "execute_bash":
                shell_command = args.get("command", "unknown")
                heading = f"execute_bash Result (command: {shell_command})"
            elif name == "search_code":
                needle = args.get("pattern", "unknown")
                scope = args.get("file_pattern", "")
                heading = f"search_code Result (pattern: {needle}, files: {scope})"
            elif name == "search_reference_code":
                target = args.get("target_file", "unknown")
                terms = args.get("keywords", "")
                heading = (
                    f"search_reference_code Result for {target} (keywords: {terms})"
                )
            elif name == "get_file_structure":
                folder = args.get("directory_path", args.get("path", "current"))
                heading = f"get_file_structure Result for {folder}"
            else:
                continue

            body = self._format_tool_result_content(outcome)
            sections.append(f"\n**{heading}:**\n{body}\n")

        return "\n".join(sections)

    def _format_tool_result_content(self, tool_result: Any) -> str:
        """
        Turn a single tool result into display text.

        Args:
            tool_result: Tool result to format

        Returns:
            For strings holding a JSON object: a summary line for the
            "summary_found" / "no_summary" statuses, otherwise the object
            pretty-printed with 2-space indentation. Other JSON values are
            stringified, non-JSON strings are returned unchanged, and
            non-string results go through ``str()``.
        """
        if not isinstance(tool_result, str):
            return str(tool_result)

        # Strings may carry JSON; anything that does not parse is passed through
        try:
            parsed = json.loads(tool_result)
        except json.JSONDecodeError:
            return tool_result

        if not isinstance(parsed, dict):
            return str(parsed)

        status = parsed.get("status")
        if status == "summary_found":
            summary_text = parsed.get("summary_content", "")
            return f"Summary found:\n{summary_text}"
        if status == "no_summary":
            return "No summary available"
        return json.dumps(parsed, indent=2)

    def get_memory_statistics(self, files_implemented: int = 0) -> Dict[str, Any]:
        """Collect a snapshot of the memory agent's state as a dictionary.

        Args:
            files_implemented: Implemented-file count supplied by the caller;
                reported as-is under "implemented_files_tracked"

        Returns:
            Dictionary with mode flags, round information, Next Steps details
            and file tracking figures
        """
        pending_files = self.get_unimplemented_files()
        round_results = self.current_round_tool_results
        concise_active = self.should_use_concise_mode()

        next_steps_present = bool(self.current_next_steps.strip())
        if self.current_next_steps:
            next_steps_chars = len(self.current_next_steps.strip())
        else:
            next_steps_chars = 0

        # Guard against division by zero when the plan lists no files
        if self.all_files_list:
            progress = len(self.implemented_files) / len(self.all_files_list) * 100
        else:
            progress = 0

        return {
            "last_write_file_detected": self.last_write_file_detected,
            "should_clear_memory_next": self.should_clear_memory_next,
            "current_round": self.current_round,
            "concise_mode_active": concise_active,
            "current_round_tool_results": len(round_results),
            "essential_tools_recorded": [r["tool_name"] for r in round_results],
            "implemented_files_tracked": files_implemented,
            "implemented_files_list": self.implemented_files.copy(),
            "phases_parsed": len(self.phase_structure),
            "next_steps_available": next_steps_present,
            "next_steps_length": next_steps_chars,
            # File tracking statistics
            "total_files_in_plan": len(self.all_files_list),
            "files_implemented_count": len(self.implemented_files),
            "files_remaining_count": len(pending_files),
            "all_files_list": self.all_files_list.copy(),
            "unimplemented_files_list": pending_files,
            "implementation_progress_percent": progress,
        }

    def get_implemented_files(self) -> List[str]:
        """Return a copy of the implemented files collection."""
        snapshot = self.implemented_files.copy()
        return snapshot

    def get_all_files_list(self) -> List[str]:
        """Return a copy of the list of all files that should be implemented."""
        snapshot = self.all_files_list.copy()
        return snapshot

    def refresh_files_list_from_directory(self) -> bool:
        """
        Replace the files list with the one extracted from the code directory.

        Returns:
            True when the directory exists and yielded a non-empty files list;
            False otherwise, in which case the current list is kept
        """
        discovered = None
        if os.path.exists(self.code_directory):
            discovered = self._extract_files_from_generated_directory()

        if not discovered:
            self.logger.warning("Cannot refresh from directory, keeping current list")
            return False

        previous_total = len(self.all_files_list)
        self.all_files_list = discovered
        current_total = len(self.all_files_list)
        self.logger.info(
            f"🔄 Files list refreshed from directory: {previous_total} → {current_total} files"
        )
        return True

    def get_unimplemented_files(self) -> List[str]:
        """
        List the planned files that have no matching implemented file.

        Paths are compared after converting backslashes to "/" and stripping
        leading/trailing "/". A planned file counts as implemented when the two
        paths are equal or when one is a suffix of the other starting at a "/"
        boundary (so "src/a.py" matches "a.py" but "src/xa.py" does not).

        Returns:
            Planned file paths, in plan order, that still need to be implemented
        """

        def _normalize(path: str) -> str:
            return path.replace("\\", "/").strip("/")

        def _same_file(plan_path: str, impl_path: str) -> bool:
            # Suffix matches only count at a path boundary
            return (
                plan_path.endswith("/" + impl_path)
                or plan_path == impl_path
                or impl_path.endswith("/" + plan_path)
            )

        pending = []
        for planned in self.all_files_list:
            planned_path = _normalize(planned)
            already_done = any(
                _same_file(planned_path, _normalize(done))
                for done in self.implemented_files
            )
            if not already_done:
                pending.append(planned)
        return pending

    def get_formatted_files_lists(self) -> Dict[str, str]:
        """
        Build bullet-list strings for implemented and unimplemented files.

        Returns:
            Dictionary with 'implemented' and 'unimplemented' keys; each value
            has one "- path" line per file, or a placeholder line when the
            corresponding list is empty
        """
        done_lines = [f"- {file}" for file in self.implemented_files]
        pending_lines = [f"- {file}" for file in self.get_unimplemented_files()]

        implemented_text = "\n".join(done_lines) if done_lines else "- None yet"
        if pending_lines:
            unimplemented_text = "\n".join(pending_lines)
        else:
            unimplemented_text = "- All files implemented!"

        return {"implemented": implemented_text, "unimplemented": unimplemented_text}

    def get_current_next_steps(self) -> str:
        """Return the Next Steps text currently stored on the agent."""
        stored_steps = self.current_next_steps
        return stored_steps

    def clear_next_steps(self):
        """Reset the stored Next Steps text to an empty string.

        A log entry is written only when there was non-blank text to discard.
        """
        had_content = bool(self.current_next_steps.strip())
        if had_content:
            self.logger.info("🧹 Next Steps information cleared")
        self.current_next_steps = ""

    def set_next_steps(self, next_steps: str):
        """Store the given Next Steps text and log its stripped length.

        Args:
            next_steps: Text to keep as the current Next Steps
        """
        self.current_next_steps = next_steps
        char_count = len(next_steps.strip())
        self.logger.info(f"📝 Next Steps manually set ({char_count} chars)")

    def should_trigger_memory_optimization(
        self, messages: List[Dict[str, Any]], files_implemented: int = 0
    ) -> bool:
        """
        Tell whether memory optimization should run now.

        The decision depends only on the ``should_clear_memory_next`` flag,
        which is raised when a write_file call is recorded.

        Args:
            messages: Current message list (not inspected)
            files_implemented: Number of files implemented so far (not inspected)

        Returns:
            True if concise mode should be applied
        """
        return bool(self.should_clear_memory_next)

    def apply_memory_optimization(
        self, system_prompt: str, messages: List[Dict[str, Any]], files_implemented: int
    ) -> List[Dict[str, Any]]:
        """
        Swap the message history for the concise message list when due.

        Runs only while ``should_clear_memory_next`` is set; the flag is
        cleared once the concise list has been built, and the message-count
        reduction is printed.

        Args:
            system_prompt: Current system prompt
            messages: Original message list
            files_implemented: Number of files implemented so far

        Returns:
            ``messages`` unchanged when no optimization is pending, otherwise
            the concise message list
        """
        if not self.should_clear_memory_next:
            return messages

        concise = self.create_concise_messages(
            system_prompt, messages, files_implemented
        )

        # One optimization per write_file detection
        self.should_clear_memory_next = False

        before, after = len(messages), len(concise)
        # Avoid dividing by zero for an empty history
        saved_percent = (before - after) / before * 100 if messages else 0
        print(
            f"🎯 CONCISE optimization applied: {before} → {after} messages ({saved_percent:.1f}% compression)"
        )

        return concise

    def clear_current_round_tool_results(self):
        """Discard all tool results recorded for the current round and log it."""
        self.current_round_tool_results = list()
        self.logger.info("🧹 Current round tool results cleared")

    def debug_concise_state(self, files_implemented: int = 0):
        """Print a human-readable dump of the concise memory state to stdout.

        Args:
            files_implemented: Implemented-file count forwarded to
                ``get_memory_statistics``
        """
        stats = self.get_memory_statistics(files_implemented)
        rule = "=" * 60

        print(rule)
        print("🎯 CONCISE MEMORY AGENT STATE (Write-File-Based)")
        print(rule)

        # Flags, round info and Next Steps
        print(f"Last write_file detected: {stats['last_write_file_detected']}")
        print(f"Should clear memory next: {stats['should_clear_memory_next']}")
        print(f"Files implemented: {stats['implemented_files_tracked']}")
        print(f"Current round: {stats['current_round']}")
        print(f"Concise mode active: {stats['concise_mode_active']}")
        print(f"Current round tool results: {stats['current_round_tool_results']}")
        print(f"Essential tools recorded: {stats['essential_tools_recorded']}")
        print(f"Implemented files tracked: {len(self.implemented_files)}")
        print(f"Implemented files list: {self.implemented_files}")
        print(f"Code summary file exists: {os.path.exists(self.code_summary_path)}")
        print(f"Next Steps available: {stats['next_steps_available']}")
        print(f"Next Steps length: {stats['next_steps_length']} chars")
        if self.current_next_steps.strip():
            print(f"Next Steps preview: {self.current_next_steps[:100]}...")
        print("")

        # File tracking figures
        print("📋 FILE TRACKING:")
        print(f"  Total files in plan: {stats['total_files_in_plan']}")
        print(f"  Files implemented: {stats['files_implemented_count']}")
        print(f"  Files remaining: {stats['files_remaining_count']}")
        print(f"  Progress: {stats['implementation_progress_percent']:.1f}%")
        remaining = stats["unimplemented_files_list"]
        if remaining:
            print(f"  Next possible files: {remaining[:3]}...")
        print("")

        # Fixed explanatory notes
        print(
            "📊 NEW LOGIC: write_file → clear memory → accumulate tools → next write_file"
        )
        print("📊 NEXT STEPS: Stored separately from file, included in tool results")
        print(
            "📊 FILE TRACKING: All files extracted from plan, unimplemented files guide LLM decisions"
        )

        # Per-tool call counts within the current round
        print("📊 Essential Tools Tracked:")
        recorded_names = [r["tool_name"] for r in self.current_round_tool_results]
        for tool in (
            "read_code_mem",
            "read_file",
            "write_file",
            "execute_python",
            "execute_bash",
            "search_code",
            "search_reference_code",
            "get_file_structure",
        ):
            print(f"  - {tool}: {recorded_names.count(tool)} calls")
        print(rule)


================================================
FILE: workflows/agents/memory_agent_concise_multi.py
================================================
"""
Concise Memory Agent for Code Implementation Workflow - Multi-File Only Support

This memory agent implements a focused approach with ONLY multi-file capabilities:
1. Before first batch: Normal conversation flow
2. After first batch: Keep only system_prompt + initial_plan + current round tool results
3. Clean slate for each new code batch generation
4. MULTI-FILE ONLY: Support for summarizing multiple files simultaneously (max 5)

Key Features:
- Preserves system prompt and initial plan always
- After first batch generation, discards previous conversation history
- Keeps only current round tool results from essential tools:
  * read_multiple_files, write_multiple_files
  * execute_python, execute_bash
  * search_code, search_reference_code, get_file_structure
- Provides clean, focused input for next write_multiple_files operation
- MULTI-FILE ONLY: No single file support
- FILE TRACKING: Gets ALL file information from workflow, no internal tracking
"""

import json
import logging
import os
import time
from datetime import datetime
from typing import Dict, Any, List, Optional


class ConciseMemoryAgent:
    """
    Concise Memory Agent - Focused Information Retention with MULTI-FILE ONLY Support

    Core Philosophy:
    - Preserve essential context (system prompt + initial plan)
    - After first batch generation, use clean slate approach
    - Keep only current round tool results from multi-file MCP tools
    - Remove conversational clutter and previous tool calls
    - MULTI-FILE ONLY: Support for multiple file implementations in single operation
    - FILE TRACKING: Receives ALL file information from workflow (no internal tracking)

    Essential Tools Tracked:
    - Multi-File Operations: read_multiple_files, write_multiple_files
    - Code Analysis: search_code, search_reference_code, get_file_structure
    - Execution: execute_python, execute_bash
    """

    def __init__(
        self,
        initial_plan_content: str,
        logger: Optional[logging.Logger] = None,
        target_directory: Optional[str] = None,
        default_models: Optional[Dict[str, str]] = None,
        max_files_per_batch: int = 3,
    ):
        """
        Initialize Concise Memory Agent with MULTI-FILE ONLY support

        Args:
            initial_plan_content: Content of initial_plan.txt
            logger: Logger instance
            target_directory: Target directory for saving summaries
            default_models: Default models configuration from workflow
            max_files_per_batch: Maximum number of files to implement simultaneously (default: 3)
        """
        self.logger = logger or self._create_default_logger()
        self.initial_plan = initial_plan_content
        self.max_files_per_batch = max_files_per_batch

        # Store default models configuration
        self.default_models = default_models or {
            "anthropic": "claude-sonnet-4-20250514",
            "openai": "o3-mini",
            "google": "gemini-2.0-flash",
        }

        # Memory state tracking - new logic: trigger after each write_multiple_files
        self.last_write_multiple_files_detected = (
            False  # Track if write_multiple_files was called in current iteration
        )
        self.should_clear_memory_next = False  # Flag to clear memory in next round
        self.current_round = 0

        # self.phase_structure = self._parse_phase_structure()

        # Memory configuration
        if target_directory:
            self.save_path = target_directory
        else:
            self.save_path = "./deepcode_lab/papers/1/"

        # Code summary file path
        self.code_summary_path = os.path.join(
            self.save_path, "implement_code_summary.md"
        )

        # Current round tool results storage
        self.current_round_tool_results = []

        self.logger.info(
            f"Concise Memory Agent initialized with target directory: {self.save_path}"
        )
        self.logger.info(f"Code summary will be saved to: {self.code_summary_path}")
        self.logger.info(f"Max files per batch: {self.max_files_per_batch}")
        self.logger.info(
            "📝 MULTI-FILE LOGIC: Memory clearing triggered after each write_multiple_files call"
        )
        self.logger.info(
            "🆕 MULTI-FILE ONLY: No single file support - batch operations only"
        )
        self.logger.info(
            "📊 FILE TRACKING: ALL file information received from workflow (no internal tracking)"
        )

    def _create_default_logger(self) -> logging.Logger:
        """Create default logger"""
        logger = logging.getLogger(f"{__name__}.ConciseMemoryAgent")
        logger.setLevel(logging.INFO)
        return logger

    async def create_multi_code_implementation_summary(
        self,
        client,
        client_type: str,
        file_implementations: Dict[str, str],
        files_implemented: int,
        implemented_files: List[str],  # Receive from workflow
    ) -> str:
        """
        Create LLM-based code implementation summary for multiple files
        ONLY AVAILABLE METHOD: Handles multiple files simultaneously with separate summaries for each

        Args:
            client: LLM client instance
            client_type: Type of LLM client ("anthropic" or "openai")
            file_implementations: Dictionary mapping file_path to implementation_content
            files_implemented: Number of files implemented so far
            implemented_files: List of all implemented files (from workflow)

        Returns:
            LLM-generated formatted code implementation summaries for all files
        """
        try:
            # Validate input
            if not file_implementations:
                raise ValueError("No file implementations provided")

            if len(file_implementations) > self.max_files_per_batch:
                raise ValueError(
                    f"Too many files provided ({len(file_implementations)}), max is {self.max_files_per_batch}"
                )

            # Create prompt for LLM summary of multiple files
            summary_prompt = self._create_multi_code_summary_prompt(
                file_implementations, files_implemented, implemented_files
            )
            summary_messages = [{"role": "user", "content": summary_prompt}]

            # Get LLM-generated summary
            llm_response = await self._call_llm_for_summary(
                client, client_type, summary_messages
            )
            llm_summary = llm_response.get("content", "")

            # Extract sections for each file and next steps
            multi_sections = self._extract_multi_summary_sections(
                llm_summary, file_implementations.keys()
            )

            # Format and save summary for each file (WITHOUT Next Steps)
            all_formatted_summaries = []

            for file_path in file_implementations.keys():
                file_sections = multi_sections.get("files", {}).get(file_path, {})

                # Format summary with ONLY Implementation Progress and Dependencies for file saving
                file_summary_content = ""
                if file_sections.get("core_purpose"):
                    file_summary_content += file_sections["core_purpose"] + "\n\n"
                if file_sections.get("public_interface"):
                    file_summary_content += file_sections["public_interface"] + "\n\n"
                if file_sections.get("internal_dependencies"):
                    file_summary_content += (
                        file_sections["internal_dependencies"] + "\n\n"
                    )
                if file_sections.get("external_dependencies"):
                    file_summary_content += (
                        file_sections["external_dependencies"] + "\n\n"
                    )
                if file_sections.get("implementation_notes"):
                    file_summary_content += (
                        file_sections["implementation_notes"] + "\n\n"
                    )

                # Create the formatted summary for file saving (WITHOUT Next Steps)
                formatted_summary = self._format_code_implementation_summary(
                    file_path, file_summary_content.strip(), files_implemented
                )

                all_formatted_summaries.append(formatted_summary)

                # Save to implement_code_summary.md (append mode) - ONLY Implementation Progress and Dependencies
                await self._save_code_summary_to_file(formatted_summary, file_path)

            # Combine all summaries for return
            combined_summary = "\n".join(all_formatted_summaries)

            self.logger.info(
                f"Created and saved multi-file code summaries for {len(file_implementations)} files"
            )

            return combined_summary

        except Exception as e:
            self.logger.error(
                f"Failed to create LLM-based multi-file code implementation summary: {e}"
            )
            # Fallback to simple summary for each file
            return self._create_fallback_multi_code_summary(
                file_implementations, files_implemented
            )

    def _create_multi_code_summary_prompt(
        self,
        file_implementations: Dict[str, str],
        files_implemented: int,
        implemented_files: List[str],
    ) -> str:
        """
        Create prompt for LLM to generate multi-file code implementation summary

        Args:
            file_implementations: Dictionary mapping file_path to implementation_content
            files_implemented: Number of files implemented so far
            implemented_files: List of all implemented files (from workflow)

        Returns:
            Prompt for LLM multi-file summarization
        """

        # Format file lists using workflow data
        implemented_files_list = (
            "\n".join([f"- {file}" for file in implemented_files])
            if implemented_files
            else "- None yet"
        )

        # Note: We don't have unimplemented files list anymore - workflow will provide when needed

        # Format file implementations for the prompt
        implementation_sections = []
        for file_path, content in file_implementations.items():
            implementation_sections.append(f"""
            **File: {file_path}**
            {content}
            """)

        files_list = list(file_implementations.keys())
        files_count = len(files_list)

        prompt = f"""You are an expert code implementation summarizer. Analyze the {files_count} implemented code files and create structured summaries for each.

**All Previously Implemented Files:**
{implemented_files_list}

**Current Implementation Context:**
- **Files Implemented**: {', '.join(files_list)}
- **Total Files Implemented**: {files_implemented}
- **Files in This Batch**: {files_count}

**Initial Plan Reference:**
{self.initial_plan[:]}

**Implemented Code Content:**
{''.join(implementation_sections)}

**Required Summary Format:**

**FOR EACH FILE, provide separate sections:**

**File: {{file_path}}**
**Core Purpose** (provide a general overview of the file's main responsibility):
- {{1-2 sentence description of file's main responsibility}}

**Public Interface** (what other files can use, if any):
- Class {{ClassName}}: {{purpose}} | Key methods: {{method_names}} | Constructor params: {{params}}
- Function {{function_name}}({{params}}): {{purpose}} -> {{return_type}}: {{purpose}}
- Constants/Types: {{name}}: {{value/description}}

**Internal Dependencies** (what this file imports/requires, if any):
- From {{module/file}}: {{specific_imports}}
- External packages: {{package_name}} - {{usage_context}}

**External Dependencies** (what depends on this file, if any):
- Expected to be imported by: {{likely_consumer_files}}
- Key exports used elsewhere: {{main_interfaces}}

**Implementation Notes**: (if any)
- Architecture decisions: {{key_choices_made}}
- Cross-File Relationships: {{how_files_work_together}}

[Repeat for all {files_count} files...]

**Instructions:**
- Provide separate Implementation Progress and Dependencies sections for each of the {files_count} files
- Be precise and concise for each file
- Focus on function interfaces that other files will need
- Extract actual function signatures from the code
- Use the exact format specified above

**Summary:**"""

        return prompt

    def _extract_multi_summary_sections(
        self, llm_summary: str, file_paths: List[str]
    ) -> Dict[str, Any]:
        """
        Extract different sections from LLM-generated multi-file summary
        """
        result = {
            "files": {},
        }

        try:
            # Convert dict_keys to list if needed
            if hasattr(file_paths, "keys"):
                file_paths = list(file_paths)
            elif not isinstance(file_paths, list):
                file_paths = list(file_paths)

            lines = llm_summary.split("\n")
            current_file = None
            current_section = None
            current_content = []
            file_sections = {}

            for i, line in enumerate(lines):
                line_lower = line.lower().strip()
                original_line = line.strip()

                # Skip empty lines
                if not original_line:
                    if current_section:
                        current_content.append(line)
                    continue

                # File header detection
                if (
                    "**file:" in line_lower or "file:" in line_lower
                ) and "**" in original_line:
                    # Save previous section
                    if current_file and current_section and current_content:
                        if current_file not in file_sections:
                            file_sections[current_file] = {}
                        file_sections[current_file][current_section] = "\n".join(
                            current_content
                        ).strip()

                    # Extract file path
                    file_header = original_line.lower()
                    if "**file:" in file_header:
                        file_header = original_line[
                            original_line.lower().find("file:") + 5 :
                        ]
                        if "**" in file_header:
                            file_header = file_header[: file_header.find("**")]
                    else:
                        file_header = original_line[
                            original_line.lower().find("file:") + 5 :
                        ]

                    file_header = file_header.strip()
                    current_file = None

                    # File matching
                    for file_path in file_paths:
                        file_name = file_path.split("/")[-1]
                        if (
                            file_path in file_header
                            or file_header in file_path
                            or file_name in file_header
                            or file_header in file_name
                        ):
                            current_file = file_path
                            break

                    current_section = None
                    current_content = []
                    continue

                # Section detection within files
                if current_file:
                    section_matched = False

                    if "core purpose" in line_lower and "**" in original_line:
                        if current_section and current_content:
                            if current_file not in file_sections:
                                file_sections[current_file] = {}
                            file_sections[current_file][current_section] = "\n".join(
                                current_content
                            ).strip()
                        current_section = "core_purpose"
                        current_content = []
                        section_matched = True
                    elif "public interface" in line_lower and "**" in original_line:
                        if current_section and current_content:
                            if current_file not in file_sections:
                                file_sections[current_file] = {}
                            file_sections[current_file][current_section] = "\n".join(
                                current_content
                            ).strip()
                        current_section = "public_interface"
                        current_content = []
                        section_matched = True
                    elif (
                        "internal dependencies" in line_lower and "**" in original_line
                    ):
                        if current_section and current_content:
                            if current_file not in file_sections:
                                file_sections[current_file] = {}
                            file_sections[current_file][current_section] = "\n".join(
                                current_content
                            ).strip()
                        current_section = "internal_dependencies"
                        current_content = []
                        section_matched = True
                    elif (
                        "external dependencies" in line_lower and "**" in original_line
                    ):
                        if current_section and current_content:
                            if current_file not in file_sections:
                                file_sections[current_file] = {}
                            file_sections[current_file][current_section] = "\n".join(
                                current_content
                            ).strip()
                        current_section = "external_dependencies"
                        current_content = []
                        section_matched = True
                    elif "implementation notes" in line_lower and "**" in original_line:
                        if current_section and current_content:
                            if current_file not in file_sections:
                                file_sections[current_file] = {}
                            file_sections[current_file][current_section] = "\n".join(
                                current_content
                            ).strip()
                        current_section = "implementation_notes"
                        current_content = []
                        section_matched = True

                    # If no section header matched, add to current content
                    if not section_matched and current_section:
                        current_content.append(line)

            # Save the final section
            if current_file and current_section and current_content:
                if current_file not in file_sections:
                    file_sections[current_file] = {}
                file_sections[current_file][current_section] = "\n".join(
                    current_content
                ).strip()

            # Build final result
            for file_path in file_paths:
                sections = file_sections.get(file_path, {})
                result["files"][file_path] = {}
                if "core_purpose" in sections:
                    result["files"][file_path]["core_purpose"] = (
                        "**Core Purpose**:\n" + sections["core_purpose"]
                    )
                if "public_interface" in sections:
                    result["files"][file_path]["public_interface"] = (
                        "**Public Interface**:\n" + sections["public_interface"]
                    )
                if "implementation_notes" in sections:
                    result["files"][file_path]["implementation_notes"] = (
                        "**Implementation Notes**:\n" + sections["implementation_notes"]
                    )
                if "internal_dependencies" in sections:
                    result["files"][file_path]["internal_dependencies"] = (
                        "**Internal Dependencies**:\n"
                        + sections["internal_dependencies"]
                    )
                if "external_dependencies" in sections:
                    result["files"][file_path]["external_dependencies"] = (
                        "**External Dependencies**:\n"
                        + sections["external_dependencies"]
                    )

            self.logger.info(
                f"📋 Extracted multi-file sections for {len(result['files'])} files"
            )

        except Exception as e:
            self.logger.error(f"Failed to extract multi-file summary sections: {e}")
            self.logger.error(f"📋 file_paths type: {type(file_paths)}")
            self.logger.error(f"📋 file_paths value: {file_paths}")
            self.logger.error(f"📋 file_paths length: {len(file_paths)}")
            for file_path in file_paths:
                result["files"][file_path] = {
                    "core_purpose": f"**Core Purpose**: {file_path} completed.",
                    "public_interface": "**Public Interface**: Public interface need manual review.",
                    "internal_dependencies": "**Internal Dependencies**: Internal dependencies need manual review.",
                    "external_dependencies": "**External Dependencies**: External dependencies need manual review.",
                    "implementation_notes": "**Implementation Notes**: Implementation notes need manual review.",
                }

        return result

    def _format_code_implementation_summary(
        self, file_path: str, llm_summary: str, files_implemented: int
    ) -> str:
        """
        Format the LLM-generated summary into the final structure

        Args:
            file_path: Path of the implemented file
            llm_summary: LLM-generated summary content
            files_implemented: Number of files implemented so far

        Returns:
            Formatted summary
        """
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        formatted_summary = f"""# Code Implementation Summary
**Generated**: {timestamp}
**File Implemented**: {file_path}

{llm_summary}

---
*Auto-generated by Memory Agent*
"""
        return formatted_summary

    def _create_fallback_multi_code_summary(
        self, file_implementations: Dict[str, str], files_implemented: int
    ) -> str:
        """
        Create fallback multi-file summary when LLM is unavailable

        Args:
            file_implementations: Dictionary mapping file_path to implementation_content
            files_implemented: Number of files implemented so far

        Returns:
            Fallback multi-file summary
        """
        # Create fallback summaries for each file
        fallback_summaries = []
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        for file_path in file_implementations.keys():
            fallback_summary = f"""# Code Implementation Summary
**Generated**: {timestamp}
**File Implemented**: {file_path}
**Multi-file batch summary failed to generate.**

---
*Auto-generated by Concise Memory Agent (Multi-File Fallback Mode)*
"""
            fallback_summaries.append(fallback_summary)

        return "\n".join(fallback_summaries)

    async def _save_code_summary_to_file(self, new_summary: str, file_path: str):
        """
        Append code implementation summary to implement_code_summary.md
        Accumulates all implementations with clear separators

        Args:
            new_summary: New summary content to append
            file_path: Path of the file for which the summary was generated
        """
        try:
            # Create directory if it doesn't exist
            os.makedirs(os.path.dirname(self.code_summary_path), exist_ok=True)

            # Check if file exists to determine if we need header
            file_exists = os.path.exists(self.code_summary_path)

            # Open in append mode to accumulate all implementations
            with open(self.code_summary_path, "a", encoding="utf-8") as f:
                if not file_exists:
                    # Write header for new file
                    f.write("# Code Implementation Progress Summary\n")
                    f.write("*Accumulated implementation progress for all files*\n\n")

                # Add clear separator between implementations
                f.write("\n" + "=" * 80 + "\n")
                f.write(f"## IMPLEMENTATION File {file_path}\n")
                f.write("=" * 80 + "\n\n")

                # Write the new summary
                f.write(new_summary)
                f.write("\n\n")

            self.logger.info(
                f"Appended LLM-based code implementation summary to: {self.code_summary_path}"
            )

        except Exception as e:
            self.logger.error(f"Failed to save code implementation summary: {e}")

    async def _call_llm_for_summary(
        self, client, client_type: str, summary_messages: List[Dict]
    ) -> Dict[str, Any]:
        """
        Call LLM for code implementation summary generation ONLY

        This method is used only for creating code implementation summaries,
        NOT for conversation summarization which has been removed.
        """
        if client_type == "anthropic":
            response = await client.messages.create(
                model=self.default_models["anthropic"],
                system="You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches.",
                messages=summary_messages,
                max_tokens=8000,  # Increased for multi-file support
                temperature=0.2,
            )

            content = ""
            for block in response.content:
                if block.type == "text":
                    content += block.text

            return {"content": content}

        elif client_type == "openai":
            openai_messages = [
                {
                    "role": "system",
                    "content": "You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches.",
                }
            ]
            openai_messages.extend(summary_messages)

            # Try max_tokens and temperature first, fallback to max_completion_tokens without temperature if unsupported
            try:
                response = await client.chat.completions.create(
                    model=self.default_models["openai"],
                    messages=openai_messages,
                    max_tokens=8000,  # Increased for multi-file support
                    temperature=0.2,
                )
            except Exception as e:
                if "max_tokens" in str(e) and "max_completion_tokens" in str(e):
                    # Retry with max_completion_tokens and no temperature for models that require it
                    response = await client.chat.completions.create(
                        model=self.default_models["openai"],
                        messages=openai_messages,
                        max_completion_tokens=8000,  # Increased for multi-file support
                    )
                else:
                    raise

            return {"content": response.choices[0].message.content or ""}

        elif client_type == "google":
            from google.genai import types

            # Convert messages to Gemini format
            system_instruction = "You are an expert code implementation summarizer. Create structured summaries of implemented code files that preserve essential information about functions, dependencies, and implementation approaches."

            gemini_messages = []
            for msg in summary_messages:
                role = msg.get("role", "user")
                content = msg.get("content", "")

                # Convert role names: "assistant" -> "model"
                if role == "assistant":
                    role = "model"
                elif role not in ["user", "model"]:
                    role = "user"

                gemini_messages.append(
                    types.Content(role=role, parts=[types.Part.from_text(text=content)])
                )

            config = types.GenerateContentConfig(
                max_output_tokens=8000,  # Increased for multi-file support
                temperature=0.2,
                system_instruction=system_instruction,
            )

            response = await client.aio.models.generate_content(
                model=self.default_models.get("google", "gemini-2.0-flash"),
                contents=gemini_messages,
                config=config,
            )

            # Extract content from Gemini response
            content = ""
            if response and hasattr(response, "candidates") and response.candidates:
                candidate = response.candidates[0]
                if hasattr(candidate, "content") and candidate.content:
                    if hasattr(candidate.content, "parts") and candidate.content.parts:
                        for part in candidate.content.parts:
                            if hasattr(part, "text") and part.text:
                                content += part.text

            if not content:
                self.logger.warning("Google response is empty or malformed")

            return {"content": content}

        else:
            raise ValueError(f"Unsupported client type: {client_type}")

    def start_new_round(self, iteration: Optional[int] = None):
        """Start a new dialogue round and reset tool results

        Args:
            iteration: Optional iteration number from workflow to sync with current_round
        """
        if iteration is not None:
            # Sync with workflow iteration
            self.current_round = iteration
        else:
            # Default behavior: increment round counter
            self.current_round += 1
            self.logger.info(f"🔄 Started new round {self.current_round}")

        self.current_round_tool_results = []  # Clear previous round results

    def record_tool_result(
        self, tool_name: str, tool_input: Dict[str, Any], tool_result: Any
    ):
        """
        Record tool result for current round and detect write_multiple_files calls

        Args:
            tool_name: Name of the tool called
            tool_input: Input parameters for the tool
            tool_result: Result returned by the tool
        """
        # Detect write_multiple_files calls to trigger memory clearing
        if tool_name == "write_multiple_files":
            self.last_write_multiple_files_detected = True
            self.should_clear_memory_next = True

        # Only record specific tools that provide essential information
        essential_tools = [
            "read_multiple_files",  # Read multiple file contents
            "write_multiple_files",  # Write multiple file contents (important for tracking implementations)
            "execute_python",  # Execute Python code (for testing/validation)
            "execute_bash",  # Execute bash commands (for build/execution)
            "search_code",  # Search code patterns
            "search_reference_code",  # Search reference code (if available)
            "get_file_structure",  # Get file structure (for understanding project layout)
        ]

        if tool_name in essential_tools:
            tool_record = {
                "tool_name": tool_name,
                "tool_input": tool_input,
                "tool_result": tool_result,
                "timestamp": time.time(),
            }
            self.current_round_tool_results.append(tool_record)

    def should_use_concise_mode(self) -> bool:
        """
        Check if concise memory mode should be used

        Returns:
            True if first batch has been generated and concise mode should be active
        """
        return self.last_write_multiple_files_detected

    def create_concise_messages_revise(
        self,
        system_prompt: str,
        messages: List[Dict[str, Any]],
        files_implemented: int,
        task_description: str,
        file_batch: List[str],
        is_first_batch: bool = True,
        implemented_files: List[str] = None,  # Receive from workflow
        all_files: List[str] = None,  # NEW: Receive all files from workflow
    ) -> List[Dict[str, Any]]:
        """
        Create concise message list for LLM input specifically for revision execution
        ALIGNED with _execute_multi_file_batch_revision in code_evaluation_workflow

        Args:
            system_prompt: Current system prompt
            messages: Original message list
            files_implemented: Number of files implemented so far
            task_description: Description of the current task
            file_batch: Files to implement in this batch
            is_first_batch: Whether this is the first batch (use file_batch) or subsequent
            implemented_files: List of all implemented files (from workflow)
            all_files: List of all files that should be implemented (from workflow)

        Returns:
            Concise message list containing only essential information for revision
        """
        # Use empty lists if not provided
        if implemented_files is None:
            implemented_files = []
        if all_files is None:
            all_files = []

        self.logger.info(
            "🎯 Using CONCISE memory mode for revision - Clear slate after write_multiple_files"
        )

        concise_messages = []

        # Format file lists using workflow data
        implemented_files_list = (
            "\n".join([f"- {file}" for file in implemented_files])
            if implemented_files
            else "- None yet"
        )

        # Calculate unimplemented files from workflow data

        # Read initial plan and memory content
        initial_plan_content = self.initial_plan
        memory_content = (
            self._read_code_knowledge_base()
            or "No previous implementation memory available"
        )

        files_to_implement = file_batch
        file_list = "\n".join([f"- {file_path}" for file_path in files_to_implement])

        # Create revision-specific task message
        task_message = f"""Task: {task_description}

    Files to implement in this batch ({len(files_to_implement)} files):
    {file_list}

    MANDATORY JSON FORMAT REQUIREMENTS:
    1. Use write_multiple_files tool
    2. Parameter name: "file_implementations"
    3. Value must be a VALID JSON string with ESCAPED newlines
    4. Use \\n for newlines, \\t for tabs, \\" for quotes
    5. NO literal newlines in the JSON string

    CORRECT JSON FORMAT EXAMPLE:
    {{
    "file1.py": "# Comment\\nclass MyClass:\\n    def __init__(self):\\n        pass\\n",
    "file2.py": "import os\\n\\ndef main():\\n    print('Hello')\\n"
    }}

    Initial Implementation Plan Context:
    {initial_plan_content}

    Previous Implementation Memory:
    {memory_content}

    **All Previously Implemented Files:**
    {implemented_files_list}

    **Current Status:** {files_implemented} files implemented

    IMPLEMENTATION REQUIREMENTS:
    - Create functional code for each file
    - Use proper Python syntax and imports
    - Include docstrings and comments
    - Follow the existing patterns from memory

    Files to implement: {files_to_implement}

    Call write_multiple_files NOW with PROPERLY ESCAPED JSON containing all {len(files_to_implement)} files."""

        concise_messages.append({"role": "user", "content": task_message})

        # Debug output for files to implement
        print("✅ Files to implement:")
        for file_path in files_to_implement:
            print(f"{file_path}")

        return concise_messages

    def _calculate_message_statistics(
        self, messages: List[Dict[str, Any]], label: str
    ) -> Dict[str, Any]:
        """
        Calculate statistics for a message list

        Args:
            messages: List of messages to analyze
            label: Label for logging

        Returns:
            Dictionary with statistics
        """
        total_chars = 0
        total_words = 0

        for msg in messages:
            content = msg.get("content", "")
            total_chars += len(content)
            total_words += len(content.split())

        # Estimate tokens (rough approximation: ~4 characters per token)
        estimated_tokens = total_chars // 4

        stats = {
            "message_count": len(messages),
            "total_characters": total_chars,
            "total_words": total_words,
            "estimated_tokens": estimated_tokens,
            "summary": f"{len(messages)} msgs, {total_chars:,} chars, ~{estimated_tokens:,} tokens",
        }

        return stats

    def _calculate_memory_savings(
        self, original_stats: Dict[str, Any], optimized_stats: Dict[str, Any]
    ) -> Dict[str, Any]:
        """
        Calculate memory savings between original and optimized messages

        Args:
            original_stats: Statistics for original messages
            optimized_stats: Statistics for optimized messages

        Returns:
            Dictionary with savings calculations
        """
        messages_saved = (
            original_stats["message_count"] - optimized_stats["message_count"]
        )
        chars_saved = (
            original_stats["total_characters"] - optimized_stats["total_characters"]
        )
        tokens_saved_estimate = (
            original_stats["estimated_tokens"] - optimized_stats["estimated_tokens"]
        )

        # Calculate percentages (avoid division by zero)
        messages_saved_percent = (
            messages_saved / max(original_stats["message_count"], 1)
        ) * 100
        chars_saved_percent = (
            chars_saved / max(original_stats["total_characters"], 1)
        ) * 100
        tokens_saved_percent = (
            tokens_saved_estimate / max(original_stats["estimated_tokens"], 1)
        ) * 100

        return {
            "messages_saved": messages_saved,
            "chars_saved": chars_saved,
            "tokens_saved_estimate": tokens_saved_estimate,
            "messages_saved_percent": messages_saved_percent,
            "chars_saved_percent": chars_saved_percent,
            "tokens_saved_percent": tokens_saved_percent,
        }

    def _read_code_knowledge_base(self) -> Optional[str]:
        """
        Read the implement_code_summary.md file as code knowledge base
        Returns only the final/latest implementation entry, not all historical entries

        Returns:
            Content of the latest implementation entry if it exists, None otherwise
        """
        try:
            if os.path.exists(self.code_summary_path):
                with open(self.code_summary_path, "r", encoding="utf-8") as f:
                    content = f.read().strip()
                return content
            else:
                return None

        except Exception as e:
            self.logger.error(f"Failed to read code knowledge base: {e}")
            return None

    def _extract_latest_implementation_entry(self, content: str) -> Optional[str]:
        """
        Extract the latest/final implementation entry from the implement_code_summary.md content
        Uses a simpler approach to find the last implementation section

        Args:
            content: Full content of implement_code_summary.md

        Returns:
            Latest implementation entry content, or None if not found
        """
        try:
            import re

            # Pattern to match the start of implementation sections
            section_pattern = r"={80}\s*\n## IMPLEMENTATION File .+?"

            # Find all implementation section starts
            matches = list(re.finditer(section_pattern, content))

            if not matches:
                # No implementation sections found
                lines = content.split("\n")
                fallback_content = (
                    "\n".join(lines[:10]) + "\n... (truncated for brevity)"
                    if len(lines) > 10
                    else content
                )
                self.logger.info(
                    "📖 No implementation sections found, using fallback content"
                )
                return fallback_content

            # Get the start position of the last implementation section
            last_match = matches[-1]
            start_pos = last_match.start()

            # Take everything from the last section start to the end of content
            latest_entry = content[start_pos:].strip()

            return latest_entry

        except Exception as e:
            self.logger.error(f"Failed to extract latest implementation entry: {e}")
            # Return last 1000 characters as fallback
            return content[-500:] if len(content) > 500 else content

    def _format_tool_results(self) -> str:
        """
        Format current round tool results for LLM input

        Returns:
            Formatted string of tool results
        """
        if not self.current_round_tool_results:
            return "No tool results in current round."

        formatted_results = []

        for result in self.current_round_tool_results:
            tool_name = result["tool_name"]
            tool_input = result["tool_input"]
            tool_result = result["tool_result"]

            # Format based on tool type
            if tool_name == "read_multiple_files":
                file_requests = tool_input.get("file_requests", "unknown")
                formatted_results.append(f"""
**read_multiple_files Result for {file_requests}:**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "write_multiple_files":
                formatted_results.append(f"""
**write_multiple_files Result for batch:**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "execute_python":
                code_snippet = (
                    tool_input.get("code", "")[:50] + "..."
                    if len(tool_input.get("code", "")) > 50
                    else tool_input.get("code", "")
                )
                formatted_results.append(f"""
**execute_python Result (code: {code_snippet}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "execute_bash":
                command = tool_input.get("command", "unknown")
                formatted_results.append(f"""
**execute_bash Result (command: {command}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "search_code":
                pattern = tool_input.get("pattern", "unknown")
                file_pattern = tool_input.get("file_pattern", "")
                formatted_results.append(f"""
**search_code Result (pattern: {pattern}, files: {file_pattern}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "search_reference_code":
                target_file = tool_input.get("target_file", "unknown")
                keywords = tool_input.get("keywords", "")
                formatted_results.append(f"""
**search_reference_code Result for {target_file} (keywords: {keywords}):**
{self._format_tool_result_content(tool_result)}
""")
            elif tool_name == "get_file_structure":
                directory = tool_input.get(
                    "directory_path", tool_input.get("path", "current")
                )
                formatted_results.append(f"""
**get_file_structure Result for {directory}:**
{self._format_tool_result_content(tool_result)}
""")

        return "\n".join(formatted_results)

    def _format_tool_result_content(self, tool_result: Any) -> str:
        """
        Format tool result content for display

        Args:
            tool_result: Tool result to format

        Returns:
            Formatted string representation
        """
        if isinstance(tool_result, str):
            # Try to parse as JSON for better formatting
            try:
                result_data = json.loads(tool_result)
                if isinstance(result_data, dict):
                    # Format key information
                    if result_data.get("status") == "success":
                        return json.dumps(result_data, indent=2)
                    else:
                        return json.dumps(result_data, indent=2)
                else:
                    return str(result_data)
            except json.JSONDecodeError:
                return tool_result
        else:
            return str(tool_result)

    def get_memory_statistics(
        self, all_files: List[str] = None, implemented_files: List[str] = None
    ) -> Dict[str, Any]:
        """
        Collect memory agent state and file progress into one statistics dict

        Args:
            all_files: List of all files that should be implemented (from workflow)
            implemented_files: List of all implemented files (from workflow)

        Returns:
            Dictionary combining the agent's round/flag state with file
            tracking counts, lists and a completion percentage derived from
            the two arguments
        """
        all_files = [] if all_files is None else all_files
        implemented_files = [] if implemented_files is None else implemented_files

        # Files in the plan that the workflow has not reported as implemented
        pending = [path for path in all_files if path not in implemented_files]

        # Percentage is 0 when the plan is empty (avoids division by zero)
        if all_files:
            progress = len(implemented_files) / len(all_files) * 100
        else:
            progress = 0

        recorded_tools = [entry["tool_name"] for entry in self.current_round_tool_results]

        stats = {
            "last_write_multiple_files_detected": self.last_write_multiple_files_detected,
            "should_clear_memory_next": self.should_clear_memory_next,
            "current_round": self.current_round,
            "concise_mode_active": self.should_use_concise_mode(),
            "current_round_tool_results": len(self.current_round_tool_results),
            "essential_tools_recorded": recorded_tools,
        }
        # File tracking statistics (from workflow)
        stats.update(
            {
                "total_files_in_plan": len(all_files),
                "files_implemented_count": len(implemented_files),
                "files_remaining_count": len(pending),
                "all_files_list": all_files.copy(),
                "implemented_files_list": implemented_files.copy(),
                "unimplemented_files_list": pending,
                "implementation_progress_percent": progress,
            }
        )
        # Multi-file support statistics
        stats.update(
            {
                "max_files_per_batch": self.max_files_per_batch,
                "multi_file_support": True,
                "single_file_support": False,  # Explicitly disabled
            }
        )
        return stats

    def record_multi_file_implementation(self, file_implementations: Dict[str, str]):
        """
        Log that a multi-file implementation batch was produced

        Only the batch size is logged; nothing is stored on the agent, since
        file tracking is handled by the workflow.

        Args:
            file_implementations: Dictionary mapping file_path to implementation_content
        """
        batch_size = len(file_implementations)
        self.logger.info(
            f"📝 Recorded multi-file implementation batch: {batch_size} files"
        )

    # ===== ENHANCED MEMORY SYNCHRONIZATION METHODS (Phase 4+) =====

    async def synchronize_revised_file_memory(
        self,
        client,
        client_type: str,
        revised_file_path: str,
        diff_content: str,
        new_content: str,
        revision_type: str = "targeted_fix",
    ) -> str:
        """
        Refresh the stored memory summary for one revised file

        Builds a revision prompt, asks the LLM for a summary, parses it into
        sections, formats the final summary text and saves it. Any exception
        along the way is logged and a generic fallback summary is returned
        instead.

        Args:
            client: LLM client instance
            client_type: Type of LLM client ("anthropic" or "openai")
            revised_file_path: Path of the revised file
            diff_content: Unified diff showing changes made
            new_content: Complete new content of the file
            revision_type: Type of revision ("targeted_fix", "comprehensive_revision", etc.)

        Returns:
            The formatted revision summary, or the fallback summary on failure
        """
        try:
            self.logger.info(
                f"🔄 Synchronizing memory for revised file: {revised_file_path}"
            )

            # Prompt -> LLM -> parsed sections -> formatted summary
            prompt = self._create_file_revision_summary_prompt(
                revised_file_path, diff_content, new_content, revision_type
            )
            response = await self._call_llm_for_summary(
                client, client_type, [{"role": "user", "content": prompt}]
            )
            sections = self._extract_revision_summary_sections(
                response.get("content", "")
            )
            summary_text = self._format_file_revision_summary(
                revised_file_path, sections, diff_content, revision_type
            )

            # Persist the revision summary for this file
            await self._save_revised_file_summary(summary_text, revised_file_path)

            self.logger.info(
                f"✅ Memory synchronized for revised file: {revised_file_path}"
            )
        except Exception as e:
            self.logger.error(
                f"Failed to synchronize memory for revised file {revised_file_path}: {e}"
            )
            # Fallback to simple revision summary
            return self._create_fallback_revision_summary(
                revised_file_path, revision_type
            )
        else:
            return summary_text

    async def synchronize_multiple_revised_files(
        self, client, client_type: str, revision_results: List[Dict[str, Any]]
    ) -> Dict[str, str]:
        """
        Refresh memory summaries for every successfully revised file

        Results are processed one after another. A result is synchronized
        only when it has a non-empty "file_path" and a truthy "success" flag;
        all others are skipped with a warning.

        Args:
            client: LLM client instance
            client_type: Type of LLM client
            revision_results: List of revision results with file paths, diffs, and new content

        Returns:
            Dictionary mapping file paths to updated memory summaries; an
            empty dictionary if an unexpected error occurs
        """
        try:
            self.logger.info(
                f"🔄 Synchronizing memory for {len(revision_results)} revised files"
            )

            summaries_by_path = {}

            for outcome in revision_results:
                path = outcome.get("file_path", "")
                diff = outcome.get("diff", "")
                content = outcome.get("new_content", "")
                kind = outcome.get("revision_type", "targeted_fix")

                if not (path and outcome.get("success", False)):
                    self.logger.warning(
                        f"⚠️ Skipping memory sync for failed revision: {path}"
                    )
                    continue

                summaries_by_path[path] = await self.synchronize_revised_file_memory(
                    client, client_type, path, diff, content, kind
                )

            self.logger.info(
                f"✅ Memory synchronized for {len(summaries_by_path)} successfully revised files"
            )

            return summaries_by_path

        except Exception as e:
            self.logger.error(
                f"Failed to synchronize memory for multiple revised files: {e}"
            )
            return {}

    def _create_file_revision_summary_prompt(
        self, file_path: str, diff_content: str, new_content: str, revision_type: str
    ) -> str:
        """
        Create prompt for LLM to generate file revision summary

        Args:
            file_path: Path of the revised file
            diff_content: Unified diff showing changes
            new_content: Complete new content of the file
            revision_type: Type of revision performed

        Returns:
            Prompt for LLM revision summarization
        """
        # Truncate content if too long for prompt
        content_preview = (
            new_content[:2000] + "..." if len(new_content) > 2000 else new_content
        )
        diff_preview = (
            diff_content[:1000] + "..." if len(diff_content) > 1000 else diff_content
        )

        prompt = f"""You are an expert code revision summarizer. A file has been REVISED with targeted changes. Create a structured summary of the revision.

**File Revised**: {file_path}
**Revision Type**: {revision_type}

**Changes Made (Diff):**
```diff
{diff_preview}
```

**Updated File Content:**
```python
{content_preview}
```

**Required Summary Format:**

**Revision Summary**:
- Brief description of what was changed and why

**Changes Made**:
- Specific modifications applied (line-level changes)
- Functions/classes affected
- New functionality added or bugs fixed

**Impact Assessment**:
- How the changes affect the file's behavior
- Dependencies that might be affected
- Integration points that need attention

**Quality Improvements**:
- Code quality enhancements made
- Error handling improvements
- Performance or maintainability gains

**Post-Revision Status**:
- Current functionality of the file
- Key interfaces and exports
- Dependencies and imports

**Instructions:**
- Focus on the CHANGES made, not just the final state
- Highlight the specific improvements and fixes applied
- Be concise but comprehensive about the revision impact
- Use the exact format specified above

**Summary:**"""

        return prompt

    def _extract_revision_summary_sections(self, llm_summary: str) -> Dict[str, str]:
        """
        Extract different sections from LLM-generated revision summary

        Args:
            llm_summary: Raw LLM response containing revision summary

        Returns:
            Dictionary with extracted sections
        """
        sections = {
            "revision_summary": "",
            "changes_made": "",
            "impact_assessment": "",
            "quality_improvements": "",
            "post_revision_status": "",
        }

        try:
            lines = llm_summary.split("\n")
            current_section = None
            current_content = []

            for line in lines:
                line_lower = line.lower().strip()
                original_line = line.strip()

                # Skip empty lines
                if not original_line:
                    if current_section:
                        current_content.append(line)
                    continue

                # Section detection
                section_matched = False

                if "revision summary" in line_lower and "**" in original_line:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "revision_summary"
                    current_content = []
                    section_matched = True
                elif "changes made" in line_lower and "**" in original_line:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "changes_made"
                    current_content = []
                    section_matched = True
                elif "impact assessment" in line_lower and "**" in original_line:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "impact_assessment"
                    current_content = []
                    section_matched = True
                elif "quality improvements" in line_lower and "**" in original_line:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "quality_improvements"
                    current_content = []
                    section_matched = True
                elif "post-revision status" in line_lower and "**" in original_line:
                    if current_section and current_content:
                        sections[current_section] = "\n".join(current_content).strip()
                    current_section = "post_revision_status"
                    current_content = []
                    section_matched = True

                # If no section header matched, add to current content
                if not section_matched and current_section:
                    current_content.append(line)

            # Save the final section
            if current_section and current_content:
                sections[current_section] = "\n".join(current_content).strip()

            self.logger.info(
                f"📋 Extracted {len([s for s in sections.values() if s])} revision summary sections"
            )

        except Exception as e:
            self.logger.error(f"Failed to extract revision summary sections: {e}")
            # Provide fallback content
            sections["revision_summary"] = "File revision completed"
            sections["changes_made"] = (
                "Targeted changes applied based on error analysis"
            )
            sections["impact_assessment"] = (
                "Changes should improve code functionality and reduce errors"
            )
            sections["quality_improvements"] = (
                "Code quality enhanced through targeted fixes"
            )
            sections["post_revision_status"] = "File functionality updated and improved"

        return sections

    def _format_file_revision_summary(
        self,
        file_path: str,
        revision_sections: Dict[str, str],
        diff_content: str,
        revision_type: str,
    ) -> str:
        """
        Format the revision summary into the final structure

        Args:
            file_path: Path of the revised file
            revision_sections: Extracted sections from LLM summary
            diff_content: Unified diff content
            revision_type: Type of revision performed

        Returns:
            Formatted revision summary
        """
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        # Format sections with fallbacks
        revision_summary = revision_sections.get(
            "revision_summary", "File revision completed"
        )
        changes_made = revision_sections.get("changes_made", "Targeted changes applied")
        impact_assessment = revision_sections.get(
            "impact_assessment", "Changes should improve functionality"
        )
        quality_improvements = revision_sections.get(
            "quality_improvements", "Code quality enhanced"
        )
        post_revision_status = revision_sections.get(
            "post_revision_status", "File updated successfully"
        )

        formatted_summary = f"""# File Revision Summary (UPDATED)
**Generated**: {timestamp}
**File Revised**: {file_path}
**Revision Type**: {revision_type}

## Revision Summary
{revision_summary}

## Changes Made
{changes_made}

## Impact Assessment
{impact_assessment}

## Quality Improvements
{quality_improvements}

## Post-Revision Status
{post_revision_status}

## Technical Details
**Diff Applied:**
```diff
{diff_content[:500]}{"..." if len(diff_content) > 500 else ""}
```

---
*Auto-generated by Enhanced Memory Agent (Revision Mode)*
"""
        return formatted_summary

    def _create_fallback_revision_summary(
        self, file_path: str, revision_type: str
    ) -> str:
        """
        Create fallback revision summary when LLM is unavailable

        Args:
            file_path: Path of the revised file
            revision_type: Type of revision performed

        Returns:
            Fallback revision summary
        """
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

        fallback_summary = f"""# File Revision Summary (UPDATED)
**Generated**: {timestamp}
**File Revised**: {file_path}
**Revision Type**: {revision_type}

## Revision Summary
File has been revised with targeted changes. LLM summary generation failed.

## Changes Made
- Targeted modifications applied based on error analysis
- Specific line-level changes implemented
- Code functionality updated

## Impact Assessment
- File behavior should be improved
- Error conditions addressed
- Integration points maintained

## Quality Improvements
- Code quality enhanced through precise fixes
- Error handling improved
- Maintainability increased

## Post-Revision Status
- File successfully updated
- Functionality preserved and enhanced
- Ready for integration testing

---
*Auto-generated by Enhanced Memory Agent (Revision Fallback Mode)*
"""
        return fallback_summary

    async def _save_revised_file_summary(self, revision_summary: str, file_path: str):
        """
        Save or update the revision summary for a file (replaces old summary)

        Args:
            revision_summary: New revision summary content
            file_path: Path of the file for which the summary was generated
        """
        try:
            # For revised files, we replace the existing summary rather than append
            # Read existing content to find and replace the specific file's summary
            file_exists = os.path.exists(self.code_summary_path)

            if file_exists:
                with open(self.code_summary_path, "r", encoding="utf-8") as f:
                    existing_content = f.read()

                # Look for existing summary for this file and replace it
                import re

                # Pattern to match existing implementation section for this file
                file_pattern = re.escape(file_path)
                section_pattern = rf"={80}\s*\n## IMPLEMENTATION File {file_pattern}\n={80}.*?(?=\n={80}|\Z)"

                # Check if this file already has a summary
                if re.search(section_pattern, existing_content, re.DOTALL):
                    # Replace existing summary
                    new_section = f"\n{'=' * 80}\n## IMPLEMENTATION File {file_path} (REVISED)\n{'=' * 80}\n\n{revision_summary}\n\n"
                    updated_content = re.sub(
                        section_pattern,
                        new_section.strip(),
                        existing_content,
                        flags=re.DOTALL,
                    )

                    with open(self.code_summary_path, "w", encoding="utf-8") as f:
                        f.write(updated_content)

                    self.logger.info(
                        f"Updated existing summary for revised file: {file_path}"
                    )
                else:
                    # Append new summary for this file
                    with open(self.code_summary_path, "a", encoding="utf-8") as f:
                        f.write("\n" + "=" * 80 + "\n")
                        f.write(f"## IMPLEMENTATION File {file_path} (REVISED)\n")
                        f.write("=" * 80 + "\n\n")
                        f.write(revision_summary)
                        f.write("\n\n")

                    self.logger.info(
                        f"Appended new summary for revised file: {file_path}"
                    )
            else:
                # Create new file with header
                os.makedirs(os.path.dirname(self.code_summary_path), exist_ok=True)

                with open(self.code_summary_path, "w", encoding="utf-8") as f:
                    f.write("# Code Implementation Progress Summary\n")
                    f.write("*Accumulated implementation progress for all files*\n\n")
                    f.write("\n" + "=" * 80 + "\n")
                    f.write(f"## IMPLEMENTATION File {file_path} (REVISED)\n")
                    f.write("=" * 80 + "\n\n")
                    f.write(revision_summary)
                    f.write("\n\n")

                self.logger.info(
                    f"Created new summary file with revised file: {file_path}"
                )

        except Exception as e:
            self.logger.error(
                f"Failed to save revised file summary for {file_path}: {e}"
            )

    def get_revision_memory_statistics(
        self, revised_files: List[str]
    ) -> Dict[str, Any]:
        """
        Report how many revised files have a "(REVISED)" entry in the summary file

        Args:
            revised_files: List of file paths that have been revised

        Returns:
            Dictionary with the number of revised files, how many of them are
            marked "(REVISED)" in the summary file, the resulting percentage,
            a copy of the input list, the summary path and a mode marker
            ("active", or "error" when gathering the statistics failed)
        """
        try:
            revised_total = len(revised_files)
            synced = 0

            # Count how many files have updated summaries
            if os.path.exists(self.code_summary_path):
                with open(self.code_summary_path, "r", encoding="utf-8") as summary_file:
                    summary_text = summary_file.read()

                synced = sum(
                    1
                    for revised_path in revised_files
                    if f"File {revised_path} (REVISED)" in summary_text
                )

            # Rate is 0 when no files were revised (avoids division by zero)
            if revised_total > 0:
                sync_rate = synced / revised_total * 100
            else:
                sync_rate = 0

            return {
                "total_revised_files": revised_total,
                "summaries_updated": synced,
                "memory_sync_rate": sync_rate,
                "revised_files_list": revised_files.copy(),
                "memory_summary_path": self.code_summary_path,
                "revision_memory_mode": "active",
            }

        except Exception as e:
            self.logger.error(f"Failed to get revision memory statistics: {e}")
            return {
                "total_revised_files": len(revised_files),
                "summaries_updated": 0,
                "memory_sync_rate": 0,
                "revised_files_list": revised_files.copy(),
                "memory_summary_path": self.code_summary_path,
                "revision_memory_mode": "error",
            }


================================================
FILE: workflows/agents/requirement_analysis_agent.py
================================================
"""
User Requirement Analysis Agent

Responsible for analyzing user initial requirements, generating guiding questions,
and summarizing detailed requirement documents based on user responses.
This Agent seamlessly integrates with existing chat workflows to provide more precise requirement understanding.
"""

import json
import logging
from typing import Dict, List, Optional

from mcp_agent.agents.agent import Agent
from utils.llm_utils import get_preferred_llm_class


class RequirementAnalysisAgent:
    """
    User Requirement Analysis Agent

    Core Functions:
    1. Generate guiding questions based on user initial requirements
       (the agent instruction mentions 5-8; the per-request prompt asks for 1-3)
    2. Collect user responses and analyze requirement completeness
    3. Generate detailed requirement documents for subsequent workflows
    4. Support skipping questions to directly enter implementation process

    Design Philosophy:
    - Intelligent question generation covering functionality, technology, performance, UI, deployment dimensions
    - Flexible user interaction supporting partial answers or complete skipping
    - Structured requirement output for easy understanding by code generation agents

    Usage:
        The class is an async context manager; ``initialize()`` must have run
        (directly or via ``async with``) before any LLM-backed method is used.
    """

    def __init__(self, logger: Optional[logging.Logger] = None):
        """
        Initialize requirement analysis agent
        Args:
            logger: Logger instance; a default INFO-level logger is created
                when omitted.
        """
        self.logger = logger or self._create_default_logger()
        # Both are populated by initialize() and reset by cleanup().
        self.mcp_agent = None
        self.llm = None

    def _create_default_logger(self) -> logging.Logger:
        """Create default logger (INFO level, named after this class)."""
        logger = logging.getLogger(f"{__name__}.RequirementAnalysisAgent")
        logger.setLevel(logging.INFO)
        return logger

    async def __aenter__(self):
        """Async context manager entry: initialize and return the agent."""
        await self.initialize()
        return self

    async def __aexit__(self, exc_type, exc_val, exc_tb):
        """Async context manager exit: release the underlying MCP agent."""
        await self.cleanup()

    async def initialize(self):
        """
        Initialize MCP Agent connection and LLM

        Raises:
            Exception: Whatever the agent construction, context entry or LLM
                attachment raised. Any agent that was already entered is
                released before the error propagates.
        """
        try:
            agent = Agent(
                name="RequirementAnalysisAgent",
                instruction="""You are a professional requirement analysis expert, skilled at guiding users to provide more detailed project requirements through precise questions.

Your core capabilities:
1. **Intelligent Question Generation**: Based on user initial descriptions, generate 5-8 key questions covering functional requirements, technology selection, performance requirements, user interface, deployment environment, etc.
2. **Requirement Understanding Analysis**: Deep analysis of user's real intentions and implicit requirements
3. **Structured Requirement Output**: Integrate scattered requirement information into clear technical specification documents

Question Generation Principles:
- Questions should be specific and clear, avoiding overly broad scope
- Cover key decision points for technical implementation
- Consider project feasibility and complexity
- Help users think about important details they might have missed

Requirement Summary Principles:
- Maintain user's original intent unchanged
- Supplement key information for technical implementation
- Provide clear functional module division
- Give reasonable technical architecture suggestions""",
                server_names=[],  # No MCP servers needed, only use LLM
            )

            # Initialize agent context
            await agent.__aenter__()
            # Publish the agent only once it has been entered, so cleanup()
            # never tries to exit an agent whose entry failed.
            self.mcp_agent = agent

            # Attach LLM
            self.llm = await agent.attach_llm(get_preferred_llm_class())

            self.logger.info("RequirementAnalysisAgent initialized successfully")

        except Exception as e:
            self.logger.error(f"RequirementAnalysisAgent initialization failed: {e}")
            # __aexit__ is not invoked when __aenter__ raises, so release a
            # half-initialized agent here instead of leaking it.
            await self.cleanup()
            raise

    async def cleanup(self):
        """
        Clean up resources

        Safe to call repeatedly: the agent/LLM references are cleared before
        the agent is exited, so a second call is a no-op. Errors raised while
        exiting the agent are logged as warnings and not propagated.
        """
        agent, self.mcp_agent, self.llm = self.mcp_agent, None, None
        if not agent:
            return
        try:
            await agent.__aexit__(None, None, None)
        except Exception as e:
            self.logger.warning(f"Error during resource cleanup: {e}")

    async def _generate_text(
        self, prompt: str, *, max_tokens: int, temperature: float
    ) -> str:
        """Send ``prompt`` to the attached LLM and return its raw string reply.

        Raises:
            RuntimeError: If no LLM has been attached yet.
        """
        if self.llm is None:
            raise RuntimeError(
                "RequirementAnalysisAgent is not initialized; "
                "call initialize() or use 'async with' first"
            )

        from mcp_agent.workflows.llm.augmented_llm import RequestParams

        params = RequestParams(max_tokens=max_tokens, temperature=temperature)
        return await self.llm.generate_str(message=prompt, request_params=params)

    def _parse_questions(self, raw_text: str) -> List[Dict[str, str]]:
        """Extract the JSON question array from an LLM reply.

        Candidates are tried in order: the shortest ``[{...}]`` match, the
        span from the first ``[`` to the last ``]`` (survives ``}]`` inside a
        string value and nested arrays), and finally the whole reply.

        Raises:
            ValueError: If nothing parses as JSON, or if what parses is not a
                non-empty list of objects.
        """
        import re

        cleaned = raw_text.strip()
        candidates: List[str] = []

        compact = re.search(r"\[\s*\{.*?\}\s*\]", cleaned, re.DOTALL)
        if compact:
            candidates.append(compact.group())

        first_open, last_close = cleaned.find("["), cleaned.rfind("]")
        if 0 <= first_open < last_close:
            candidates.append(cleaned[first_open : last_close + 1])

        candidates.append(cleaned)

        parsed_any = False
        tried = set()
        for candidate in candidates:
            if candidate in tried:
                continue
            tried.add(candidate)
            try:
                parsed = json.loads(candidate)
            except json.JSONDecodeError as e:
                self.logger.debug(f"JSON candidate rejected: {e}")
                continue
            parsed_any = True
            if (
                isinstance(parsed, list)
                and parsed
                and all(isinstance(item, dict) for item in parsed)
            ):
                self.logger.info(f"Extracted JSON: {candidate[:200]}...")
                return parsed

        if parsed_any:
            raise ValueError("Returned result is not a valid question list")

        self.logger.error(f"Original result: {raw_text}")
        self.logger.error("JSON parsing completely failed")
        raise ValueError("Failed to parse AI generated questions")

    async def generate_guiding_questions(self, user_input: str) -> List[Dict[str, str]]:
        """
        Generate guiding questions based on user initial requirements

        Args:
            user_input: User's initial requirement description

        Returns:
            List[Dict]: Question list, each question contains category, question, importance and other fields

        Raises:
            RuntimeError: If the agent has not been initialized.
            ValueError: If the LLM reply is empty or cannot be parsed into a
                non-empty list of question objects.
        """
        try:
            self.logger.info("Starting to generate AI precise guiding questions")

            # Build more precise prompt
            prompt = f"""Based on user's project requirements, generate precise guiding questions to help refine requirements.

User Requirements: {user_input}

Please analyze user requirements and generate 1-3 most critical targeted questions focusing on the most important aspects for this specific project

Return format (pure JSON array, no other text):
[
  {{
    "category": "Functional Requirements",
    "question": "Specific question content",
    "importance": "High",
    "hint": "Question hint"
  }}
]

Requirements: Questions should be specific and practical, avoiding general discussions."""

            self.logger.info(
                f"Calling LLM to generate precise questions, input length: {len(user_input)}"
            )

            # Lower temperature for more stable JSON output
            result = await self._generate_text(
                prompt, max_tokens=3000, temperature=0.5
            )

            self.logger.info(
                f"LLM returned result length: {len(result) if result else 0}"
            )

            if not result or not result.strip():
                self.logger.error("LLM returned empty result")
                raise ValueError("LLM returned empty result")

            self.logger.info(f"LLM returned result: {result[:500]}...")

            questions = self._parse_questions(result)
            self.logger.info(
                f"✅ Successfully generated {len(questions)} AI precise guiding questions"
            )
            return questions

        except Exception as e:
            self.logger.error(f"Failed to generate guiding questions: {e}")
            # Re-raise the exception instead of falling back to default questions
            raise

    async def summarize_detailed_requirements(
        self, initial_input: str, answers: Dict[str, str]
    ) -> str:
        """
        Generate detailed requirement document based on initial input and user answers

        Args:
            initial_input: User's initial requirement description
            answers: User's answer dictionary {question_id: answer}; empty or
                blank answers are ignored.

        Returns:
            str: Detailed requirement document. If the LLM call fails for any
            reason, a simplified template built from ``initial_input`` is
            returned instead of raising.
        """
        try:
            self.logger.info("Starting to generate AI detailed requirement summary")

            # Build answer content; only the answer text is used, and values
            # are coerced with str() so a non-string answer cannot abort the
            # whole summary.
            answers_text = "".join(
                f"• {answer}\n"
                for answer in (answers or {}).values()
                if answer and str(answer).strip()
            )

            if not answers_text:
                answers_text = "User chose to skip questions, generating based on initial requirements"

            prompt = f"""Based on user requirements and responses, generate a concise project requirement document.

Initial Requirements: {initial_input}

Additional Information:
{answers_text}

Please generate a focused requirement document including:

## Project Overview
Brief description of project's core goals and value proposition

## Functional Requirements
Detailed list of required features and functional modules:
- Core functionalities
- User interactions and workflows
- Data processing requirements
- Integration needs

## Technical Architecture
Recommended technical design including:
- Technology stack and frameworks
- System architecture design
- Database and data storage solutions
- API design considerations
- Security requirements

## Performance & Scalability
- Expected user scale and performance requirements
- Scalability considerations and constraints

Requirements: Focus on what needs to be built and how to build it technically. Be concise but comprehensive - avoid unnecessary implementation details."""

            self.logger.info(
                f"Calling LLM to generate requirement summary, initial requirement length: {len(initial_input)}"
            )

            result = await self._generate_text(
                prompt, max_tokens=4000, temperature=0.3
            )

            if not result or not result.strip():
                self.logger.error("LLM returned empty requirement summary")
                raise ValueError("LLM returned empty requirement summary")

            self.logger.info(
                f"✅ Requirement summary generation completed, length: {len(result)}"
            )
            return result.strip()

        except Exception as e:
            self.logger.error(f"Requirement summary failed: {e}")
            # Return basic requirement document
            return f"""## Project Overview
Based on user requirements: {initial_input}

## Functional Requirements
Core functionality needed: {initial_input}

## Technical Architecture
- Select appropriate technology stack based on project requirements
- Adopt modular architecture design
- Consider database and data storage solutions
- Implement necessary security measures

## Performance & Scalability
- Design for expected user scale
- Consider scalability and performance requirements

Note: Due to technical issues, this is a simplified requirement document. Manual supplementation of detailed information is recommended."""

    async def modify_requirements(
        self, current_requirements: str, modification_feedback: str
    ) -> str:
        """
        Modify existing requirement document based on user feedback

        Args:
            current_requirements: Current requirement document content
            modification_feedback: User's modification requests and feedback

        Returns:
            str: Modified requirement document. If the LLM call fails, the
            current document is returned unchanged with a note that lists the
            requested changes for manual follow-up.
        """
        try:
            self.logger.info("Starting to modify requirements based on user feedback")

            # Build modification prompt
            prompt = f"""Based on the current requirement document and user's modification requests, generate an updated requirement document.

Current Requirements Document:
{current_requirements}

User's Modification Requests:
{modification_feedback}

CRITICAL REQUIREMENT: You MUST generate a complete, well-structured requirement document regardless of how complete or incomplete the user's modification requests are. Even if the user only provides minimal or unclear feedback, you must still produce a comprehensive requirement document following the exact format below.

Generate an updated requirement document that incorporates any reasonable interpretation of the user's requested changes while maintaining the EXACT structure and format:

## Project Overview
Brief description of project's core goals and value proposition

## Functional Requirements
Detailed list of required features and functional modules:
- Core functionalities
- User interactions and workflows
- Data processing requirements
- Integration needs

## Technical Architecture
Recommended technical design including:
- Technology stack and frameworks
- System architecture design
- Database and data storage solutions
- API design considerations
- Security requirements

## Performance & Scalability
- Expected user scale and performance requirements
- Scalability considerations and constraints

MANDATORY REQUIREMENTS:
1. ALWAYS return a complete document with ALL sections above, regardless of user input completeness
2. If user feedback is unclear or incomplete, make reasonable assumptions based on the current requirements
3. Incorporate any clear user requests while filling in missing details intelligently
4. Maintain consistency and coherence throughout the document
5. Ensure all technical suggestions are feasible and practical
6. NEVER return an incomplete or partial document - always provide full sections
7. Keep the same professional structure and format in all cases"""

            self.logger.info(
                f"Calling LLM to modify requirements, feedback length: {len(modification_feedback)}"
            )

            result = await self._generate_text(
                prompt, max_tokens=4000, temperature=0.3
            )

            if not result or not result.strip():
                self.logger.error("LLM returned empty modified requirements")
                raise ValueError("LLM returned empty modified requirements")

            self.logger.info(
                f"✅ Requirements modification completed, length: {len(result)}"
            )
            return result.strip()

        except Exception as e:
            self.logger.error(f"Requirements modification failed: {e}")
            # Return current requirements with a note about the modification attempt
            return f"""{current_requirements}

---
**Note:** Automatic modification failed due to technical issues. The original requirements are shown above. Please manually incorporate the following requested changes:

{modification_feedback}"""


================================================
FILE: workflows/code_implementation_workflow.py
================================================
"""
Paper Code Implementation Workflow - MCP-compliant Iterative Development

Features:
1. File Tree Creation
2. Code Implementation - Based on aisi-basic-agent iterative development

MCP Architecture:
- MCP Server: tools/code_implementation_server.py
- MCP Client: Called through mcp_agent framework
- Configuration: mcp_agent.config.yaml
"""

import asyncio
import json
import logging
import os
import sys
import time
from pathlib import Path
from typing import Dict, Any, Optional, List

# MCP Agent imports
from mcp_agent.agents.agent import Agent

# Local imports
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from prompts.code_prompts import STRUCTURE_GENERATOR_PROMPT
from prompts.code_prompts import (
    GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT,
)
from workflows.agents import CodeImplementationAgent
from workflows.agents.memory_agent_concise import ConciseMemoryAgent
from config.mcp_tool_definitions import get_mcp_tools
from utils.llm_utils import get_preferred_llm_class, get_default_models, load_api_config
# DialogueLogger removed - no longer needed


class CodeImplementationWorkflow:
    """
    Paper Code Implementation Workflow Manager

    Uses standard MCP architecture:
    1. Connect to code-implementation server via MCP client
    2. Use MCP protocol for tool calls
    3. Support workspace management and operation history tracking
    """

    # ==================== 1. Class Initialization and Configuration (Infrastructure Layer) ====================

    def __init__(self, config_path: str = "mcp_agent.secrets.yaml"):
        """Set up configuration, logging and the loop/progress helpers.

        Args:
            config_path: Path to the secrets YAML file. The main config file
                ``mcp_agent.config.yaml`` is looked up in the same directory.
        """
        self.config_path = config_path

        # The main config is expected to sit next to the secrets file.
        config_dir = os.path.dirname(os.path.abspath(config_path))
        self.main_config_path = os.path.join(config_dir, "mcp_agent.config.yaml")

        self.api_config = self._load_api_config()
        self.default_models = get_default_models(self.main_config_path)
        self.logger = self._create_logger()

        self.mcp_agent = None
        # Default only; run_workflow() overwrites this from its own parameter.
        self.enable_read_tools = True

        self.loop_detector = LoopDetector()
        self.progress_tracker = ProgressTracker()

    def _load_api_config(self) -> Dict[str, Any]:
        """Load API configuration with environment variable override."""
        try:
            return load_api_config(self.config_path)
        except Exception as e:
            raise Exception(f"Failed to load API config: {e}")

    def _create_logger(self) -> logging.Logger:
        """Create and configure logger"""
        logger = logging.getLogger(__name__)
        # Don't add handlers to child loggers - let them propagate to root
        logger.setLevel(logging.INFO)
        return logger

    def _read_plan_file(self, plan_file_path: str) -> str:
        """Read implementation plan file"""
        plan_path = Path(plan_file_path)
        if not plan_path.exists():
            raise FileNotFoundError(
                f"Implementation plan file not found: {plan_file_path}"
            )

        with open(plan_path, "r", encoding="utf-8") as f:
            return f.read()

    def _check_file_tree_exists(self, target_directory: str) -> bool:
        """Check if file tree structure already exists"""
        code_directory = os.path.join(target_directory, "generate_code")
        return os.path.exists(code_directory) and len(os.listdir(code_directory)) > 0

    # ==================== 2. Public Interface Methods (External API Layer) ====================

    async def run_workflow(
        self,
        plan_file_path: str,
        target_directory: Optional[str] = None,
        pure_code_mode: bool = False,
        enable_read_tools: bool = True,
    ):
        """Run complete workflow - Main public interface"""
        # Set the read tools configuration
        self.enable_read_tools = enable_read_tools

        try:
            plan_content = self._read_plan_file(plan_file_path)

            if target_directory is None:
                target_directory = str(Path(plan_file_path).parent)

            # Calculate code directory for workspace alignment
            code_directory = os.path.join(target_directory, "generate_code")

            self.logger.info("=" * 80)
            self.logger.info("🚀 STARTING CODE IMPLEMENTATION WORKFLOW")
            self.logger.info("=" * 80)
            self.logger.info(f"📄 Plan file: {plan_file_path}")
            self.logger.info(f"📂 Plan file parent: {target_directory}")
            self.logger.info(f"🎯 Code directory (MCP workspace): {code_directory}")
            self.logger.info(
                f"⚙️  Read tools: {'ENABLED' if self.enable_read_tools else 'DISABLED'}"
            )
            self.logger.info("=" * 80)

            results = {}

            # Check if file tree exists
            if self._check_file_tree_exists(target_directory):
                self.logger.info("File tree exists, skipping creation")
                results["file_tree"] = "Already exists, skipped creation"
            else:
                self.logger.info("Creating file tree...")
                results["file_tree"] = await self.create_file_structure(
                    plan_content, target_directory
                )

            # Code implementation
            if pure_code_mode:
                self.logger.info("Starting pure code implementation...")
                results["code_implementation"] = await self.implement_code_pure(
                    plan_content, target_directory, code_directory
                )
            else:
                pass

            self.logger.info("Workflow execution successful")

            return {
                "status": "success",
                "plan_file": plan_file_path,
                "target_directory": target_directory,
                "code_directory": os.path.join(target_directory, "generate_code"),
                "results": results,
                "mcp_architecture": "standard",
            }

        except Exception as e:
            self.logger.error(f"Workflow execution failed: {e}")

            return {"status": "error", "message": str(e), "plan_file": plan_file_path}
        finally:
            await self._cleanup_mcp_agent()

    async def create_file_structure(
        self, plan_content: str, target_directory: str
    ) -> str:
        """Create file tree structure based on implementation plan"""
        self.logger.info("Starting file tree creation...")

        structure_agent = Agent(
            name="StructureGeneratorAgent",
            instruction=STRUCTURE_GENERATOR_PROMPT,
            server_names=["command-executor"],
        )

        async with structure_agent:
            creator = await structure_agent.attach_llm(
                get_preferred_llm_class(self.config_path)
            )

            message = f"""Analyze the following implementation plan and generate shell commands to create the file tree structure.

Target Directory: {target_directory}/generate_code/

Implementation Plan:
{plan_content}

Tasks:
1. Find the file tree structure in the implementation plan
2. Generate shell commands (mkdir -p, touch) to create that structure
3. Use the execute_commands tool to run the commands and create the file structure

Requirements:
- Use mkdir -p to create directories
- Use touch to create files
- Include __init__.py file for Python packages
- Use relative paths to the target directory
- Execute commands to actually create the file structure"""

            result = await creator.generate_str(message=message)
            self.logger.info(f"LLM response: {result[:200]}...")  # Log first 200 chars

            # Verify directory was created, if not create it manually
            code_dir = os.path.join(target_directory, "generate_code")
            if not os.path.exists(code_dir):
                self.logger.warning(
                    "LLM did not create directory, creating manually..."
                )
                os.makedirs(code_dir, exist_ok=True)
                self.logger.info(f"✅ Manually created directory: {code_dir}")
            else:
                self.logger.info(f"✅ Directory exists: {code_dir}")

            return result

    async def implement_code_pure(
        self, plan_content: str, target_directory: str, code_directory: str = None
    ) -> str:
        """Pure code implementation - focus on code writing without testing"""
        self.logger.info("Starting pure code implementation (no testing)...")

        # Use provided code_directory or calculate it (for backwards compatibility)
        if code_directory is None:
            code_directory = os.path.join(target_directory, "generate_code")

        self.logger.info(f"🎯 Using code directory (MCP workspace): {code_directory}")

        if not os.path.exists(code_directory):
            self.logger.warning(
                f"Code directory does not exist, creating it: {code_directory}"
            )
            os.makedirs(code_directory, exist_ok=True)
            self.logger.info(f"✅ Code directory created: {code_directory}")

        try:
            client, client_type = await self._initialize_llm_client()
            await self._initialize_mcp_agent(code_directory)

            tools = self._prepare_mcp_tool_definitions()
            system_message = GENERAL_CODE_IMPLEMENTATION_SYSTEM_PROMPT
            messages = []

            #             implementation_message = f"""**TASK: Implement Research Paper Reproduction Code**

            # You are implementing a complete, working codebase that reproduces the core algorithms, experiments, and methods described in a research paper. Your goal is to create functional code that can replicate the paper's key results and contributions.

            # **What you need to do:**
            # - Analyze the paper content and reproduction plan to understand requirements
            # - Implement all core algorithms mentioned in the main body of the paper
            # - Create the necessary components following the planned architecture
            # - Test each component to ensure functionality
            # - Integrate components into a cohesive, executable system
            # - Focus on reproducing main contributions rather than appendix-only experiments

            # **RESOURCES:**
            # - **Paper & Reproduction Plan**: `{target_directory}/` (contains .md paper files and initial_plan.txt with detailed implementation guidance)
            # - **Reference Code Indexes**: `{target_directory}/indexes/` (JSON files with implementation patterns from related codebases)
            # - **Implementation Directory**: `{code_directory}/` (your working directory for all code files)

            # **CURRENT OBJECTIVE:**
            # Start by reading the reproduction plan (`{target_directory}/initial_plan.txt`) to understand the implementation strategy, then examine the paper content to identify the first priority component to implement. Use the search_code tool to find relevant reference implementations from the indexes directory (`{target_directory}/indexes/*.json`) before coding.

            # ---
            # **START:** Review the plan above and begin implementation."""
            implementation_message = f"""**Task: Implement code based on the following reproduction plan**

**Code Reproduction Plan:**
{plan_content}

**Working Directory:** {code_directory}

**Current Objective:** Begin implementation by analyzing the plan structure, examining the current project layout, and implementing the first foundation file according to the plan's priority order."""

            messages.append({"role": "user", "content": implementation_message})

            result = await self._pure_code_implementation_loop(
                client,
                client_type,
                system_message,
                messages,
                tools,
                plan_content,
                target_directory,
            )

            return result

        finally:
            await self._cleanup_mcp_agent()

    # ==================== 3. Core Business Logic (Implementation Layer) ====================

    async def _pure_code_implementation_loop(
        self,
        client,
        client_type,
        system_message,
        messages,
        tools,
        plan_content,
        target_directory,
    ):
        """Pure code implementation loop with memory optimization and phase consistency"""
        max_iterations = 800
        iteration = 0
        start_time = time.time()
        max_time = 7200  # 120 minutes (2 hours)

        # Initialize specialized agents
        code_agent = CodeImplementationAgent(
            self.mcp_agent, self.logger, self.enable_read_tools
        )

        # Pass code_directory to memory agent for file extraction
        code_directory = os.path.join(target_directory, "generate_code")
        memory_agent = ConciseMemoryAgent(
            plan_content,
            self.logger,
            target_directory,
            self.default_models,
            code_directory,
        )

        # Log read tools configuration
        read_tools_status = "ENABLED" if self.enable_read_tools else "DISABLED"
        self.logger.info(
            f"🔧 Read tools (read_file, read_code_mem): {read_tools_status}"
        )
        if not self.enable_read_tools:
            self.logger.info(
                "🚫 No read mode: read_file and read_code_mem tools will be skipped"
            )

        # Connect code agent with memory agent for summary generation
        # Note: Concise memory agent doesn't need LLM client for summary generation
        code_agent.set_memory_agent(memory_agent, client, client_type)

        # Initialize memory agent with iteration 0
        memory_agent.start_new_round(iteration=0)

        while iteration < max_iterations:
            iteration += 1
            elapsed_time = time.time() - start_time

            if elapsed_time > max_time:
                self.logger.warning(f"Time limit reached: {elapsed_time:.2f}s")
                break
                
            # Check for loops and timeouts
            if self.loop_detector.should_abort():
                abort_reason = self.loop_detector.get_abort_reason()
                self.logger.error(f"🛑 Process aborted: {abort_reason}")
                # Return error immediately instead of continuing to final report
                return f"❌ Process aborted due to: {abort_reason}\n\nThe code implementation was stopped because the system detected an issue that prevented progress. Please check the logs for more details."
                
            # Update file-level progress
            files_implemented = code_agent.get_files_implemented_count()
            if files_implemented > 0:
                self.progress_tracker.total_files = max(self.progress_tracker.total_files, files_implemented + 5)  # Estimate total
                progress_info = self.progress_tracker.get_progress_info()
                print(f"📁 Files: {progress_info['files_completed']}/{progress_info['total_files']} ({progress_info['file_progress']:.1f}%)")
                if progress_info['estimated_remaining_seconds'] > 0:
                    print(f"⏱️ Estimated remaining: {progress_info['estimated_remaining_seconds']:.0f}s")

            # # Test simplified memory approach if we have files implemented
            # if iteration == 5 and code_agent.get_files_implemented_count() > 0:
            #     self.logger.info("🧪 Testing simplified memory approach...")
            #     test_results = await memory_agent.test_simplified_memory_approach()
            #     self.logger.info(f"Memory test results: {test_results}")

            # self.logger.info(f"Pure code implementation iteration {iteration}: generating code")

            messages = self._validate_messages(messages)
            current_system_message = code_agent.get_system_prompt()

            # Round logging removed

            # Call LLM
            response = await self._call_llm_with_tools(
                client, client_type, current_system_message, messages, tools
            )

            response_content = response.get("content", "").strip()
            if not response_content:
                response_content = "Continue implementing code files..."

            messages.append({"role": "assistant", "content": response_content})

            # Handle tool calls
            if response.get("tool_calls"):
                # Check for loops before executing tools
                for tool_call in response["tool_calls"]:
                    loop_status = self.loop_detector.check_tool_call(tool_call["name"])
                    if loop_status["should_stop"]:
                        self.logger.error(f"🛑 Tool execution aborted: {loop_status['message']}")
                        return f"Process aborted: {loop_status['message']}"
                
                tool_results = await code_agent.execute_tool_calls(
                    response["tool_calls"]
                )

                # Record essential tool results in concise memory agent
                for tool_call, tool_result in zip(response["tool_calls"], tool_results):
                    # Check if tool actually failed
                    # Only count as error if isError flag is True
                    is_error = tool_result.get("isError", False)
                    
                    if not is_error:
                        # Tool succeeded
                        self.loop_detector.record_success()
                        
                        # Track file completion
                        if tool_call["name"] == "write_file":
                            filename = tool_call["input"].get("file_path", "unknown")
                            self.progress_tracker.complete_file(filename)
                            print(f"✅ File completed: {filename}")
                    else:
                        # Tool actually failed
                        self.loop_detector.record_error(f"Tool {tool_call['name']} failed: {tool_result.get('result', '')[:100]}")
                    
                    memory_agent.record_tool_result(
                        tool_name=tool_call["name"],
                        tool_input=tool_call["input"],
                        tool_result=tool_result.get("result"),
                    )

                # NEW LOGIC: Check if write_file was called and trigger memory optimization immediately

                # Determine guidance based on results
                has_error = self._check_tool_results_for_errors(tool_results)
                files_count = code_agent.get_files_implemented_count()

                if has_error:
                    guidance = self._generate_error_guidance()
                else:
                    guidance = self._generate_success_guidance(files_count)

                compiled_response = self._compile_user_response(tool_results, guidance)
                messages.append({"role": "user", "content": compiled_response})

                # NEW LOGIC: Apply memory optimization immediately after write_file detection
                if memory_agent.should_trigger_memory_optimization(
                    messages, code_agent.get_files_implemented_count()
                ):
                    # Memory optimization triggered

                    # Apply concise memory optimization
                    files_implemented_count = code_agent.get_files_implemented_count()
                    current_system_message = code_agent.get_system_prompt()
                    messages = memory_agent.apply_memory_optimization(
                        current_system_message, messages, files_implemented_count
                    )

                    # Memory optimization completed

            else:
                files_count = code_agent.get_files_implemented_count()
                no_tools_guidance = self._generate_no_tools_guidance(files_count)
                messages.append({"role": "user", "content": no_tools_guidance})

            # # Check for analysis loop and provide corrective guidance
            # if code_agent.is_in_analysis_loop():
            #     analysis_loop_guidance = code_agent.get_analysis_loop_guidance()
            #     messages.append({"role": "user", "content": analysis_loop_guidance})
            #     self.logger.warning(
            #         "Analysis loop detected and corrective guidance provided"
            #     )

            # Record file implementations in memory agent (for the current round)
            for file_info in code_agent.get_implementation_summary()["completed_files"]:
                memory_agent.record_file_implementation(file_info["file"])

            # REMOVED: Old memory optimization logic - now happens immediately after write_file
            # Memory optimization is now triggered immediately after write_file detection

            # Start new round for next iteration, sync with workflow iteration
            memory_agent.start_new_round(iteration=iteration)

            # Check completion based on actual unimplemented files list
            unimplemented_files = memory_agent.get_unimplemented_files()
            if not unimplemented_files:  # Empty list means all files implemented
                self.logger.info(
                    "✅ Code implementation complete - All files implemented"
                )
                break

            # Emergency trim if too long
            if len(messages) > 50:
                self.logger.warning(
                    "Emergency message trim - applying concise memory optimization"
                )

                current_system_message = code_agent.get_system_prompt()
                files_implemented_count = code_agent.get_files_implemented_count()
                messages = memory_agent.apply_memory_optimization(
                    current_system_message, messages, files_implemented_count
                )

        return await self._generate_pure_code_final_report_with_concise_agents(
            iteration, time.time() - start_time, code_agent, memory_agent
        )

    # ==================== 4. MCP Agent and LLM Communication Management (Communication Layer) ====================

    async def _initialize_mcp_agent(self, code_directory: str):
        """Create the MCP agent, attach an LLM and set its workspace.

        The agent is entered manually with ``__aenter__`` and stored on
        ``self.mcp_agent``. After the LLM is attached, the ``set_workspace``
        tool is called with ``code_directory``.

        Args:
            code_directory: Path sent to ``set_workspace`` as ``workspace_path``.

        Returns:
            The object returned by ``self.mcp_agent.attach_llm(...)``.

        Raises:
            Exception: Any setup failure is logged and re-raised after a
                best-effort close of the agent; ``self.mcp_agent`` is reset to
                ``None`` in that case.
        """
        try:
            self.mcp_agent = Agent(
                name="CodeImplementationAgent",
                instruction="You are a code implementation assistant, using MCP tools to implement paper code replication. For large documents, use document-segmentation tools to read content in smaller chunks to avoid token limits.",
                server_names=["code-implementation", "code-reference-indexer", "document-segmentation"],
            )

            await self.mcp_agent.__aenter__()
            llm = await self.mcp_agent.attach_llm(
                get_preferred_llm_class(self.config_path)
            )

            # Set workspace to the target code directory
            workspace_result = await self.mcp_agent.call_tool(
                "set_workspace", {"workspace_path": code_directory}
            )
            self.logger.info(f"Workspace setup result: {workspace_result}")

            return llm

        except Exception as e:
            self.logger.error(f"Failed to initialize MCP agent: {e}")
            if self.mcp_agent:
                try:
                    await self.mcp_agent.__aexit__(None, None, None)
                except Exception as cleanup_error:
                    # Best-effort teardown: the original failure is what gets
                    # re-raised, but a failed close is still worth a trace.
                    self.logger.warning(
                        f"Error closing MCP agent after failed initialization: {cleanup_error}"
                    )
                self.mcp_agent = None
            raise

    async def _cleanup_mcp_agent(self):
        """Clean up MCP agent resources"""
        if self.mcp_agent:
            try:
                await self.mcp_agent.__aexit__(None, None, None)
                self.logger.info("MCP agent connection closed")
            except Exception as e:
                self.logger.warning(f"Error closing MCP agent: {e}")
            finally:
                self.mcp_agent = None

    async def _initialize_llm_client(self):
        """Initialize LLM client based on llm_provider preference and API key availability"""
        # Get API keys
        anthropic_key = self.api_config.get("anthropic", {}).get("api_key", "")
        openai_key = self.api_config.get("openai", {}).get("api_key", "")
        google_key = self.api_config.get("google", {}).get("api_key", "")

        # Read user preference from main config
        preferred_provider = None
        try:
            import yaml

            # Derive config path from secrets path (same directory)
            secrets_dir = os.path.dirname(os.path.abspath(self.config_path))
            config_path = os.path.join(secrets_dir, "mcp_agent.config.yaml")
            if os.path.exists(config_path):
                with open(config_path, "r", encoding="utf-8") as f:
                    config = yaml.safe_load(f)
                    preferred_provider = config.get("llm_provider", "").strip().lower()
        except Exception as e:
            self.logger.warning(f"Could not read llm_provider preference: {e}")

        # Define provider initialization functions
        async def init_anthropic():
            if not (anthropic_key and anthropic_key.strip()):
                return None
            try:
                from anthropic import AsyncAnthropic

                client = AsyncAnthropic(api_key=anthropic_key)
                await client.messages.create(
                    model=self.default_models["anthropic"],
                    max_tokens=20,
                    messages=[{"role": "user", "content": "test"}],
                )
                self.logger.info(
                    f"Using Anthropic API with model: {self.default_models['anthropic']}"
                )
                return client, "anthropic"
            except Exception as e:
                self.logger.warning(f"Anthropic API unavailable: {e}")
                return None

        async def init_google():
            if not (google_key and google_key.strip()):
                return None
            try:
                from google import genai

                client = genai.Client(api_key=google_key)
                try:
                    test_response = await client.aio.models.generate_content(
                        model=self.default_models.get("google", "gemini-2.0-flash"),
                        contents="test",
                    )
                    self.logger.info(
                        "Google API connection successful: " + str(test_response)
                    )
                except Exception as test_err:
                    self.logger.warning(
                        f"Could not test Google API: {test_err}, but will try to use client"
                    )

                self.logger.info(
                    f"Using Google API with model: {self.default_models.get('google', 'gemini-2.0-flash')}"
                )
                return client, "google"
            except Exception as e:
                self.logger.warning(f"Google API unavailable: {e}")
                return None

        async def init_openai():
            if not (openai_key and openai_key.strip()):
                return None
            try:
                from openai import AsyncOpenAI

                openai_config = self.api_config.get("openai", {})
                base_url = openai_config.get("base_url")

                if base_url:
                    client = AsyncOpenAI(api_key=openai_key, base_url=base_url)
                else:
                    client = AsyncOpenAI(api_key=openai_key)

                model_name = self.default_models.get("openai", "o3-mini")

                try:
                    await client.chat.completions.create(
                        model=model_name,
                        max_tokens=20,
                        messages=[{"role": "user", "content": "test"}],
                    )
                except Exception as e:
                    if "max_tokens" in str(e) and "max_completion_tokens" in str(e):
                        self.logger.info(
                            f"Model {model_name} requires max_completion_tokens parameter"
                        )
                        await client.chat.completions.create(
                            model=model_name,
                            max_completion_tokens=20,
                            messages=[{"role": "user", "content": "test"}],
                        )
                    else:
                        raise
                self.logger.info(f"Using OpenAI API with model: {model_name}")
                if base_url:
                    self.logger.info(f"Using custom base URL: {base_url}")
                return client, "openai"
            except Exception as e:
                self.logger.warning(f"OpenAI API unavailable: {e}")
                return None

        # Map providers to their init functions
        provider_init_map = {
            "anthropic": init_anthropic,
            "google": init_google,
            "openai": init_openai,
        }

        # Try preferred provider first
        if preferred_provider and preferred_provider in provider_init_map:
            self.logger.info(f"🎯 Trying preferred provider: {preferred_provider}")
            result = await provider_init_map[preferred_provider]()
            if result:
                return result
            else:
                self.logger.warning(
                    f"⚠️ Preferred provider '{preferred_provider}' unavailable, trying alternatives..."
                )

        # Fallback: try providers in order
        for provider_name, init_func in provider_init_map.items():
            if provider_name == preferred_provider:
                continue  # Already tried
            result = await init_func()
            if result:
                return result

        raise ValueError(
            "No available LLM API - please check your API keys in configuration"
        )

    async def _call_llm_with_tools(
        self, client, client_type, system_message, messages, tools, max_tokens=8192
    ):
        """Call LLM with tools"""
        try:
            if client_type == "anthropic":
                return await self._call_anthropic_with_tools(
                    client, system_message, messages, tools, max_tokens
                )
            elif client_type == "openai":
                return await self._call_openai_with_tools(
                    client, system_message, messages, tools, max_tokens
                )
            elif client_type == "google":
                return await self._call_google_with_tools(
                    client, system_message, messages, tools, max_tokens
                )
            else:
                raise ValueError(f"Unsupported client type: {client_type}")
        except Exception as e:
            self.logger.error(f"LLM call failed: {e}")
            raise

    async def _call_anthropic_with_tools(
        self, client, system_message, messages, tools, max_tokens
    ):
        """Call Anthropic API with token limit management"""
        validated_messages = self._validate_messages(messages)
        if not validated_messages:
            validated_messages = [
                {"role": "user", "content": "Please continue implementing code"}
            ]

        try:
            # Use implementation-specific model for code generation
            impl_model = self.default_models.get(
                "anthropic_implementation", self.default_models["anthropic"]
            )
            self.logger.info(f"🔧 Code generation using model: {impl_model}")
            response = await client.messages.create(
                model=impl_model,
                system=system_message,
                messages=validated_messages,
                tools=tools,
                max_tokens=max_tokens,
                temperature=0.2,
            )
        except Exception as e:
            self.logger.error(f"Anthropic API call failed: {e}")
            raise

        content = ""
        tool_calls = []

        for block in response.content:
            if block.type == "text":
                content += block.text
            elif block.type == "tool_use":
                tool_calls.append(
                    {"id": block.id, "name": block.name, "input": block.input}
                )

        # Extract token usage and calculate cost
        token_usage = {}
        cost = 0.0
        
        if hasattr(response, 'usage') and response.usage:
            token_usage = {
                "input_tokens": response.usage.input_tokens,
                "output_tokens": response.usage.output_tokens,
                "total_tokens": response.usage.input_tokens + response.usage.output_tokens
            }
            
            # Use dynamic cost calculation based on current model
            from utils.model_limits import calculate_token_cost
            cost = calculate_token_cost(
                response.usage.input_tokens,
                response.usage.output_tokens,
                model_name=self.default_models.get("anthropic")
            )
            
            print(f"💰 Tokens: {token_usage['total_tokens']} (${cost:.4f})")
            self.logger.info(f"Token usage: {token_usage['input_tokens']} input + {token_usage['output_tokens']} output = {token_usage['total_tokens']} total (${cost:.4f})")

        return {
            "content": content, 
            "tool_calls": tool_calls,
            "token_usage": token_usage,
            "cost": cost
        }

    async def _call_google_with_tools(
        self, client, system_message, messages, tools, max_tokens
    ):
        """
        Call Google Gemini API with tools

        Note: Google Gemini uses a completely different API structure.
        The client here is expected to be google.genai.Client from google-genai SDK.

        Reference: https://ai.google.dev/gemini-api/docs/function-calling
        """
        try:
            from google.genai import types
        except ImportError:
            raise ImportError("google-genai package is required for Google API calls")

        validated_messages = self._validate_messages(messages)
        if not validated_messages:
            validated_messages = [
                {"role": "user", "content": "Please continue implementing code"}
            ]

        # Convert messages to Google Gemini format (types.Content)
        # Gemini expects: role="user" or role="model" (not "assistant")
        gemini_messages = []
        for msg in validated_messages:
            role = msg.get("role", "user")
            content = msg.get("content", "")

            # Convert role names: "assistant" -> "model"
            if role == "assistant":
                role = "model"
            elif role not in ["user", "model"]:
                # Skip unsupported roles or convert to user
                role = "user"

            gemini_messages.append(
                types.Content(role=role, parts=[types.Part.from_text(text=content)])
            )

        # Convert tools to Google Gemini format (types.Tool with FunctionDeclaration)
        # Following the EXACT pattern from GoogleAugmentedLLM line 92-103
        # IMPORTANT: Each tool should be wrapped in its own Tool object!
        gemini_tools = []
        if tools:
            for tool in tools:
                # Transform the input_schema to be Gemini-compatible
                parameters = self._transform_schema_for_gemini(tool["input_schema"])

                # Each tool gets its own Tool wrapper (not all in one!)
                gemini_tools.append(
                    types.Tool(
                        function_declarations=[
                            types.FunctionDeclaration(
                                name=tool["name"],
                                description=tool["description"],
                                parameters=parameters,
                            )
                        ]
                    )
                )

        # Create config with system instruction and tools
        config = types.GenerateContentConfig(
            max_output_tokens=max_tokens,
            temperature=0.2,
            system_instruction=system_message if system_message else None,
            tools=gemini_tools if gemini_tools else None,
            # Disable automatic function calling - we handle it manually
            automatic_function_calling=types.AutomaticFunctionCallingConfig(
                disable=True
            ),
        )

        try:
            # Google Gemini API call using the native SDK
            # client is google.genai.Client instance
            # Use implementation-specific model for code generation
            impl_model = self.default_models.get(
                "google_implementation", self.default_models["google"]
            )
            self.logger.info(f"🔧 Code generation using model: {impl_model}")
            response = await client.aio.models.generate_content(
                model=impl_model,
                contents=gemini_messages,
                config=config,
            )
        except Exception as e:
            self.logger.error(f"Google API call failed: {e}")
            raise

        # Parse Gemini response (types.GenerateContentResponse)
        # Following the pattern from augmented_llm_google.py lines 145-165
        content = ""
        tool_calls = []

        if response and hasattr(response, "candidates") and response.candidates:
            candidate = response.candidates[0]

            if hasattr(candidate, "content") and candidate.content:
                if hasattr(candidate.content, "parts") and candidate.content.parts:
                    for part in candidate.content.parts:
                        # Handle text content
                        if hasattr(part, "text") and part.text:
                            content += part.text

                        # Handle function calls
                        # Check for function_call attribute, matching augmented_llm_google.py line 164
                        if hasattr(part, "function_call") and part.function_call:
                            fc = part.function_call
                            # Extract function call details
                            # Note: Gemini function_call has name and args attributes
                            tool_call = {
                                "id": getattr(
                                    fc, "id", getattr(fc, "name", "")
                                ),  # Use name as fallback for id
                                "name": fc.name if hasattr(fc, "name") else "",
                                "input": dict(fc.args)
                                if hasattr(fc, "args") and fc.args
                                else {},
                            }
                            self.logger.debug(
                                f"Google function_call parsed: {tool_call}"
                            )
                            tool_calls.append(tool_call)

        return {"content": content, "tool_calls": tool_calls}

    def _transform_schema_for_gemini(self, schema: dict) -> dict:
        """
        Transform JSON Schema to OpenAPI Schema format compatible with Gemini.

        This is based on the transform_mcp_tool_schema from GoogleAugmentedLLM.
        Key transformations:
        1. Convert camelCase to snake_case
        2. Remove unsupported fields (default, additionalProperties)
        3. Handle nullable types via anyOf
        """
        if not isinstance(schema, dict):
            return schema

        # Fields to exclude
        EXCLUDED_PROPERTIES = {"default", "additionalProperties"}

        # camelCase to snake_case mappings
        CAMEL_TO_SNAKE = {
            "anyOf": "any_of",
            "maxLength": "max_length",
            "minLength": "min_length",
            "minProperties": "min_properties",
            "maxProperties": "max_properties",
            "maxItems": "max_items",
            "minItems": "min_items",
        }

        result = {}

        for key, value in schema.items():
            # Skip excluded properties
            if key in EXCLUDED_PROPERTIES:
                continue

            # Convert camelCase to snake_case
            snake_key = CAMEL_TO_SNAKE.get(key, key)

            # Handle nested structures
            if key == "properties" and isinstance(value, dict):
                result[snake_key] = {
                    prop_k: self._transform_schema_for_gemini(prop_v)
                    for prop_k, prop_v in value.items()
                }
            elif key == "items" and isinstance(value, dict):
                result[snake_key] = self._transform_schema_for_gemini(value)
            elif key == "anyOf" and isinstance(value, list):
                # Handle nullable types (Type | None)
                has_null = any(
                    isinstance(item, dict) and item.get("type") == "null"
                    for item in value
                )
                if has_null:
                    result["nullable"] = True

                # Get first non-null schema
                for item in value:
                    if isinstance(item, dict) and item.get("type") != "null":
                        transformed = self._transform_schema_for_gemini(item)
                        for k, v in transformed.items():
                            if k not in result:
                                result[k] = v
                        break
            else:
                result[snake_key] = value

        return result

    def _repair_truncated_json(self, json_str: str, tool_name: str = "") -> dict:
        """
        Advanced JSON repair for truncated or malformed JSON from LLM responses.

        Handles:
        - Missing closing braces/brackets
        - Truncated string values
        - Missing required fields
        - Trailing commas
        """
        import re

        # Step 1: Try basic fixes first
        fixed = json_str.strip()

        # Remove trailing commas
        fixed = re.sub(r",\s*}", "}", fixed)
        fixed = re.sub(r",\s*]", "]", fixed)

        try:
            return json.loads(fixed)
        except json.JSONDecodeError as e:
            print("   🔧 Attempting advanced JSON repair...")

            # Step 2: Check for truncation issues
            if e.msg == "Expecting value":
                # Likely truncated - try to close open structures
                fixed = self._close_json_structures(fixed)
                try:
                    return json.loads(fixed)
                except (json.JSONDecodeError, ValueError, TypeError):
                    pass

            # Step 3: Try to extract partial valid JSON
            if e.msg.startswith("Expecting") and e.pos:
                # Truncate at error position and try to close
                truncated = fixed[: e.pos]
                closed = self._close_json_structures(truncated)
                try:
                    partial = json.loads(closed)
                    print("   ✅ Extracted partial JSON successfully")
                    return partial
                except (json.JSONDecodeError, ValueError, TypeError):
                    pass

            # Step 4: Tool-specific defaults for critical tools
            if tool_name == "write_file":
                # For write_file, try to extract at least file_path
                file_path_match = re.search(r'"file_path"\s*:\s*"([^"]*)"', fixed)
                if file_path_match:
                    print("   ⚠️  write_file JSON truncated, using minimal structure")
                    return {
                        "file_path": file_path_match.group(1),
                        "content": "",  # Empty content is better than crashing
                    }

            # Step 5: Last resort - return error indicator
            print("   ❌ JSON repair failed completely")
            return None

    def _close_json_structures(self, json_str: str) -> str:
        """
        Intelligently close unclosed JSON structures.
        Counts braces and brackets to determine what needs closing.
        """
        # Count open structures
        open_braces = json_str.count("{") - json_str.count("}")
        open_brackets = json_str.count("[") - json_str.count("]")

        # Check if we're in the middle of a string
        quote_count = json_str.count('"')
        in_string = (quote_count % 2) != 0

        result = json_str

        # Close string if needed
        if in_string:
            result += '"'

        # Close brackets first (inner structures)
        result += "]" * open_brackets

        # Close braces
        result += "}" * open_braces

        return result

    async def _call_openai_with_tools(
        self, client, system_message, messages, tools, max_tokens
    ):
        """Call OpenAI API with robust JSON error handling and retry mechanism"""
        openai_tools = []
        for tool in tools:
            openai_tools.append(
                {
                    "type": "function",
                    "function": {
                        "name": tool["name"],
                        "description": tool["description"],
                        "parameters": tool["input_schema"],
                    },
                }
            )

        openai_messages = [{"role": "system", "content": system_message}]
        openai_messages.extend(messages)

        # Retry mechanism for API calls
        max_retries = 3
        retry_delay = 2  # seconds

        # Use implementation-specific model for code generation
        impl_model = self.default_models.get(
            "openai_implementation", self.default_models["openai"]
        )
        self.logger.info(f"🔧 Code generation using model: {impl_model}")

        for attempt in range(max_retries):
            try:
                # Try max_tokens first, fallback to max_completion_tokens if unsupported
                try:
                    response = await client.chat.completions.create(
                        model=impl_model,
                        messages=openai_messages,
                        tools=openai_tools if openai_tools else None,
                        max_tokens=max_tokens,
                        temperature=0.2,
                    )
                except Exception as e:
                    if "max_tokens" in str(e) and "max_completion_tokens" in str(e):
                        # Retry with max_completion_tokens for models that require it
                        response = await client.chat.completions.create(
                            model=impl_model,
                            messages=openai_messages,
                            tools=openai_tools if openai_tools else None,
                            max_completion_tokens=max_tokens,
                        )
                    else:
                        raise

                # Validate response structure
                if (
                    not response
                    or not hasattr(response, "choices")
                    or not response.choices
                ):
                    raise ValueError("Invalid API response: missing choices")

                if not response.choices[0] or not hasattr(
                    response.choices[0], "message"
                ):
                    raise ValueError("Invalid API response: missing message in choice")

                message = response.choices[0].message
                content = message.content or ""

                # Successfully got a valid response
                break

            except json.JSONDecodeError as e:
                print(
                    f"\n❌ JSON Decode Error in API response (attempt {attempt + 1}/{max_retries}):"
                )
                print(f"   Error: {e}")
                print(f"   Position: line {e.lineno}, column {e.colno}")

                if attempt < max_retries - 1:
                    print(f"   ⏳ Retrying in {retry_delay} seconds...")
                    await asyncio.sleep(retry_delay)
                    retry_delay *= 2  # Exponential backoff
                else:
                    print("   ❌ All retries exhausted")
                    raise

            except (ValueError, AttributeError, TypeError) as e:
                print(f"\n❌ API Response Error (attempt {attempt + 1}/{max_retries}):")
                print(f"   Error type: {type(e).__name__}")
                print(f"   Error: {e}")

                if attempt < max_retries - 1:
                    print(f"   ⏳ Retrying in {retry_delay} seconds...")
                    await asyncio.sleep(retry_delay)
                    retry_delay *= 2
                else:
                    print("   ❌ All retries exhausted")
                    # Return empty response instead of crashing
                    return {
                        "content": "API error - unable to get valid response",
                        "tool_calls": [],
                    }

            except Exception as e:
                print(
                    f"\n❌ Unexpected API Error (attempt {attempt + 1}/{max_retries}):"
                )
                print(f"   Error type: {type(e).__name__}")
                print(f"   Error: {e}")

                if attempt < max_retries - 1:
                    print(f"   ⏳ Retrying in {retry_delay} seconds...")
                    await asyncio.sleep(retry_delay)
                    retry_delay *= 2
                else:
                    print("   ❌ All retries exhausted")
                    raise

        tool_calls = []
        if message.tool_calls:
            for tool_call in message.tool_calls:
                try:
                    # Attempt to parse tool call arguments
                    parsed_input = json.loads(tool_call.function.arguments)
                    tool_calls.append(
                        {
                            "id": tool_call.id,
                            "name": tool_call.function.name,
                            "input": parsed_input,
                        }
                    )
                except json.JSONDecodeError as e:
                    # Detailed JSON parsing error logging
                    print("\n❌ JSON Parsing Error in tool call:")
                    print(f"   Tool: {tool_call.function.name}")
                    print(f"   Error: {e}")
                    print("   Raw arguments (first 500 chars):")
                    print(f"   {tool_call.function.arguments[:500]}")
                    print(f"   Error position: line {e.lineno}, column {e.colno}")
                    print(
                        f"   Problem at: ...{tool_call.function.arguments[max(0, e.pos-50):e.pos+50]}..."
                    )

                    # Attempt advanced JSON repair
                    repaired = self._repair_truncated_json(
                        tool_call.function.arguments, tool_call.function.name
                    )

                    if repaired:
                        print("   ✅ JSON repaired successfully")
                        tool_calls.append(
                            {
                                "id": tool_call.id,
                                "name": tool_call.function.name,
                                "input": repaired,
                            }
                        )
                    else:
                        # Skip this tool call if repair failed
                        print("   ⚠️  Skipping unrepairable tool call")
                        continue

        # Extract token usage and calculate cost
        token_usage = {}
        cost = 0.0
        
        if hasattr(response, 'usage') and response.usage:
            token_usage = {
                "prompt_tokens": response.usage.prompt_tokens,
                "completion_tokens": response.usage.completion_tokens,
                "total_tokens": response.usage.total_tokens
            }
            
            # Use dynamic cost calculation based on current model
            from utils.model_limits import calculate_token_cost
            cost = calculate_token_cost(
                response.usage.prompt_tokens,
                response.usage.completion_tokens,
                model_name=self.default_models.get("openai")
            )
            
            print(f"💰 Tokens: {token_usage['total_tokens']} (${cost:.4f})")
            self.logger.info(f"Token usage: {token_usage['prompt_tokens']} prompt + {token_usage['completion_tokens']} completion = {token_usage['total_tokens']} total (${cost:.4f})")

        return {
            "content": content, 
            "tool_calls": tool_calls,
            "token_usage": token_usage,
            "cost": cost
        }

    # ==================== 5. Tools and Utility Methods (Utility Layer) ====================

    def _validate_messages(self, messages: List[Dict]) -> List[Dict]:
        """Validate and clean message list"""
        valid_messages = []
        for msg in messages:
            content = msg.get("content", "").strip()
            if content:
                valid_messages.append(
                    {"role": msg.get("role", "user"), "content": content}
                )
            else:
                self.logger.warning(f"Skipping empty message: {msg}")
        return valid_messages

    def _prepare_mcp_tool_definitions(self) -> List[Dict[str, Any]]:
        """Return the tool definitions registered under "code_implementation".

        Thin wrapper around ``get_mcp_tools``; the result is passed through
        unchanged.  (Previously documented as being in Anthropic API tool
        format - not verifiable from this method alone.)
        """
        tool_definitions = get_mcp_tools("code_implementation")
        return tool_definitions

    def _check_tool_results_for_errors(self, tool_results: List[Dict]) -> bool:
        """Check tool results for errors with JSON repair capability"""
        for result in tool_results:
            try:
                if hasattr(result["result"], "content") and result["result"].content:
                    content_text = result["result"].content[0].text

                    # First attempt: try direct JSON parsing
                    try:
                        parsed_result = json.loads(content_text)
                        if parsed_result.get("status") == "error":
                            return True
                    except json.JSONDecodeError as e:
                        # JSON parsing failed - try to repair
                        print("\n⚠️  JSON parsing failed in tool result check:")
                        print(f"   Error: {e}")
                        print(
                            f"   Position: line {e.lineno}, column {e.colno}, char {e.pos}"
                        )
                        print(f"   Content length: {len(content_text)} chars")
                        print(f"   First 300 chars: {content_text[:300]}")

                        # Attempt to repair the JSON
                        repaired = self._repair_truncated_json(content_text)
                        if repaired:
                            print("   ✅ Tool result JSON repaired successfully")
                            if repaired.get("status") == "error":
                                return True
                        else:
                            # Fallback: check for "error" keyword in text
                            if "error" in content_text.lower():
                                return True

                elif isinstance(result["result"], str):
                    if "error" in result["result"].lower():
                        return True

            except (AttributeError, IndexError) as e:
                # Unexpected result structure
                print(f"\n⚠️  Unexpected result structure: {type(e).__name__}: {e}")
                result_str = str(result["result"])
                if "error" in result_str.lower():
                    return True
        return False

    # ==================== 6. User Interaction and Feedback (Interaction Layer) ====================

    def _generate_success_guidance(self, files_count: int) -> str:
        """Generate concise success guidance for continuing implementation"""
        return f"""✅ File implementation completed successfully!

📊 **Progress Status:** {files_count} files implemented

🎯 **Next Action:** Check if ALL files from the reproduction plan are implemented.

⚡ **Decision Process:**
1. **If ALL files implemented:** Reply with "All files implemented" to complete the task
2. **If MORE files need implementation:** Continue with dependency-aware workflow:
   - **Use `write_file` to implement the new component"""

    def _generate_error_guidance(self) -> str:
        """Generate error guidance for handling issues"""
        return """❌ Error detected during file implementation.

🔧 **Action Required:**
1. Review the error details above
2. Fix the identified issue
3. **Check if ALL files from the reproduction plan are implemented:**
   - **If YES:** Respond "**implementation complete**" to end the conversation
   - **If NO:** Continue with proper development cycle for next file:
     - **Use `write_file` to implement properly
4. Ensure proper error handling in future implementations"""

    def _generate_no_tools_guidance(self, files_count: int) -> str:
        """Generate concise guidance when no tools are called"""
        return f"""⚠️ No tool calls detected in your response.

📊 **Current Progress:** {files_count} files implemented

🚨 **Action Required:** Check completion status NOW:

⚡ **Decision Process:**
1. **If ALL files from plan are implemented:** Reply "All files implemented" to complete
2. **If MORE files need implementation:** Use tools to continue:
   - **Use `write_file` to implement the new component

🚨 **Critical:** Don't just explain - either declare completion or use tools!"""

    def _compile_user_response(self, tool_results: List[Dict], guidance: str) -> str:
        """Compile tool results and guidance into a single user response"""
        response_parts = []

        if tool_results:
            response_parts.append("🔧 **Tool Execution Results:**")
            for tool_result in tool_results:
                tool_name = tool_result["tool_name"]
                result_content = tool_result["result"]
                response_parts.append(
                    f"```\nTool: {tool_name}\nResult: {result_content}\n```"
                )

        if guidance:
            response_parts.append("\n" + guidance)

        return "\n\n".join(response_parts)

    # ==================== 7. Reporting and Output (Output Layer) ====================

    async def _generate_pure_code_final_report_with_concise_agents(
        self,
        iterations: int,
        elapsed_time: float,
        code_agent: CodeImplementationAgent,
        memory_agent: ConciseMemoryAgent,
    ):
        """Generate final report using concise agent statistics"""
        try:
            code_stats = code_agent.get_implementation_statistics()
            memory_stats = memory_agent.get_memory_statistics(
                code_stats["files_implemented_count"]
            )

            if self.mcp_agent:
                history_result = await self.mcp_agent.call_tool(
                    "get_operation_history", {"last_n": 30}
                )
                history_data = (
                    json.loads(history_result)
                    if isinstance(history_result, str)
                    else history_result
                )
            else:
                history_data = {"total_operations": 0, "history": []}

            write_operations = 0
            files_created = []
            if "history" in history_data:
                for item in history_data["history"]:
                    if item.get("action") == "write_file":
                        write_operations += 1
                        file_path = item.get("details", {}).get("file_path", "unknown")
                        files_created.append(file_path)

            report = f"""
# Pure Code Implementation Completion Report (Write-File-Based Memory Mode)

## Execution Summary
- Implementation iterations: {iterations}
- Total elapsed time: {elapsed_time:.2f} seconds
- Files implemented: {code_stats['total_files_implemented']}
- File write operations: {write_operations}
- Total MCP operations: {history_data.get('total_operations', 0)}

## Read Tools Configuration
- Read tools enabled: {code_stats['read_tools_status']['read_tools_enabled']}
- Status: {code_stats['read_tools_status']['status']}
- Tools affected: {', '.join(code_stats['read_tools_status']['tools_affected'])}

## Agent Performance
### Code Implementation Agent
- Files tracked: {code_stats['files_implemented_count']}
- Technical decisions: {code_stats['technical_decisions_count']}
- Constraints tracked: {code_stats['constraints_count']}
- Architecture notes: {code_stats['architecture_notes_count']}
- Dependency analysis performed: {code_stats['dependency_analysis_count']}
- Files read for dependencies: {code_stats['files_read_for_dependencies']}
- Last summary triggered at file count: {code_stats['last_summary_file_count']}

### Concise Memory Agent (Write-File-Based)
- Last write_file detected: {memory_stats['last_write_file_detected']}
- Should clear memory next: {memory_stats['should_clear_memory_next']}
- Files implemented count: {memory_stats['implemented_files_tracked']}
- Current round: {memory_stats['current_round']}
- Concise mode active: {memory_stats['concise_mode_active']}
- Current round tool results: {memory_stats['current_round_tool_results']}
- Essential tools recorded: {memory_stats['essential_tools_recorded']}

## Files Created
"""
            for file_path in files_created[-20:]:
                report += f"- {file_path}\n"

            if len(files_created) > 20:
                report += f"... and {len(files_created) - 20} more files\n"

            report += """
## Architecture Features
✅ WRITE-FILE-BASED Memory Agent - Clear after each file generation
✅ After write_file: Clear history → Keep system prompt + initial plan + tool results
✅ Tool accumulation: read_code_mem, read_file, search_reference_code until next write_file
✅ Clean memory cycle: write_file → clear → accumulate → write_file → clear
✅ Essential tool recording with write_file detection
✅ Specialized agent separation for clean code organization
✅ MCP-compliant tool execution
✅ Production-grade code with comprehensive type hints
✅ Intelligent dependency analysis and file reading
✅ Automated read_file usage for implementation context
✅ Eliminates conversation clutter between file generations
✅ Focused memory for efficient next file generation
"""
            return report

        except Exception as e:
            self.logger.error(f"Failed to generate final report: {e}")
            return f"Failed to generate final report: {str(e)}"


async def main():
    """Run the implementation workflow once against a hard-coded sample plan.

    Sets up root logging if nothing has configured it yet, prints the
    (currently non-interactive) menu, and runs ``run_workflow`` in pure code
    mode on ``<cwd>/deepcode_lab/papers/2/initial_plan.txt``, printing a
    summary of the result.
    """
    # Attach a handler only when the root logger has none, to avoid duplicates.
    root_logger = logging.getLogger()
    if not root_logger.handlers:
        stream_handler = logging.StreamHandler()
        stream_handler.setFormatter(
            logging.Formatter("%(levelname)s:%(name)s:%(message)s")
        )
        root_logger.addHandler(stream_handler)
        root_logger.setLevel(logging.INFO)

    workflow = CodeImplementationWorkflow()

    banner = "=" * 60
    print(banner)
    print("Code Implementation Workflow with UNIFIED Reference Indexer")
    print(banner)
    print("Select mode:")
    print("1. Test Code Reference Indexer Integration")
    print("2. Run Full Implementation Workflow")
    print("3. Run Implementation with Pure Code Mode")
    print("4. Test Read Tools Configuration")

    # NOTE: interactive mode selection (including the read-tools
    # configuration test for choice 4) is disabled; no input is read and the
    # indexer integration test is not executed - its outcome is hard-coded.
    test_success = True
    if not test_success:
        print("\n" + banner)
        print("❌ Code Reference Indexer Integration Test FAILED!")
        print("Please check the configuration and try again.")
        print(banner)
        return

    print("\n" + banner)
    print("🎉 UNIFIED Code Reference Indexer Integration Test PASSED!")
    print("🔧 Three-step process successfully merged into ONE tool")
    print(banner)

    print("\nContinuing with workflow execution...")

    target_directory = os.path.join(os.getcwd(), "deepcode_lab", "papers", "2")
    plan_file = os.path.join(target_directory, "initial_plan.txt")
    print("Implementation Mode Selection:")
    print("1. Pure Code Implementation Mode (Recommended)")
    print("2. Iterative Implementation Mode")

    pure_code_mode = True
    mode_name = "Pure Code Implementation Mode with Memory Agent Architecture + Code Reference Indexer"
    print(f"Using: {mode_name}")

    # Flip to False to run without the read_file and read_code_mem tools.
    enable_read_tools = True
    read_tools_status = "ENABLED" if enable_read_tools else "DISABLED"
    print(f"🔧 Read tools (read_file, read_code_mem): {read_tools_status}")

    result = await workflow.run_workflow(
        plan_file,
        target_directory=target_directory,
        pure_code_mode=pure_code_mode,
        enable_read_tools=enable_read_tools,
    )

    print(banner)
    print("Workflow Execution Results:")
    print(f"Status: {result['status']}")
    print(f"Mode: {mode_name}")

    if result["status"] != "success":
        print(f"Error Message: {result['message']}")
    else:
        print(f"Code Directory: {result['code_directory']}")
        print(f"MCP Architecture: {result.get('mcp_architecture', 'unknown')}")
        print("Execution completed!")

    print(banner)
    print(
        "✅ Using Standard MCP Architecture with Memory Agent + Code Reference Indexer"
    )


# Script entry point: when executed directly, run the async main() to completion.
if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: workflows/code_implementation_workflow_index.py
================================================
"""
Paper Code Implementation Workflow - MCP-compliant Iterative Development

Features:
1. File Tree Creation
2. Code Implementation - Based on aisi-basic-agent iterative development

MCP Architecture:
- MCP Server: tools/code_implementation_server.py
- MCP Client: Called through mcp_agent framework
- Configuration: mcp_agent.config.yaml
"""

import asyncio
import json
import logging
import os
import sys
import time
from pathlib import Path
from typing import Dict, Any, Optional, List

# MCP Agent imports
from mcp_agent.agents.agent import Agent

# Local imports
sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from prompts.code_prompts import STRUCTURE_GENERATOR_PROMPT
from prompts.code_prompts import (
    PURE_CODE_IMPLEMENTATION_SYSTEM_PROMPT_INDEX,
)
from workflows.agents import CodeImplementationAgent
from workflows.agents.memory_agent_concise import ConciseMemoryAgent
from config.mcp_tool_definitions_index import get_mcp_tools
from utils.llm_utils import get_preferred_llm_class, get_default_models, load_api_config
# DialogueLogger removed - no longer needed


class CodeImplementationWorkflowWithIndex:
    """
    Paper Code Implementation Workflow Manager with Code Reference Indexer

    Uses standard MCP architecture with enhanced indexing capabilities:
    1. Connect to code-implementation server via MCP client
    2. Use MCP protocol for tool calls
    3. Support workspace management and operation history tracking
    4. Integrated code reference indexer for enhanced code understanding
    """

    # ==================== 1. Class Initialization and Configuration (Infrastructure Layer) ====================

    def __init__(self, config_path: str = "mcp_agent.secrets.yaml"):
        """Set up configuration, logging and helper objects for the workflow.

        Args:
            config_path: Path to the secrets YAML file.  The main config
                (``mcp_agent.config.yaml``) is looked up in the same directory.

        Raises:
            Exception: Propagated from ``_load_api_config`` when the API
                configuration cannot be loaded.
        """
        # Plain defaults; neither depends on the configuration files.
        self.mcp_agent = None
        self.enable_read_tools = True  # overwritten by run_workflow() on each call

        self.config_path = config_path
        # The main config path is derived from the secrets file's directory.
        config_dir = os.path.dirname(os.path.abspath(config_path))
        self.main_config_path = os.path.join(config_dir, "mcp_agent.config.yaml")

        self.api_config = self._load_api_config()
        self.default_models = get_default_models(self.main_config_path)
        self.logger = self._create_logger()

        # NOTE(review): LoopDetector and ProgressTracker do not appear in this
        # module's import block - confirm they are in scope, otherwise these
        # two lines raise NameError on instantiation.
        self.loop_detector = LoopDetector()
        self.progress_tracker = ProgressTracker()

    def _load_api_config(self) -> Dict[str, Any]:
        """Load API configuration with environment variable override."""
        try:
            return load_api_config(self.config_path)
        except Exception as e:
            raise Exception(f"Failed to load API config: {e}")

    def _create_logger(self) -> logging.Logger:
        """Create and configure logger"""
        logger = logging.getLogger(__name__)
        # Don't add handlers to child loggers - let them propagate to root
        logger.setLevel(logging.INFO)
        return logger

    def _read_plan_file(self, plan_file_path: str) -> str:
        """Read implementation plan file"""
        plan_path = Path(plan_file_path)
        if not plan_path.exists():
            raise FileNotFoundError(
                f"Implementation plan file not found: {plan_file_path}"
            )

        with open(plan_path, "r", encoding="utf-8") as f:
            return f.read()

    def _check_file_tree_exists(self, target_directory: str) -> bool:
        """Check if file tree structure already exists"""
        code_directory = os.path.join(target_directory, "generate_code")
        return os.path.exists(code_directory) and len(os.listdir(code_directory)) > 0

    # ==================== 2. Public Interface Methods (External API Layer) ====================

    async def run_workflow(
        self,
        plan_file_path: str,
        target_directory: Optional[str] = None,
        pure_code_mode: bool = False,
        enable_read_tools: bool = True,
    ):
        """Run complete workflow - Main public interface"""
        # Set the read tools configuration
        self.enable_read_tools = enable_read_tools

        try:
            plan_content = self._read_plan_file(plan_file_path)

            if target_directory is None:
                target_directory = str(Path(plan_file_path).parent)

            # Calculate code directory for workspace alignment
            code_directory = os.path.join(target_directory, "generate_code")

            self.logger.info("=" * 80)
            self.logger.info("🚀 STARTING CODE IMPLEMENTATION WORKFLOW")
            self.logger.info("=" * 80)
            self.logger.info(f"📄 Plan file: {plan_file_path}")
            self.logger.info(f"📂 Plan file parent: {target_directory}")
            self.logger.info(f"🎯 Code directory (MCP workspace): {code_directory}")
            self.logger.info(
                f"⚙️  Read tools: {'ENABLED' if self.enable_read_tools else 'DISABLED'}"
            )
            self.logger.info("=" * 80)

            results = {}

            # Check if file tree exists
            if self._check_file_tree_exists(target_directory):
                self.logger.info("File tree exists, skipping creation")
                results["file_tree"] = "Already exists, skipped creation"
            else:
                self.logger.info("Creating file tree...")
                results["file_tree"] = await self.create_file_structure(
                    plan_content, target_directory
                )

            # Code implementation
            if pure_code_mode:
                self.logger.info("Starting pure code implementation...")
                results["code_implementation"] = await self.implement_code_pure(
                    plan_content, target_directory, code_directory
                )
            else:
                pass

            self.logger.info("Workflow execution successful")

            return {
                "status": "success",
                "plan_file": plan_file_path,
                "target_directory": target_directory,
                "code_directory": os.path.join(target_directory, "generate_code"),
                "results": results,
                "mcp_architecture": "standard",
            }

        except Exception as e:
            self.logger.error(f"Workflow execution failed: {e}")

            return {"status": "error", "message": str(e), "plan_file": plan_file_path}
        finally:
            await self._cleanup_mcp_agent()

    async def create_file_structure(
        self, plan_content: str, target_directory: str
    ) -> str:
        """Create file tree structure based on implementation plan"""
        self.logger.info("Starting file tree creation...")

        structure_agent = Agent(
            name="StructureGeneratorAgent",
            instruction=STRUCTURE_GENERATOR_PROMPT,
            server_names=["command-executor"],
        )

        async with structure_agent:
            creator = await structure_agent.attach_llm(
                get_preferred_llm_class(self.config_path)
            )

            message = f"""Analyze the following implementation plan and generate shell commands to create the file tree structure.

Target Directory: {target_directory}/generate_code

Implementation Plan:
{plan_content}

Tasks:
1. Find the file tree structure in the implementation plan
2. Generate shell commands (mkdir -p, touch) to create that structure
3. Use the execute_commands tool to run the commands and create the file structure

Requirements:
- Use mkdir -p to create directories
- Use touch to create files
- Include __init__.py file for Python packages
- Use relative paths to the target directory
- Execute commands to actually create the file structure"""

            result = await creator.generate_str(message=message)
            self.logger.info("File tree structure creation completed")
            return result

    async def implement_code_pure(
        self, plan_content: str, target_directory: str, code_directory: str = None
    ) -> str:
        """Pure code implementation - focus on code writing without testing"""
        self.logger.info("Starting pure code implementation (no testing)...")

        # Use provided code_directory or calculate it (for backwards compatibility)
        if code_directory is None:
            code_directory = os.path.join(target_directory, "generate_code")

        self.logger.info(f"🎯 Using code directory (MCP workspace): {code_directory}")

        if not os.path.exists(code_directory):
            self.logger.warning(
                f"Code directory does not exist, creating it: {code_directory}"
            )
            os.makedirs(code_directory, exist_ok=True)
            self.logger.info(f"✅ Code directory created: {code_directory}")

        try:
            client, client_type = await self._initialize_llm_client()
            await self._initialize_mcp_agent(code_directory)

            tools = self._prepare_mcp_tool_definitions()
            system_message = PURE_CODE_IMPLEMENTATION_SYSTEM_PROMPT_INDEX
            messages = []

            #             implementation_message = f"""**TASK: Implement Research Paper Reproduction Code**

            # You are implementing a complete, working codebase that reproduces the core algorithms, experiments, and methods described in a research paper. Your goal is to create functional code that can replicate the paper's key results and contributions.

            # **What you need to do:**
            # - Analyze the paper content and reproduction plan to understand requirements
            # - Implement all core algorithms mentioned in the main body of the paper
            # - Create the necessary components following the planned architecture
            # - Test each component to ensure functionality
            # - Integrate components into a cohesive, executable system
            # - Focus on reproducing main contributions rather than appendix-only experiments

            # **RESOURCES:**
            # - **Paper & Reproduction Plan**: `{target_directory}/` (contains .md paper files and initial_plan.txt with detailed implementation guidance)
            # - **Reference Code Indexes**: `{target_directory}/indexes/` (JSON files with implementation patterns from related codebases)
            # - **Implementation Directory**: `{code_directory}/` (your working directory for all code files)

            # **CURRENT OBJECTIVE:**
            # Start by reading the reproduction plan (`{target_directory}/initial_plan.txt`) to understand the implementation strategy, then examine the paper content to identify the first priority component to implement. Use the search_code tool to find relevant reference implementations from the indexes directory (`{target_directory}/indexes/*.json`) before coding.

            # ---
            # **START:** Review the plan above and begin implementation."""
            implementation_message = f"""**Task: Implement code based on the following reproduction plan**

**Code Reproduction Plan:**
{plan_content}

**Working Directory:** {code_directory}

**Current Objective:** Begin implementation by analyzing the plan structure, examining the current project layout, and implementing the first foundation file according to the plan's priority order."""

            messages.append({"role": "user", "content": implementation_message})

            result = await self._pure_code_implementation_loop(
                client,
                client_type,
                system_message,
                messages,
                tools,
                plan_content,
                target_directory,
            )

            return result

        finally:
            await self._cleanup_mcp_agent()

    # ==================== 3. Core Business Logic (Implementation Layer) ====================

    async def _pure_code_implementation_loop(
        self,
        client,
        client_type,
        system_message,
        messages,
        tools,
        plan_content,
        target_directory,
    ):
        """Drive the iterative LLM/tool loop that implements the plan's files.

        Each iteration validates the message history, asks the LLM for the
        next step, executes any requested tool calls through the code agent,
        appends the compiled tool results (or a "no tools" nudge) as the next
        user message, and lets the concise memory agent compact the history.
        The loop ends when the memory agent reports no unimplemented files,
        after ``max_iterations`` rounds, or once ``max_time`` seconds have
        elapsed.

        Args:
            client: Provider client forwarded to ``_call_llm_with_tools``.
            client_type: Provider identifier forwarded to
                ``_call_llm_with_tools`` and to the code agent.
            system_message: Not referenced in this body; every LLM call uses
                ``code_agent.get_system_prompt()`` instead.
            messages: Initial conversation. The name is rebound on every
                iteration (validated, appended to, possibly replaced by the
                memory agent's optimized history).
            tools: Tool definitions forwarded to the LLM call.
            plan_content: Reproduction plan text handed to the memory agent.
            target_directory: Base directory; its ``generate_code``
                subdirectory is passed to the memory agent as the code
                directory.

        Returns:
            The value returned by
            ``_generate_pure_code_final_report_with_concise_agents`` for the
            final iteration count and elapsed time.
        """
        max_iterations = 800
        iteration = 0
        start_time = time.time()
        max_time = 7200  # 120 minutes (2 hours)

        # Code agent executes the tool calls requested by the LLM.
        code_agent = CodeImplementationAgent(
            self.mcp_agent, self.logger, self.enable_read_tools
        )

        # Memory agent receives the plan plus both directories (the code
        # directory is passed for file extraction, per the original note).
        code_directory = os.path.join(target_directory, "generate_code")
        memory_agent = ConciseMemoryAgent(
            plan_content,
            self.logger,
            target_directory,
            self.default_models,
            code_directory,
        )

        # Log read tools configuration
        read_tools_status = "ENABLED" if self.enable_read_tools else "DISABLED"
        self.logger.info(
            f"🔧 Read tools (read_file, read_code_mem): {read_tools_status}"
        )
        if not self.enable_read_tools:
            self.logger.info(
                "🚫 No read mode: read_file and read_code_mem tools will be skipped"
            )

        # Connect code agent with memory agent for summary generation
        # Note: Concise memory agent doesn't need LLM client for summary generation
        code_agent.set_memory_agent(memory_agent, client, client_type)

        # Initialize memory agent with iteration 0
        memory_agent.start_new_round(iteration=0)

        while iteration < max_iterations:
            # The counter is bumped before the time check, so an iteration
            # aborted by the time limit is still included in the final count.
            iteration += 1
            elapsed_time = time.time() - start_time

            if elapsed_time > max_time:
                self.logger.warning(f"Time limit reached: {elapsed_time:.2f}s")
                break

            # Disabled experiment (kept for reference):
            # # Test simplified memory approach if we have files implemented
            # if iteration == 5 and code_agent.get_files_implemented_count() > 0:
            #     self.logger.info("🧪 Testing simplified memory approach...")
            #     test_results = await memory_agent.test_simplified_memory_approach()
            #     self.logger.info(f"Memory test results: {test_results}")

            # self.logger.info(f"Pure code implementation iteration {iteration}: generating code")

            # Re-validate the history each round and fetch the system prompt
            # from the code agent (the `system_message` argument is unused).
            messages = self._validate_messages(messages)
            current_system_message = code_agent.get_system_prompt()

            # Call LLM
            response = await self._call_llm_with_tools(
                client, client_type, current_system_message, messages, tools
            )

            # Substitute a placeholder so the assistant turn is never empty.
            response_content = response.get("content", "").strip()
            if not response_content:
                response_content = "Continue implementing code files..."

            messages.append({"role": "assistant", "content": response_content})

            # Handle tool calls
            if response.get("tool_calls"):
                tool_results = await code_agent.execute_tool_calls(
                    response["tool_calls"]
                )

                # Record essential tool results in concise memory agent.
                # zip() pairs each call with its result positionally.
                for tool_call, tool_result in zip(response["tool_calls"], tool_results):
                    memory_agent.record_tool_result(
                        tool_name=tool_call["name"],
                        tool_input=tool_call["input"],
                        tool_result=tool_result.get("result"),
                    )

                # Pick the follow-up guidance: error guidance if any tool
                # result is flagged as an error, success guidance otherwise.
                has_error = self._check_tool_results_for_errors(tool_results)
                files_count = code_agent.get_files_implemented_count()

                if has_error:
                    guidance = self._generate_error_guidance()
                else:
                    guidance = self._generate_success_guidance(files_count)

                # Tool results are fed back to the model as a user message.
                compiled_response = self._compile_user_response(tool_results, guidance)
                messages.append({"role": "user", "content": compiled_response})

                # Ask the memory agent whether the history should be compacted
                # now (per the original note: right after a write_file call).
                if memory_agent.should_trigger_memory_optimization(
                    messages, code_agent.get_files_implemented_count()
                ):
                    # Replace the history with the memory agent's optimized one.
                    files_implemented_count = code_agent.get_files_implemented_count()
                    current_system_message = code_agent.get_system_prompt()
                    messages = memory_agent.apply_memory_optimization(
                        current_system_message, messages, files_implemented_count
                    )

            else:
                # No tool call was requested: nudge the model with guidance.
                files_count = code_agent.get_files_implemented_count()
                no_tools_guidance = self._generate_no_tools_guidance(files_count)
                messages.append({"role": "user", "content": no_tools_guidance})

            # Disabled analysis-loop detection (kept for reference):
            # if code_agent.is_in_analysis_loop():
            #     analysis_loop_guidance = code_agent.get_analysis_loop_guidance()
            #     messages.append({"role": "user", "content": analysis_loop_guidance})
            #     self.logger.warning(
            #         "Analysis loop detected and corrective guidance provided"
            #     )

            # Record file implementations in memory agent (for the current round).
            # Every file in the summary's "completed_files" list is reported on
            # each iteration, not only the ones added this round.
            for file_info in code_agent.get_implementation_summary()["completed_files"]:
                memory_agent.record_file_implementation(file_info["file"])

            # Start new round for next iteration, sync with workflow iteration
            memory_agent.start_new_round(iteration=iteration)

            # Check completion based on actual unimplemented files list
            unimplemented_files = memory_agent.get_unimplemented_files()
            if not unimplemented_files:  # Empty list means all files implemented
                self.logger.info(
                    "✅ Code implementation complete - All files implemented"
                )
                break

            # Emergency trim: compact the history if it grew past 50 messages
            # without the regular optimization having been triggered.
            if len(messages) > 50:
                self.logger.warning(
                    "Emergency message trim - applying concise memory optimization"
                )

                current_system_message = code_agent.get_system_prompt()
                files_implemented_count = code_agent.get_files_implemented_count()
                messages = memory_agent.apply_memory_optimization(
                    current_system_message, messages, files_implemented_count
                )

        return await self._generate_pure_code_final_report_with_concise_agents(
            iteration, time.time() - start_time, code_agent, memory_agent
        )

    # ==================== 4. MCP Agent and LLM Communication Management (Communication Layer) ====================

    async def _initialize_mcp_agent(self, code_directory: str):
        """Create the MCP agent, open its session and point it at the workspace.

        The agent is stored on ``self.mcp_agent``, entered via ``__aenter__``,
        given an LLM of the class chosen by ``get_preferred_llm_class`` and
        finally told (through the ``set_workspace`` tool) to work inside
        ``code_directory``.

        Args:
            code_directory: Path sent to the ``set_workspace`` tool.

        Returns:
            The object returned by ``attach_llm``.

        Raises:
            Exception: Any failure is logged and re-raised after a best-effort
                ``__aexit__`` on the agent; ``self.mcp_agent`` is reset to
                ``None`` in that case.
        """
        agent_instruction = "You are a code implementation assistant, using MCP tools to implement paper code replication. For large documents, use document-segmentation tools to read content in smaller chunks to avoid token limits."
        mcp_servers = [
            "code-implementation",
            "code-reference-indexer",
            "document-segmentation",
        ]

        try:
            self.mcp_agent = Agent(
                name="CodeImplementationAgent",
                instruction=agent_instruction,
                server_names=mcp_servers,
            )
            await self.mcp_agent.__aenter__()

            llm_class = get_preferred_llm_class(self.config_path)
            attached_llm = await self.mcp_agent.attach_llm(llm_class)

            # Set workspace to the target code directory
            setup_outcome = await self.mcp_agent.call_tool(
                "set_workspace", {"workspace_path": code_directory}
            )
            self.logger.info(f"Workspace setup result: {setup_outcome}")
        except Exception as init_error:
            self.logger.error(f"Failed to initialize MCP agent: {init_error}")
            if self.mcp_agent:
                # Best-effort teardown: a failure while closing must not mask
                # the original initialization error re-raised below.
                try:
                    await self.mcp_agent.__aexit__(None, None, None)
                except Exception:
                    pass
                self.mcp_agent = None
            raise
        else:
            return attached_llm

    async def _cleanup_mcp_agent(self):
        """Clean up MCP agent resources"""
        if self.mcp_agent:
            try:
                await self.mcp_agent.__aexit__(None, None, None)
                self.logger.info("MCP agent connection closed")
            except Exception as e:
                self.logger.warning(f"Error closing MCP agent: {e}")
            finally:
                self.mcp_agent = None

    async def _initialize_llm_client(self):
        """Initialize LLM client based on llm_provider preference and API key availability"""
        # Get API keys
        anthropic_key = self.api_config.get("anthropic", {}).get("api_key", "")
        openai_key = self.api_config.get("openai", {}).get("api_key", "")
        google_key = self.api_config.get("google", {}).get("api_key", "")

        # Read user preference from main config
        preferred_provider = None
        try:
            import yaml

            # Derive config path from secrets path (same directory)
            secrets_dir = os.path.dirname(os.path.abspath(self.config_path))
            config_path = os.path.join(secrets_dir, "mcp_agent.config.yaml")
            if os.path.exists(config_path):
                with open(config_path, "r", encoding="utf-8") as f:
                    config = yaml.safe_load(f)
                    preferred_provider = config.get("llm_provider", "").strip().lower()
        except Exception as e:
            self.logger.warning(f"Could not read llm_provider preference: {e}")

        # Define provider initialization functions
        async def init_anthropic():
            if not (anthropic_key and anthropic_key.strip()):
                return None
            try:
                from anthropic import AsyncAnthropic

                client = AsyncAnthropic(api_key=anthropic_key)
                await client.messages.create(
                    model=self.default_models["anthropic"],
                    max_tokens=20,
                    messages=[{"role": "user", "content": "test"}],
                )
                self.logger.info(
                    f"Using Anthropic API with model: {self.default_models['anthropic']}"
                )
                return client, "anthropic"
            except Exception as e:
                self.logger.warning(f"Anthropic API unavailable: {e}")
                return None

        async def init_google():
            if not (google_key and google_key.strip()):
                return None
            try:
                from google import genai

                client = genai.Client(api_key=google_key)
                try:
                    test_response = await client.aio.models.generate_content(
                        model=self.default_models.get("google", "gemini-2.0-flash"),
                        contents="test",
                    )

                    self.logger.info(
                        "Google API connection successful: " + str(test_response)
                    )
                except Exception as test_err:
                    self.logger.warning(
                        f"Could not test Google API: {test_err}, but will try to use client"
                    )

                self.logger.info(
                    f"Using Google API with model: {self.default_models.get('google', 'gemini-2.0-flash')}"
                )
                return client, "google"
            except Exception as e:
                self.logger.warning(f"Google API unavailable: {e}")
                return None

        async def init_openai():
            if not (openai_key and openai_key.strip()):
                return None
            try:
                from openai import AsyncOpenAI

                openai_config = self.api_config.get("openai", {})
                base_url = openai_config.get("base_url")

                if base_url:
                    client = AsyncOpenAI(api_key=openai_key, base_url=base_url)
                else:
                    client = AsyncOpenAI(api_key=openai_key)

                model_name = self.default_models.get("openai", "o3-mini")

                try:
                    await client.chat.completions.create(
                        model=model_name,
                        max_tokens=20,
                        messages=[{"role": "user", "content": "test"}],
                    )
                except Exception as e:
                    if "max_tokens" in str(e) and "max_completion_tokens" in str(e):
                        self.logger.info(
                            f"Model {model_name} requires max_completion_tokens parameter"
                        )
                        await client.chat.completions.create(
                            model=model_name,
                            max_completion_tokens=20,
                            messages=[{"role": "user", "content": "test"}],
                        )
                    else:
                        raise
                self.logger.info(f"Using OpenAI API with model: {model_name}")
                if base_url:
                    self.logger.info(f"Using custom base URL: {base_url}")
                return client, "openai"
            except Exception as e:
                self.logger.warning(f"OpenAI API unavailable: {e}")
                return None

        # Map providers to their init functions
        provider_init_map = {
            "anthropic": init_anthropic,
            "google": init_google,
            "openai": init_openai,
        }

        # Try preferred provider first
        if preferred_provider and preferred_provider in provider_init_map:
            self.logger.info(f"🎯 Trying preferred provider: {preferred_provider}")
            result = await provider_init_map[preferred_provider]()
            if result:
                return result
            else:
                self.logger.warning(
                    f"⚠️ Preferred provider '{preferred_provider}' unavailable, trying alternatives..."
                )

        # Fallback: try providers in order
        for provider_name, init_func in provider_init_map.items():
            if provider_name == preferred_provider:
                continue  # Already tried
            result = await init_func()
            if result:
                return result

        raise ValueError(
            "No available LLM API - please check your API keys in configuration"
        )

    async def _call_llm_with_tools(
        self, client, client_type, system_message, messages, tools, max_tokens=8192
    ):
        """Call LLM with tools"""
        try:
            if client_type == "anthropic":
                return await self._call_anthropic_with_tools(
                    client, system_message, messages, tools, max_tokens
                )
            elif client_type == "openai":
                return await self._call_openai_with_tools(
                    client, system_message, messages, tools, max_tokens
                )
            elif client_type == "google":
                return await self._call_google_with_tools(
                    client, system_message, messages, tools, max_tokens
                )
            else:
                raise ValueError(f"Unsupported client type: {client_type}")
        except Exception as e:
            self.logger.error(f"LLM call failed: {e}")
            raise

    async def _call_anthropic_with_tools(
        self, client, system_message, messages, tools, max_tokens
    ):
        """Call the Anthropic Messages API with tools and report token usage.

        Args:
            client: Anthropic async client exposing ``messages.create``.
            system_message: System prompt for the request.
            messages: Conversation history; validated before sending. A single
                "continue" user message is substituted if nothing survives
                validation.
            tools: Tool definitions passed through unchanged.
            max_tokens: Output token budget.

        Returns:
            A dict with ``content`` (concatenated text blocks), ``tool_calls``
            (list of ``{"id", "name", "input"}`` dicts), ``token_usage``
            (empty dict when the response carries no usage) and ``cost``
            (``0.0`` when the response carries no usage).

        Raises:
            Exception: Any API error, logged and re-raised.
        """
        validated_messages = self._validate_messages(messages)
        if not validated_messages:
            validated_messages = [
                {"role": "user", "content": "Please continue implementing code"}
            ]

        try:
            # Use implementation-specific model for code generation
            impl_model = self.default_models.get(
                "anthropic_implementation", self.default_models["anthropic"]
            )
            self.logger.info(f"🔧 Code generation using model: {impl_model}")
            response = await client.messages.create(
                model=impl_model,
                system=system_message,
                messages=validated_messages,
                tools=tools,
                max_tokens=max_tokens,
                temperature=0.2,
            )
        except Exception as e:
            self.logger.error(f"Anthropic API call failed: {e}")
            raise

        # Split the response blocks into plain text and tool invocations
        content = ""
        tool_calls = []

        for block in response.content:
            if block.type == "text":
                content += block.text
            elif block.type == "tool_use":
                tool_calls.append(
                    {"id": block.id, "name": block.name, "input": block.input}
                )

        # Extract token usage and calculate cost
        token_usage = {}
        cost = 0.0

        if hasattr(response, "usage") and response.usage:
            usage = response.usage
            token_usage = {
                "input_tokens": usage.input_tokens,
                "output_tokens": usage.output_tokens,
                "total_tokens": usage.input_tokens + usage.output_tokens,
            }

            # Price the call with the model that actually served it. The
            # request above is sent with `impl_model`, which differs from
            # default_models["anthropic"] whenever an implementation-specific
            # model is configured.
            from utils.model_limits import calculate_token_cost

            cost = calculate_token_cost(
                usage.input_tokens,
                usage.output_tokens,
                model_name=impl_model,
            )

            print(f"💰 Tokens: {token_usage['total_tokens']} (${cost:.4f})")
            self.logger.info(
                f"Token usage: {token_usage['input_tokens']} input + {token_usage['output_tokens']} output = {token_usage['total_tokens']} total (${cost:.4f})"
            )

        return {
            "content": content,
            "tool_calls": tool_calls,
            "token_usage": token_usage,
            "cost": cost,
        }

    async def _call_google_with_tools(
        self, client, system_message, messages, tools, max_tokens
    ):
        """
        Call Google Gemini API with tools

        Note: Google Gemini uses a completely different API structure.
        The client here is expected to be google.genai.Client from google-genai SDK.

        Reference: https://ai.google.dev/gemini-api/docs/function-calling

        Args:
            client: ``google.genai.Client`` instance (its ``aio`` interface is used).
            system_message: System instruction; omitted from the config when falsy.
            messages: Conversation history; validated before conversion. A single
                "continue" user message is substituted if nothing survives
                validation.
            tools: Tool definitions with ``name``, ``description`` and
                ``input_schema`` keys.
            max_tokens: Output token budget.

        Returns:
            A dict with ``content`` (concatenated text parts of the first
            candidate) and ``tool_calls`` (list of ``{"id", "name", "input"}``
            dicts).

        Raises:
            ImportError: If the google-genai package is not installed.
            Exception: Any API error, logged and re-raised.
        """
        try:
            from google.genai import types
        except ImportError as import_error:
            raise ImportError(
                "google-genai package is required for Google API calls"
            ) from import_error

        validated_messages = self._validate_messages(messages)
        if not validated_messages:
            validated_messages = [
                {"role": "user", "content": "Please continue implementing code"}
            ]

        # Convert messages to Google Gemini format (types.Content)
        # Gemini expects: role="user" or role="model" (not "assistant")
        gemini_messages = []
        for msg in validated_messages:
            role = msg.get("role", "user")
            content = msg.get("content", "")

            # Convert role names: "assistant" -> "model"
            if role == "assistant":
                role = "model"
            elif role not in ["user", "model"]:
                # Any other role is sent as a user turn
                role = "user"

            gemini_messages.append(
                types.Content(role=role, parts=[types.Part.from_text(text=content)])
            )

        # Convert tools to Google Gemini format (types.Tool with FunctionDeclaration)
        # IMPORTANT: Each tool is wrapped in its own Tool object (not all in one)
        gemini_tools = []
        if tools:
            for tool in tools:
                # Transform the input_schema to be Gemini-compatible
                parameters = self._transform_schema_for_gemini(tool["input_schema"])

                gemini_tools.append(
                    types.Tool(
                        function_declarations=[
                            types.FunctionDeclaration(
                                name=tool["name"],
                                description=tool["description"],
                                parameters=parameters,
                            )
                        ]
                    )
                )

        # Create config with system instruction and tools
        config = types.GenerateContentConfig(
            max_output_tokens=max_tokens,
            temperature=0.2,
            system_instruction=system_message if system_message else None,
            tools=gemini_tools if gemini_tools else None,
            # Disable automatic function calling - we handle it manually
            automatic_function_calling=types.AutomaticFunctionCallingConfig(
                disable=True
            ),
        )

        try:
            # Google Gemini API call using the native SDK
            # client is google.genai.Client instance
            # Use implementation-specific model for code generation
            impl_model = self.default_models.get(
                "google_implementation", self.default_models["google"]
            )
            self.logger.info(f"🔧 Code generation using model: {impl_model}")
            response = await client.aio.models.generate_content(
                model=impl_model,
                contents=gemini_messages,
                config=config,
            )
        except Exception as e:
            self.logger.error(f"Google API call failed: {e}")
            raise

        # Parse Gemini response (types.GenerateContentResponse); only the
        # first candidate is inspected.
        content = ""
        tool_calls = []

        if response and hasattr(response, "candidates") and response.candidates:
            candidate = response.candidates[0]

            if hasattr(candidate, "content") and candidate.content:
                if hasattr(candidate.content, "parts") and candidate.content.parts:
                    for part in candidate.content.parts:
                        # Handle text content
                        if hasattr(part, "text") and part.text:
                            content += part.text

                        # Handle function calls
                        if hasattr(part, "function_call") and part.function_call:
                            fc = part.function_call
                            call_name = fc.name if hasattr(fc, "name") else ""
                            # Fall back to the function name when the id is
                            # missing OR present-but-empty/None; a plain
                            # getattr default only covers the missing case and
                            # would leave the id as None.
                            call_id = getattr(fc, "id", None) or getattr(
                                fc, "name", ""
                            )
                            tool_call = {
                                "id": call_id,
                                "name": call_name,
                                "input": dict(fc.args)
                                if hasattr(fc, "args") and fc.args
                                else {},
                            }
                            self.logger.debug(
                                f"Google function_call parsed: {tool_call}"
                            )
                            tool_calls.append(tool_call)

        return {"content": content, "tool_calls": tool_calls}

    def _transform_schema_for_gemini(self, schema: dict) -> dict:
        """
        Transform JSON Schema to OpenAPI Schema format compatible with Gemini.

        This is based on the transform_mcp_tool_schema from GoogleAugmentedLLM.
        Key transformations:
        1. Convert camelCase to snake_case
        2. Remove unsupported fields (default, additionalProperties)
        3. Handle nullable types via anyOf
        """
        if not isinstance(schema, dict):
            return schema

        # Fields to exclude
        EXCLUDED_PROPERTIES = {"default", "additionalProperties"}

        # camelCase to snake_case mappings
        CAMEL_TO_SNAKE = {
            "anyOf": "any_of",
            "maxLength": "max_length",
            "minLength": "min_length",
            "minProperties": "min_properties",
            "maxProperties": "max_properties",
            "maxItems": "max_items",
            "minItems": "min_items",
        }

        result = {}

        for key, value in schema.items():
            # Skip excluded properties
            if key in EXCLUDED_PROPERTIES:
                continue

            # Convert camelCase to snake_case
            snake_key = CAMEL_TO_SNAKE.get(key, key)

            # Handle nested structures
            if key == "properties" and isinstance(value, dict):
                result[snake_key] = {
                    prop_k: self._transform_schema_for_gemini(prop_v)
                    for prop_k, prop_v in value.items()
                }
            elif key == "items" and isinstance(value, dict):
                result[snake_key] = self._transform_schema_for_gemini(value)
            elif key == "anyOf" and isinstance(value, list):
                # Handle nullable types (Type | None)
                has_null = any(
                    isinstance(item, dict) and item.get("type") == "null"
                    for item in value
                )
                if has_null:
                    result["nullable"] = True

                # Get first non-null schema
                for item in value:
                    if isinstance(item, dict) and item.get("type") != "null":
                        transformed = self._transform_schema_for_gemini(item)
                        for k, v in transformed.items():
                            if k not in result:
                                result[k] = v
                        break
            else:
                result[snake_key] = value

        return result

    def _repair_truncated_json(self, json_str: str, tool_name: str = "") -> dict:
        """
        Advanced JSON repair for truncated or malformed JSON from LLM responses.

        Handles:
        - Missing closing braces/brackets
        - Truncated string values
        - Missing required fields
        - Trailing commas
        """
        import re

        # Step 1: Try basic fixes first
        fixed = json_str.strip()

        # Remove trailing commas
        fixed = re.sub(r",\s*}", "}", fixed)
        fixed = re.sub(r",\s*]", "]", fixed)

        try:
            return json.loads(fixed)
        except json.JSONDecodeError as e:
            print("   🔧 Attempting advanced JSON repair...")

            # Step 2: Check for truncation issues
            if e.msg == "Expecting value":
                # Likely truncated - try to close open structures
                fixed = self._close_json_structures(fixed)
                try:
                    return json.loads(fixed)
                except (json.JSONDecodeError, ValueError, TypeError):
                    pass

            # Step 3: Try to extract partial valid JSON
            if e.msg.startswith("Expecting") and e.pos:
                # Truncate at error position and try to close
                truncated = fixed[: e.pos]
                closed = self._close_json_structures(truncated)
                try:
                    partial = json.loads(closed)
                    print("   ✅ Extracted partial JSON successfully")
                    return partial
                except (json.JSONDecodeError, ValueError, TypeError):
                    pass

            # Step 4: Tool-specific defaults for critical tools
            if tool_name == "write_file":
                # For write_file, try to extract at least file_path
                file_path_match = re.search(r'"file_path"\s*:\s*"([^"]*)"', fixed)
                if file_path_match:
                    print("   ⚠️  write_file JSON truncated, using minimal structure")
                    return {
                        "file_path": file_path_match.group(1),
                        "content": "",  # Empty content is better than crashing
                    }

            # Step 5: Last resort - return error indicator
            print("   ❌ JSON repair failed completely")
            return None

    def _close_json_structures(self, json_str: str) -> str:
        """
        Intelligently close unclosed JSON structures.
        Counts braces and brackets to determine what needs closing.
        """
        # Count open structures
        open_braces = json_str.count("{") - json_str.count("}")
        open_brackets = json_str.count("[") - json_str.count("]")

        # Check if we're in the middle of a string
        quote_count = json_str.count('"')
        in_string = (quote_count % 2) != 0

        result = json_str

        # Close string if needed
        if in_string:
            result += '"'

        # Close brackets first (inner structures)
        result += "]" * open_brackets

        # Close braces
        result += "}" * open_braces

        return result

    async def _call_openai_with_tools(
        self, client, system_message, messages, tools, max_tokens
    ):
        """Call OpenAI API with robust JSON error handling and retry mechanism"""
        openai_tools = []
        for tool in tools:
            openai_tools.append(
                {
                    "type": "function",
                    "function": {
                        "name": tool["name"],
                        "description": tool["description"],
                        "parameters": tool["input_schema"],
                    },
                }
            )

        openai_messages = [{"role": "system", "content": system_message}]
        openai_messages.extend(messages)

        # Retry mechanism for API calls
        max_retries = 3
        retry_delay = 2  # seconds

        # Use implementation-specific model for code generation
        impl_model = self.default_models.get(
            "openai_implementation", self.default_models["openai"]
        )
        self.logger.info(f"🔧 Code generation using model: {impl_model}")

        for attempt in range(max_retries):
            try:
                # Try max_tokens first, fallback to max_completion_tokens if unsupported
                try:
                    response = await client.chat.completions.create(
                        model=impl_model,
                        messages=openai_messages,
                        tools=openai_tools if openai_tools else None,
                        max_tokens=max_tokens,
                        temperature=0.2,
                    )
                except Exception as e:
                    if "max_tokens" in str(e) and "max_completion_tokens" in str(e):
                        # Retry with max_completion_tokens for models that require it
                        response = await client.chat.completions.create(
                            model=impl_model,
                            messages=openai_messages,
                            tools=openai_tools if openai_tools else None,
                            max_completion_tokens=max_tokens,
                        )
                    else:
                        raise

                # Validate response structure
                if (
                    not response
                    or not hasattr(response, "choices")
                    or not response.choices
                ):
                    raise ValueError("Invalid API response: missing choices")

                if not response.choices[0] or not hasattr(
                    response.choices[0], "message"
                ):
                    raise ValueError("Invalid API response: missing message in choice")

                message = response.choices[0].message
                content = message.content or ""

                # Successfully got a valid response
                break

            except json.JSONDecodeError as e:
                print(
                    f"\n❌ JSON Decode Error in API response (attempt {attempt + 1}/{max_retries}):"
                )
                print(f"   Error: {e}")
                print(f"   Position: line {e.lineno}, column {e.colno}")

                if attempt < max_retries - 1:
                    print(f"   ⏳ Retrying in {retry_delay} seconds...")
                    await asyncio.sleep(retry_delay)
                    retry_delay *= 2  # Exponential backoff
                else:
                    print("   ❌ All retries exhausted")
                    raise

            except (ValueError, AttributeError, TypeError) as e:
                print(f"\n❌ API Response Error (attempt {attempt + 1}/{max_retries}):")
                print(f"   Error type: {type(e).__name__}")
                print(f"   Error: {e}")

                if attempt < max_retries - 1:
                    print(f"   ⏳ Retrying in {retry_delay} seconds...")
                    await asyncio.sleep(retry_delay)
                    retry_delay *= 2
                else:
                    print("   ❌ All retries exhausted")
                    # Return empty response instead of crashing
                    return {
                        "content": "API error - unable to get valid response",
                        "tool_calls": [],
                    }

            except Exception as e:
                print(
                    f"\n❌ Unexpected API Error (attempt {attempt + 1}/{max_retries}):"
                )
                print(f"   Error type: {type(e).__name__}")
                print(f"   Error: {e}")

                if attempt < max_retries - 1:
                    print(f"   ⏳ Retrying in {retry_delay} seconds...")
                    await asyncio.sleep(retry_delay)
                    retry_delay *= 2
                else:
                    print("   ❌ All retries exhausted")
                    raise

        tool_calls = []
        if message.tool_calls:
            for tool_call in message.tool_calls:
                try:
                    # Attempt to parse tool call arguments
                    parsed_input = json.loads(tool_call.function.arguments)
                    tool_calls.append(
                        {
                            "id": tool_call.id,
                            "name": tool_call.function.name,
                            "input": parsed_input,
                        }
                    )
                except json.JSONDecodeError as e:
                    # Detailed JSON parsing error logging
                    print("\n❌ JSON Parsing Error in tool call:")
                    print(f"   Tool: {tool_call.function.name}")
                    print(f"   Error: {e}")
                    print("   Raw arguments (first 500 chars):")
                    print(f"   {tool_call.function.arguments[:500]}")
                    print(f"   Error position: line {e.lineno}, column {e.colno}")
                    print(
                        f"   Problem at: ...{tool_call.function.arguments[max(0, e.pos-50):e.pos+50]}..."
                    )

                    # Attempt advanced JSON repair
                    repaired = self._repair_truncated_json(
                        tool_call.function.arguments, tool_call.function.name
                    )

                    if repaired:
                        print("   ✅ JSON repaired successfully")
                        tool_calls.append(
                            {
                                "id": tool_call.id,
                                "name": tool_call.function.name,
                                "input": repaired,
                            }
                        )
                    else:
                        # Skip this tool call if repair failed
                        print("   ⚠️  Skipping unrepairable tool call")
                        continue

        # Extract token usage and calculate cost
        token_usage = {}
        cost = 0.0
        
        if hasattr(response, 'usage') and response.usage:
            token_usage = {
                "prompt_tokens": response.usage.prompt_tokens,
                "completion_tokens": response.usage.completion_tokens,
                "total_tokens": response.usage.total_tokens
            }
            
            # Use dynamic cost calculation based on current model
            from utils.model_limits import calculate_token_cost
            cost = calculate_token_cost(
                response.usage.prompt_tokens,
                response.usage.completion_tokens,
                model_name=self.default_models.get("openai")
            )
            
            print(f"💰 Tokens: {token_usage['total_tokens']} (${cost:.4f})")
            self.logger.info(f"Token usage: {token_usage['prompt_tokens']} prompt + {token_usage['completion_tokens']} completion = {token_usage['total_tokens']} total (${cost:.4f})")

        return {
            "content": content, 
            "tool_calls": tool_calls,
            "token_usage": token_usage,
            "cost": cost
        }

    # ==================== 5. Tools and Utility Methods (Utility Layer) ====================

    def _validate_messages(self, messages: List[Dict]) -> List[Dict]:
        """Validate and clean message list"""
        valid_messages = []
        for msg in messages:
            content = msg.get("content", "").strip()
            if content:
                valid_messages.append(
                    {"role": msg.get("role", "user"), "content": content}
                )
            else:
                self.logger.warning(f"Skipping empty message: {msg}")
        return valid_messages

    def _prepare_mcp_tool_definitions(self) -> List[Dict[str, Any]]:
        """Return the subset of code-implementation tools exposed to the model.

        The full list comes from ``get_mcp_tools("code_implementation")``; only
        entries whose ``name`` is ``write_file`` or ``search_code_references``
        are kept. The number of kept tools and their names are logged.

        Returns:
            The filtered tool definitions, in the order they were provided.
        """
        # Only these tools are considered essential for code implementation.
        essential_tool_names = {"write_file", "search_code_references"}

        all_tools = get_mcp_tools("code_implementation")

        filtered_tools = []
        for tool in all_tools:
            if tool.get("name") in essential_tool_names:
                filtered_tools.append(tool)

        enabled_names = [tool.get("name") for tool in filtered_tools]
        self.logger.info(
            f"🔧 Tool filtering: {len(filtered_tools)}/{len(all_tools)} tools enabled"
        )
        self.logger.info(f"   Available tools: {enabled_names}")

        return filtered_tools

    def _check_tool_results_for_errors(self, tool_results: List[Dict]) -> bool:
        """Check tool results for errors with JSON repair capability"""
        for result in tool_results:
            try:
                if hasattr(result["result"], "content") and result["result"].content:
                    content_text = result["result"].content[0].text

                    # First attempt: try direct JSON parsing
                    try:
                        parsed_result = json.loads(content_text)
                        if parsed_result.get("status") == "error":
                            return True
                    except json.JSONDecodeError as e:
                        # JSON parsing failed - try to repair
                        print("\n⚠️  JSON parsing failed in tool result check:")
                        print(f"   Error: {e}")
                        print(
                            f"   Position: line {e.lineno}, column {e.colno}, char {e.pos}"
                        )
                        print(f"   Content length: {len(content_text)} chars")
                        print(f"   First 300 chars: {content_text[:300]}")

                        # Attempt to repair the JSON
                        repaired = self._repair_truncated_json(content_text)
                        if repaired:
                            print("   ✅ Tool result JSON repaired successfully")
                            if repaired.get("status") == "error":
                                return True
                        else:
                            # Fallback: check for "error" keyword in text
                            if "error" in content_text.lower():
                                return True

                elif isinstance(result["result"], str):
                    if "error" in result["result"].lower():
                        return True

            except (AttributeError, IndexError) as e:
                # Unexpected result structure
                print(f"\n⚠️  Unexpected result structure: {type(e).__name__}: {e}")
                result_str = str(result["result"])
                if "error" in result_str.lower():
                    return True
        return False

    # ==================== 6. User Interaction and Feedback (Interaction Layer) ====================

    def _generate_success_guidance(self, files_count: int) -> str:
        """Generate concise success guidance for continuing implementation"""
        return f"""✅ File implementation completed successfully!

📊 **Progress Status:** {files_count} files implemented

🎯 **Next Action:** Check if ALL files from the reproduction plan are implemented.

⚡ **Decision Process:**
1. **If ALL files are implemented:** Use `execute_python` or `execute_bash` to test the complete implementation, then respond "**implementation complete**" to end the conversation
2. **If MORE files need implementation:** Continue with dependency-aware workflow:
   - **Start with `read_code_mem`** to understand existing implementations and dependencies
   - **Optionally use `search_code_references`** for reference patterns (OPTIONAL - use for inspiration only, original paper specs take priority)
   - **Then `write_file`** to implement the new component
   - **Finally: Test** if needed

💡 **Key Point:** Always verify completion status before continuing with new file creation."""

    def _generate_error_guidance(self) -> str:
        """Generate error guidance for handling issues"""
        return """❌ Error detected during file implementation.

🔧 **Action Required:**
1. Review the error details above
2. Fix the identified issue
3. **Check if ALL files from the reproduction plan are implemented:**
   - **If YES:** Use `execute_python` or `execute_bash` to test the complete implementation, then respond "**implementation complete**" to end the conversation
   - **If NO:** Continue with proper development cycle for next file:
     - **Start with `read_code_mem`** to understand existing implementations
     - **Optionally use `search_code_references`** for reference patterns (OPTIONAL - for inspiration only)
     - **Then `write_file`** to implement properly
     - **Test** if needed
4. Ensure proper error handling in future implementations

💡 **Remember:** Always verify if all planned files are implemented before continuing with new file creation."""

    def _generate_no_tools_guidance(self, files_count: int) -> str:
        """Generate concise guidance when no tools are called"""
        return f"""⚠️ No tool calls detected in your response.

📊 **Current Progress:** {files_count} files implemented

🚨 **Action Required:** You must use tools. **FIRST check if ALL files from the reproduction plan are implemented:**

⚡ **Decision Process:**
1. **If ALL files are implemented:** Use `execute_python` or `execute_bash` to test the complete implementation, then respond "**implementation complete**" to end the conversation
2. **If MORE files need implementation:** Follow the development cycle:
   - **Start with `read_code_mem`** to understand existing implementations
   - **Optionally use `search_code_references`** for reference patterns (OPTIONAL - for inspiration only)
   - **Then `write_file`** to implement the new component
   - **Finally: Test** if needed

🚨 **Critical:** Always verify completion status first, then use appropriate tools - not just explanations!"""

    def _compile_user_response(self, tool_results: List[Dict], guidance: str) -> str:
        """Compile tool results and guidance into a single user response"""
        response_parts = []

        if tool_results:
            response_parts.append("🔧 **Tool Execution Results:**")
            for tool_result in tool_results:
                tool_name = tool_result["tool_name"]
                result_content = tool_result["result"]
                response_parts.append(
                    f"```\nTool: {tool_name}\nResult: {result_content}\n```"
                )

        if guidance:
            response_parts.append("\n" + guidance)

        return "\n\n".join(response_parts)

    # ==================== 7. Reporting and Output (Output Layer) ====================

    async def _generate_pure_code_final_report_with_concise_agents(
        self,
        iterations: int,
        elapsed_time: float,
        code_agent: CodeImplementationAgent,
        memory_agent: ConciseMemoryAgent,
    ):
        """Generate final report using concise agent statistics"""
        try:
            code_stats = code_agent.get_implementation_statistics()
            memory_stats = memory_agent.get_memory_statistics(
                code_stats["files_implemented_count"]
            )

            if self.mcp_agent:
                history_result = await self.mcp_agent.call_tool(
                    "get_operation_history", {"last_n": 30}
                )
                history_data = (
                    json.loads(history_result)
                    if isinstance(history_result, str)
                    else history_result
                )
            else:
                history_data = {"total_operations": 0, "history": []}

            write_operations = 0
            files_created = []
            if "history" in history_data:
                for item in history_data["history"]:
                    if item.get("action") == "write_file":
                        write_operations += 1
                        file_path = item.get("details", {}).get("file_path", "unknown")
                        files_created.append(file_path)

            report = f"""
# Pure Code Implementation Completion Report (Write-File-Based Memory Mode)

## Execution Summary
- Implementation iterations: {iterations}
- Total elapsed time: {elapsed_time:.2f} seconds
- Files implemented: {code_stats['total_files_implemented']}
- File write operations: {write_operations}
- Total MCP operations: {history_data.get('total_operations', 0)}

## Read Tools Configuration
- Read tools enabled: {code_stats['read_tools_status']['read_tools_enabled']}
- Status: {code_stats['read_tools_status']['status']}
- Tools affected: {', '.join(code_stats['read_tools_status']['tools_affected'])}

## Agent Performance
### Code Implementation Agent
- Files tracked: {code_stats['files_implemented_count']}
- Technical decisions: {code_stats['technical_decisions_count']}
- Constraints tracked: {code_stats['constraints_count']}
- Architecture notes: {code_stats['architecture_notes_count']}
- Dependency analysis performed: {code_stats['dependency_analysis_count']}
- Files read for dependencies: {code_stats['files_read_for_dependencies']}
- Last summary triggered at file count: {code_stats['last_summary_file_count']}

### Concise Memory Agent (Write-File-Based)
- Last write_file detected: {memory_stats['last_write_file_detected']}
- Should clear memory next: {memory_stats['should_clear_memory_next']}
- Files implemented count: {memory_stats['implemented_files_tracked']}
- Current round: {memory_stats['current_round']}
- Concise mode active: {memory_stats['concise_mode_active']}
- Current round tool results: {memory_stats['current_round_tool_results']}
- Essential tools recorded: {memory_stats['essential_tools_recorded']}

## Files Created
"""
            for file_path in files_created[-20:]:
                report += f"- {file_path}\n"

            if len(files_created) > 20:
                report += f"... and {len(files_created) - 20} more files\n"

            report += """
## Architecture Features
✅ WRITE-FILE-BASED Memory Agent - Clear after each file generation
✅ After write_file: Clear history → Keep system prompt + initial plan + tool results
✅ Tool accumulation: read_code_mem, read_file, search_reference_code until next write_file
✅ Clean memory cycle: write_file → clear → accumulate → write_file → clear
✅ Essential tool recording with write_file detection
✅ Specialized agent separation for clean code organization
✅ MCP-compliant tool execution
✅ Production-grade code with comprehensive type hints
✅ Intelligent dependency analysis and file reading
✅ Automated read_file usage for implementation context
✅ Eliminates conversation clutter between file generations
✅ Focused memory for efficient next file generation
"""
            return report

        except Exception as e:
            self.logger.error(f"Failed to generate final report: {e}")
            return f"Failed to generate final report: {str(e)}"


async def main(
    plan_file: str = "/data2/bjdwhzzh/project-hku/Deepcode_collections/DeepCode/deepcode_lab/papers/54_only_code_gen/initial_plan.txt",
    target_directory: str = "/data2/bjdwhzzh/project-hku/Deepcode_collections/DeepCode/deepcode_lab/papers/54_only_code_gen/",
):
    """Run the implementation workflow once and print a summary of the result.

    The function configures the root logger (only if it has no handlers yet),
    prints the informational banners, and runs
    ``CodeImplementationWorkflowWithIndex.run_workflow`` in pure-code mode with
    read tools enabled. The mode menus are printed for information only: no
    input is read, and the mode is fixed in code.

    Args:
        plan_file: Path to the ``initial_plan.txt`` handed to the workflow.
            The default is the developer-specific location that used to be
            hard-coded here; pass another path to run against a different plan.
        target_directory: Directory passed to the workflow as its target.
            Defaults to the previously hard-coded location.
    """
    # Configure root logger carefully to avoid duplicates
    root_logger = logging.getLogger()
    if not root_logger.handlers:
        handler = logging.StreamHandler()
        formatter = logging.Formatter("%(levelname)s:%(name)s:%(message)s")
        handler.setFormatter(formatter)
        root_logger.addHandler(handler)
        root_logger.setLevel(logging.INFO)

    workflow = CodeImplementationWorkflowWithIndex()

    print("=" * 60)
    print("Code Implementation Workflow with UNIFIED Reference Indexer")
    print("=" * 60)
    print("Select mode:")
    print("1. Test Code Reference Indexer Integration")
    print("2. Run Full Implementation Workflow")
    print("3. Run Implementation with Pure Code Mode")
    print("4. Test Read Tools Configuration")

    # NOTE: no integration test is executed here. The banner below is kept so
    # the console output stays the same; the former failure branch could never
    # run because its flag was a constant True, so it has been removed.
    print("\n" + "=" * 60)
    print("🎉 UNIFIED Code Reference Indexer Integration Test PASSED!")
    print("🔧 Three-step process successfully merged into ONE tool")
    print("=" * 60)

    print("\nContinuing with workflow execution...")

    print("Implementation Mode Selection:")
    print("1. Pure Code Implementation Mode (Recommended)")
    print("2. Iterative Implementation Mode")

    pure_code_mode = True
    mode_name = "Pure Code Implementation Mode with Memory Agent Architecture + Code Reference Indexer"
    print(f"Using: {mode_name}")

    # Configure read tools - set to False to disable read_file and read_code_mem
    enable_read_tools = True
    read_tools_status = "ENABLED" if enable_read_tools else "DISABLED"
    print(f"🔧 Read tools (read_file, read_code_mem): {read_tools_status}")

    result = await workflow.run_workflow(
        plan_file,
        target_directory=target_directory,
        pure_code_mode=pure_code_mode,
        enable_read_tools=enable_read_tools,
    )

    print("=" * 60)
    print("Workflow Execution Results:")
    print(f"Status: {result['status']}")
    print(f"Mode: {mode_name}")

    if result["status"] == "success":
        print(f"Code Directory: {result['code_directory']}")
        print(f"MCP Architecture: {result.get('mcp_architecture', 'unknown')}")
        print("Execution completed!")
    else:
        print(f"Error Message: {result['message']}")

    print("=" * 60)
    print(
        "✅ Using Standard MCP Architecture with Memory Agent + Code Reference Indexer"
    )


# Script entry point: when this module is executed directly (rather than
# imported), run the async main() to completion via asyncio.run().
if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: workflows/codebase_index_workflow.py
================================================
"""
Codebase Index Workflow

This workflow integrates the functionality of run_indexer.py and code_indexer.py
to build intelligent relationships between existing codebase and target structure.

Features:
- Extract target file structure from initial_plan.txt
- Analyze codebase and build indexes
- Generate relationship mappings and statistical reports
- Provide reference basis for code reproduction
"""

import asyncio
import json
import logging
import os
import re
import sys
from pathlib import Path
from typing import Dict, Any, Optional
import yaml

# Add tools directory to path
sys.path.append(str(Path(__file__).parent.parent / "tools"))

from tools.code_indexer import CodeIndexer


class CodebaseIndexWorkflow:
    """Codebase Index Workflow Class"""

    def __init__(self, logger=None):
        """
        Initialize workflow

        Args:
            logger: Logger instance
        """
        self.logger = logger or self._setup_default_logger()
        self.indexer = None

    def _setup_default_logger(self) -> logging.Logger:
        """Setup default logger"""
        logger = logging.getLogger("CodebaseIndexWorkflow")
        logger.setLevel(logging.INFO)

        if not logger.handlers:
            handler = logging.StreamHandler()
            formatter = logging.Formatter(
                "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
            )
            handler.setFormatter(formatter)
            logger.addHandler(handler)

        return logger

    def extract_file_tree_from_plan(self, plan_content: str) -> Optional[str]:
        """
        Extract file tree structure from initial_plan.txt content

        Three strategies are tried in order, and the first one that yields
        enough lines wins:

        1. The fenced code block directly under a "## File Structure" heading,
           filtered down to tree-looking lines (at least 5 required).
        2. Any fenced code block that looks like a project tree (at least 5
           non-empty lines required).
        3. A tree synthesized from file paths mentioned in backticks anywhere
           in the plan (at least 3 lines including the root line required).
           Each file is listed once even if it is mentioned several times, and
           root-level files are drawn after the directories.

        Args:
            plan_content: Content of the initial_plan.txt file

        Returns:
            Extracted file tree structure as string, or None when no strategy
            produced a usable tree
        """
        tree_markers = ("├──", "└──", "│")

        # Strategy 1: look for the "## File Structure" section.
        match = re.search(
            r"## File Structure[^\n]*\n```[^\n]*\n(.*?)\n```", plan_content, re.DOTALL
        )
        if match:
            cleaned_lines = [
                line
                for line in match.group(1).strip().split("\n")
                # Keep tree-drawing lines, directory lines ("name/") and lines
                # whose last path segment contains a dot (looks like a file).
                if line.strip()
                and (
                    any(marker in line for marker in tree_markers)
                    or line.strip().endswith("/")
                    or "." in line.split("/")[-1]
                )
            ]

            if len(cleaned_lines) >= 5:
                self.logger.info(
                    f"📊 Extracted file tree structure from ## File Structure section ({len(cleaned_lines)} lines)"
                )
                return "\n".join(cleaned_lines)

        # Strategy 2: any code block containing a project structure.
        code_block_patterns = [
            r"```[^\n]*\n(project/.*?(?:├──|└──).*?)\n```",
            r"```[^\n]*\n(src/.*?(?:├──|└──).*?)\n```",
            r"```[^\n]*\n(core/.*?(?:├──|└──).*?)\n```",
            r"```[^\n]*\n(.*?(?:├──|└──).*?(?:\.py|\.txt|\.md|\.yaml).*?)\n```",
        ]

        for pattern in code_block_patterns:
            match = re.search(pattern, plan_content, re.DOTALL)
            if match:
                file_tree = match.group(1).strip()
                lines = [line for line in file_tree.split("\n") if line.strip()]
                if len(lines) >= 5:
                    self.logger.info(
                        f"📊 Extracted file tree structure from code block ({len(lines)} lines)"
                    )
                    return file_tree

        # Strategy 3: build a basic structure from file paths in backticks.
        self.logger.warning(
            "⚠️ No standard file tree found, trying to extract from file mentions..."
        )

        file_mentions = re.findall(
            r"`([^`]*(?:\.py|\.txt|\.md|\.yaml|\.yml)[^`]*)`", plan_content
        )

        if file_mentions:
            # Root-level files live in their own list so that they cannot
            # collide with a real directory that happens to be named "root".
            files_by_dir = {}
            root_files = []

            for mention in file_mentions:
                dir_path, separator, filename = mention.strip().rpartition("/")
                bucket = files_by_dir.setdefault(dir_path, []) if separator else root_files
                # A plan usually mentions the same file many times; list it once.
                if filename not in bucket:
                    bucket.append(filename)

            # Determine root directory name from common patterns
            if any("src/" in f for f in file_mentions):
                root_name = "src"
            elif any("core/" in f for f in file_mentions):
                root_name = "core"
            elif any("lib/" in f for f in file_mentions):
                root_name = "lib"
            else:
                root_name = "project"
            structure_lines = [f"{root_name}/"]

            sorted_dirs = sorted(files_by_dir)
            sorted_root_files = sorted(root_files)

            for i, dir_path in enumerate(sorted_dirs):
                # A directory is the final top-level entry only when no
                # root-level files are drawn after it.
                is_last_entry = i == len(sorted_dirs) - 1 and not sorted_root_files
                branch = "└──" if is_last_entry else "├──"
                indent = "    " if is_last_entry else "│   "
                structure_lines.append(f"{branch} {dir_path}/")

                files = sorted(files_by_dir[dir_path])
                for j, filename in enumerate(files):
                    leaf = "└──" if j == len(files) - 1 else "├──"
                    structure_lines.append(f"{indent}{leaf} {filename}")

            # Root files come last, so the final one always closes the tree.
            for i, filename in enumerate(sorted_root_files):
                branch = "└──" if i == len(sorted_root_files) - 1 else "├──"
                structure_lines.append(f"{branch} {filename}")

            if len(structure_lines) >= 3:
                self.logger.info(
                    f"📊 Generated file tree from file mentions ({len(structure_lines)} lines)"
                )
                return "\n".join(structure_lines)

        # If no file tree found, return None
        self.logger.warning("⚠️ No file tree structure found in initial plan")
        return None

    def load_target_structure_from_plan(self, plan_path: str) -> str:
        """
        Load target structure from initial_plan.txt and extract file tree

        The plan is read as UTF-8 and passed to
        ``extract_file_tree_from_plan``. The first 8 lines of the extracted
        tree are logged as a preview. If the file cannot be read, extraction
        raises, or no tree is found, the result of
        ``get_default_target_structure()`` is returned instead (best-effort
        behavior; the problem is logged, not raised).

        Args:
            plan_path: Path to initial_plan.txt file

        Returns:
            Extracted file tree structure, or the default target structure
        """
        preview_limit = 8

        try:
            # Load complete plan content
            with open(plan_path, "r", encoding="utf-8") as f:
                plan_content = f.read()

            self.logger.info(f"📄 Loaded initial plan ({len(plan_content)} characters)")

            # Extract file tree structure
            file_tree = self.extract_file_tree_from_plan(plan_content)

            if not file_tree:
                self.logger.warning("⚠️ Unable to extract file tree from initial plan")
                self.logger.info("🔄 Falling back to default target structure")
                return self.get_default_target_structure()

            self.logger.info("✅ Successfully extracted file tree from initial plan")
            self.logger.info("📋 Extracted structure preview:")

            # Split once and reuse. The remaining-line count is computed outside
            # the f-string because a backslash inside an f-string expression is
            # a SyntaxError on Python versions before 3.12.
            tree_lines = file_tree.split("\n")
            for line in tree_lines[:preview_limit]:
                self.logger.info(f"   {line}")
            remaining = len(tree_lines) - preview_limit
            if remaining > 0:
                self.logger.info(f"   ... {remaining} more lines")
            return file_tree

        except Exception as e:
            self.logger.error(f"❌ Failed to load initial plan file {plan_path}: {e}")
            self.logger.info("🔄 Falling back to default target structure")
            return self.get_default_target_structure()

    def get_default_target_structure(self) -> str:
        """Return the built-in fallback project tree.

        The text is a fixed example layout (source, tests, docs, experiments)
        with inline ``#`` annotations. It begins and ends with a newline.
        """
        tree_lines = (
            "project/",
            "├── src/",
            "│   ├── core/",
            "│   │   ├── gcn.py        # GCN encoder",
            "│   │   ├── diffusion.py  # forward/reverse processes",
            "│   │   ├── denoiser.py   # denoising MLP",
            "│   │   └── fusion.py     # fusion combiner",
            "│   ├── models/           # model wrapper classes",
            "│   │   └── recdiff.py",
            "│   ├── utils/",
            "│   │   ├── data.py       # loading & preprocessing",
            "│   │   ├── predictor.py  # scoring functions",
            "│   │   ├── loss.py       # loss functions",
            "│   │   ├── metrics.py    # NDCG, Recall etc.",
            "│   │   └── sched.py      # beta/alpha schedule utils",
            "│   └── configs/",
            "│       └── default.yaml  # hyperparameters, paths",
            "├── tests/",
            "│   ├── test_gcn.py",
            "│   ├── test_diffusion.py",
            "│   ├── test_denoiser.py",
            "│   ├── test_loss.py",
            "│   └── test_pipeline.py",
            "├── docs/",
            "│   ├── architecture.md",
            "│   ├── api_reference.md",
            "│   └── README.md",
            "├── experiments/",
            "│   ├── run_experiment.py",
            "│   └── notebooks/",
            "│       └── analysis.ipynb",
            "├── requirements.txt",
            "└── setup.py",
        )
        # The empty first and last items yield the leading and trailing newline.
        return "\n".join(("", *tree_lines, ""))

    def load_or_create_indexer_config(self, paper_dir: str) -> Dict[str, Any]:
        """
        Build the indexer configuration for one paper directory

        ``tools/indexer_config.yaml`` (resolved relative to this module's
        parent package) is used when it exists and loads cleanly: its paths
        are redirected into ``paper_dir`` and a few workflow-specific settings
        are forced. In every other case a built-in default configuration is
        returned instead.

        Args:
            paper_dir: Paper directory path

        Returns:
            Configuration dictionary
        """
        yaml_file = Path(__file__).parent.parent / "tools" / "indexer_config.yaml"

        # Settings forced for workflow runs, applied only to sections that the
        # loaded file actually defines: (section, key, value)
        workflow_overrides = (
            # Disable concurrency to avoid API limits
            ("performance", "enable_concurrent_analysis", False),
            # Enable verbose output
            ("debug", "verbose_output", True),
            # Increase request delay
            ("llm", "request_delay", 0.5),
        )

        try:
            if yaml_file.exists():
                with open(yaml_file, "r", encoding="utf-8") as handle:
                    loaded = yaml.safe_load(handle)

                # Redirect input/output paths to the current paper directory
                if "paths" not in loaded:
                    loaded["paths"] = {}
                path_section = loaded["paths"]
                path_section["code_base_path"] = os.path.join(paper_dir, "code_base")
                path_section["output_dir"] = os.path.join(paper_dir, "indexes")

                for section, key, value in workflow_overrides:
                    if section in loaded:
                        loaded[section][key] = value

                self.logger.info(f"Loaded configuration file: {yaml_file}")
                return loaded

        except Exception as e:
            # Any failure while reading or adjusting the file falls through to
            # the built-in defaults below.
            self.logger.warning(f"Failed to load configuration file: {e}")

        self.logger.info("Using default configuration")

        path_defaults = {
            "code_base_path": os.path.join(paper_dir, "code_base"),
            "output_dir": os.path.join(paper_dir, "indexes"),
        }
        llm_defaults = {
            "model_provider": "anthropic",
            "max_tokens": 4000,
            "temperature": 0.3,
            "request_delay": 0.5,
            "max_retries": 3,
            "retry_delay": 1.0,
        }
        file_analysis_defaults = {
            "max_file_size": 1048576,  # 1MB
            "max_content_length": 3000,
            "supported_extensions": [
                ".py", ".js", ".ts", ".java", ".cpp", ".c", ".h", ".hpp",
                ".cs", ".php", ".rb", ".go", ".rs", ".scala", ".kt",
                ".yaml", ".yml", ".json", ".xml", ".toml", ".md", ".txt",
            ],
            "skip_directories": [
                "__pycache__", "node_modules", "target", "build", "dist",
                "venv", "env", ".git", ".svn", "data", "datasets",
            ],
        }
        relationship_defaults = {
            "min_confidence_score": 0.3,
            "high_confidence_threshold": 0.7,
            "relationship_types": {
                "direct_match": 1.0,
                "partial_match": 0.8,
                "reference": 0.6,
                "utility": 0.4,
            },
        }
        performance_defaults = {
            # Concurrency stays off to avoid API limits
            "enable_concurrent_analysis": False,
            "max_concurrent_files": 3,
            "enable_content_caching": True,
            "max_cache_size": 100,
        }
        debug_defaults = {
            "verbose_output": True,
            "save_raw_responses": False,
            "mock_llm_responses": False,
        }
        output_defaults = {
            "generate_summary": True,
            "generate_statistics": True,
            "include_metadata": True,
            "json_indent": 2,
        }

        return {
            "paths": path_defaults,
            "llm": llm_defaults,
            "file_analysis": file_analysis_defaults,
            "relationships": relationship_defaults,
            "performance": performance_defaults,
            "debug": debug_defaults,
            "output": output_defaults,
            "logging": {"level": "INFO", "log_to_file": False},
        }

    async def run_indexing_workflow(
        self,
        paper_dir: str,
        initial_plan_path: Optional[str] = None,
        config_path: str = "mcp_agent.secrets.yaml",
    ) -> Dict[str, Any]:
        """
        Run the complete code indexing workflow

        Resolves the target structure (from the initial plan when the file
        exists, otherwise the default structure), creates a ``CodeIndexer``
        for ``<paper_dir>/code_base``, applies the indexer configuration,
        builds all indexes into ``<paper_dir>/indexes`` and reports the result.

        Args:
            paper_dir: Paper directory path
            initial_plan_path: Initial plan file path (optional); defaults to
                ``<paper_dir>/initial_plan.txt``
            config_path: API configuration file path

        Returns:
            Index result dictionary. ``status`` is ``"success"``,
            ``"warning"`` (no index files were generated) or ``"error"``
            (missing codebase directory or any exception, which is logged and
            never propagated). ``output_files`` is always present; a success
            result also carries ``summary_report`` and ``statistics`` (``None``
            when statistics are disabled on the indexer).
        """
        try:
            self.logger.info("🚀 Starting codebase index workflow...")

            # Step 1: Determine initial plan file path
            if not initial_plan_path:
                initial_plan_path = os.path.join(paper_dir, "initial_plan.txt")

            # Step 2: Load target structure
            if os.path.exists(initial_plan_path):
                self.logger.info(
                    f"📐 Loading target structure from {initial_plan_path}"
                )
                target_structure = self.load_target_structure_from_plan(
                    initial_plan_path
                )
            else:
                self.logger.warning(
                    f"⚠️ Initial plan file does not exist: {initial_plan_path}"
                )
                self.logger.info("📐 Using default target structure")
                target_structure = self.get_default_target_structure()

            # Step 3: Check codebase path
            code_base_path = os.path.join(paper_dir, "code_base")
            if not os.path.exists(code_base_path):
                self.logger.error(f"❌ Codebase path does not exist: {code_base_path}")
                return {
                    "status": "error",
                    "message": f"Code base path does not exist: {code_base_path}",
                    "output_files": {},
                }

            # Step 4: Create output directory
            output_dir = os.path.join(paper_dir, "indexes")
            os.makedirs(output_dir, exist_ok=True)

            # Step 5: Load configuration
            indexer_config = self.load_or_create_indexer_config(paper_dir)

            self.logger.info(f"📁 Codebase path: {code_base_path}")
            self.logger.info(f"📤 Output directory: {output_dir}")

            # Step 6: Create code indexer and apply configuration settings
            self.indexer = CodeIndexer(
                code_base_path=code_base_path,
                target_structure=target_structure,
                output_dir=output_dir,
                config_path=config_path,
                enable_pre_filtering=True,
            )
            self.indexer.indexer_config = indexer_config
            self._apply_indexer_overrides(indexer_config)

            self.logger.info("🔧 Indexer configuration completed")
            self.logger.info(f"🤖 Model provider: {self.indexer.model_provider}")
            self.logger.info(
                f"⚡ Concurrent analysis: {'Enabled' if self.indexer.enable_concurrent_analysis else 'Disabled'}"
            )
            self.logger.info(
                f"🗄️ Content caching: {'Enabled' if self.indexer.enable_content_caching else 'Disabled'}"
            )
            self.logger.info(
                f"🔍 Pre-filtering: {'Enabled' if self.indexer.enable_pre_filtering else 'Disabled'}"
            )

            self.logger.info("=" * 60)
            self.logger.info("🚀 Starting code indexing process...")

            # Step 7: Build all indexes
            output_files = await self.indexer.build_all_indexes()

            if not output_files:
                self.logger.warning("⚠️ No index files generated")
                return {
                    "status": "warning",
                    "message": "No index files were generated",
                    "output_files": {},
                }

            # Step 8: Generate summary report
            summary_report = self.indexer.generate_summary_report(output_files)

            self.logger.info("=" * 60)
            self.logger.info("✅ Indexing completed successfully!")
            self.logger.info(f"📊 Processed {len(output_files)} repositories")
            self.logger.info("📁 Generated index files:")
            for repo_name, file_path in output_files.items():
                self.logger.info(f"   📄 {repo_name}: {file_path}")
            self.logger.info(f"📋 Summary report: {summary_report}")

            # Statistics (if enabled)
            statistics = None
            if self.indexer.generate_statistics:
                statistics = self._log_relationship_statistics(output_files)

            self.logger.info("\n🎉 Code indexing process completed successfully!")

            return {
                "status": "success",
                "message": f"Successfully indexed {len(output_files)} repositories",
                "output_files": output_files,
                "summary_report": summary_report,
                "statistics": statistics,
            }

        except Exception as e:
            self.logger.error(f"❌ Index workflow failed: {e}")
            # If there are detailed error messages, log them
            import traceback

            self.logger.error(f"Detailed error information: {traceback.format_exc()}")
            return {"status": "error", "message": str(e), "output_files": {}}

    def _apply_indexer_overrides(self, indexer_config: Dict[str, Any]) -> None:
        """Copy the recognised settings of ``indexer_config`` onto ``self.indexer``.

        Only sections present in ``indexer_config`` are applied. Within such a
        section a missing key keeps the indexer's current attribute value.
        """
        # section name -> ((config key, indexer attribute), ...)
        attribute_map = {
            "file_analysis": (
                ("supported_extensions", "supported_extensions"),
                ("skip_directories", "skip_directories"),
                ("max_file_size", "max_file_size"),
                ("max_content_length", "max_content_length"),
            ),
            "llm": (
                ("model_provider", "model_provider"),
                ("max_tokens", "llm_max_tokens"),
                ("temperature", "llm_temperature"),
                ("request_delay", "request_delay"),
                ("max_retries", "max_retries"),
                ("retry_delay", "retry_delay"),
            ),
            "relationships": (
                ("min_confidence_score", "min_confidence_score"),
                ("high_confidence_threshold", "high_confidence_threshold"),
                ("relationship_types", "relationship_types"),
            ),
            "performance": (
                ("enable_concurrent_analysis", "enable_concurrent_analysis"),
                ("max_concurrent_files", "max_concurrent_files"),
                ("enable_content_caching", "enable_content_caching"),
                ("max_cache_size", "max_cache_size"),
            ),
            "debug": (
                ("verbose_output", "verbose_output"),
                ("save_raw_responses", "save_raw_responses"),
                ("mock_llm_responses", "mock_llm_responses"),
            ),
            "output": (
                ("generate_summary", "generate_summary"),
                ("generate_statistics", "generate_statistics"),
                ("include_metadata", "include_metadata"),
            ),
        }
        # These two are stored on the indexer as sets, whatever the config holds.
        set_valued = {"supported_extensions", "skip_directories"}

        for section_name, pairs in attribute_map.items():
            if section_name not in indexer_config:
                continue
            # A section written without children in YAML loads as None; treat
            # it as "no overrides" instead of failing on ``None.get``.
            section = indexer_config[section_name] or {}
            for key, attribute in pairs:
                value = section.get(key, getattr(self.indexer, attribute))
                if attribute in set_valued:
                    value = set(value)
                setattr(self.indexer, attribute, value)

    def _log_relationship_statistics(
        self, output_files: Dict[str, Any]
    ) -> Dict[str, int]:
        """Log relationship counts read back from the index files and return them.

        A file that cannot be read or parsed is reported with a warning and
        otherwise skipped.
        """
        self.logger.info("\n📈 Processing statistics:")
        total_relationships = 0
        high_confidence_relationships = 0

        for file_path in output_files.values():
            try:
                with open(file_path, "r", encoding="utf-8") as f:
                    index_data = json.load(f)
                relationships = index_data.get("relationships", [])
                total_relationships += len(relationships)
                high_confidence_relationships += sum(
                    1
                    for r in relationships
                    if r.get("confidence_score", 0)
                    > self.indexer.high_confidence_threshold
                )
            except Exception as e:
                self.logger.warning(
                    f"   ⚠️ Unable to load statistics from {file_path}: {e}"
                )

        average = total_relationships / len(output_files) if output_files else 0
        self.logger.info(f"   🔗 Total relationships found: {total_relationships}")
        self.logger.info(
            f"   ⭐ High confidence relationships: {high_confidence_relationships}"
        )
        self.logger.info(
            f"   📊 Average relationships per repository: {average:.1f}"
        )

        return {
            "total_repositories": len(output_files),
            "total_relationships": total_relationships,
            "high_confidence_relationships": high_confidence_relationships,
        }

    def print_banner(self):
        """Print application banner"""
        banner = """
╔═══════════════════════════════════════════════════════════════════════╗
║                    🔍 Codebase Index Workflow v1.0                   ║
║              Intelligent Code Relationship Analysis Tool              ║
╠═══════════════════════════════════════════════════════════════════════╣
║  📁 Analyzes existing codebases                                      ║
║  🔗 Builds intelligent relationships with target structure           ║
║  🤖 Powered by LLM analysis                                          ║
║  📊 Generates detailed JSON indexes                                   ║
║  🎯 Provides reference for code reproduction                          ║
╚═══════════════════════════════════════════════════════════════════════╝
        """
        print(banner)


# Convenience function for direct workflow invocation
async def run_codebase_indexing(
    paper_dir: str,
    initial_plan_path: Optional[str] = None,
    config_path: str = "mcp_agent.secrets.yaml",
    logger=None,
) -> Dict[str, Any]:
    """
    One-call entry point for codebase indexing

    Creates a ``CodebaseIndexWorkflow``, prints its banner and runs the
    indexing workflow with the given arguments.

    Args:
        paper_dir: Paper directory path
        initial_plan_path: Initial plan file path (optional)
        config_path: API configuration file path
        logger: Logger instance (optional)

    Returns:
        Index result dictionary
    """
    indexing_workflow = CodebaseIndexWorkflow(logger=logger)
    indexing_workflow.print_banner()

    run_arguments = {
        "paper_dir": paper_dir,
        "initial_plan_path": initial_plan_path,
        "config_path": config_path,
    }
    outcome = await indexing_workflow.run_indexing_workflow(**run_arguments)
    return outcome


# Main function for testing
async def main():
    """Manual smoke run of the indexing workflow against a sample paper directory"""
    import logging

    # Route INFO-level records to the console for this test run
    logging.basicConfig(level=logging.INFO)
    log = logging.getLogger(__name__)

    # Sample inputs used for the test run
    sample_paper_dir = "./deepcode_lab/papers/1"
    sample_plan_path = os.path.join(sample_paper_dir, "initial_plan.txt")

    outcome = await run_codebase_indexing(
        paper_dir=sample_paper_dir,
        initial_plan_path=sample_plan_path,
        logger=log,
    )

    log.info(f"Index result: {outcome}")


# Script entry point: run the test workflow only when this file is executed
# directly, not when it is imported.
if __name__ == "__main__":
    asyncio.run(main())


================================================
FILE: workflows/plugins/USAGE.md
================================================
# User-in-Loop 插件系统使用指南

## 概述

这是一个插件式的用户交互系统，可以像中间件一样无侵入地插入到工作流中。

## 核心概念

```
工作流执行:  [Phase 1] ──▶ [Hook Point] ──▶ [Phase 2] ──▶ [Hook Point] ──▶ [Phase 3]
                              │                              │
                              ▼                              ▼
                         [Plugin A]                     [Plugin B]
                         需求分析                        计划确认
```

## 快速开始

### 1. 在 workflow_service.py 中添加插件支持

```python
# workflow_service.py

from workflows.plugins.integration import WorkflowPluginIntegration
from workflows.plugins import InteractionPoint

class WorkflowService:
    def __init__(self):
        self._tasks = {}
        self._subscribers = {}
        # 添加这一行
        self._plugin_integration = WorkflowPluginIntegration(self)

    async def execute_chat_planning(self, task_id, requirements, enable_indexing=False):
        # ... 原有代码 ...

        # ===== 添加插件支持 (只需少量代码) =====

        # 1. 创建上下文
        context = self._plugin_integration.create_context(
            task_id=task_id,
            user_input=requirements,
            enable_indexing=enable_indexing,
        )

        # 2. 运行 BEFORE_PLANNING 插件 (需求分析)
        context = await self._plugin_integration.run_hook(
            InteractionPoint.BEFORE_PLANNING,
            context
        )

        # 检查是否被取消
        if context.get("workflow_cancelled"):
            return {"status": "cancelled", "reason": context.get("cancel_reason")}

        # 使用可能被增强的需求
        requirements = context.get("requirements", requirements)

        # ===== 原有的计划生成代码 =====
        planning_result = await run_chat_planning_agent(requirements, logger)

        # ===== 添加计划确认插件 =====
        context["planning_result"] = planning_result
        context = await self._plugin_integration.run_hook(
            InteractionPoint.AFTER_PLANNING,
            context
        )

        if context.get("workflow_cancelled"):
            return {"status": "cancelled", "reason": context.get("cancel_reason")}

        # 使用可能被修改的计划
        planning_result = context.get("planning_result", planning_result)

        # ===== 继续原有的代码实现流程 =====
        ...
```

### 2. 添加用户响应 API

```python
# workflows.py (API routes)

@router.post("/respond/{task_id}")
async def respond_to_interaction(task_id: str, response: InteractionResponseRequest):
    """用户提交交互响应"""
    success = workflow_service._plugin_integration.submit_response(
        task_id=task_id,
        action=response.action,
        data=response.data,
        skipped=response.skipped,
    )

    if not success:
        raise HTTPException(status_code=404, detail="No pending interaction")

    return {"status": "ok"}
```

### 3. 前端处理交互请求

```typescript
// useStreaming.ts

case 'interaction_required':
  // 显示交互面板
  setInteraction({
    type: message.interaction_type,
    title: message.title,
    description: message.description,
    data: message.data,
    options: message.options,
  });
  break;
```

## 配置插件

### 启用/禁用插件

```python
from workflows.plugins import get_default_registry

registry = get_default_registry()

# 禁用需求分析插件
registry.disable("requirement_analysis")

# 启用计划确认插件
registry.enable("plan_review")
```

### 创建自定义插件

```python
from workflows.plugins import InteractionPlugin, InteractionPoint
from workflows.plugins.base import InteractionRequest

class MyCustomPlugin(InteractionPlugin):
    name = "my_custom_plugin"
    description = "My custom interaction"
    hook_point = InteractionPoint.BEFORE_IMPLEMENTATION
    priority = 50

    async def should_trigger(self, context):
        return context.get("enable_my_plugin", True)

    async def create_interaction(self, context):
        return InteractionRequest(
            interaction_type="custom_interaction",
            title="Custom Check",
            description="Please confirm...",
            data={"key": "value"},
            options={"yes": "Confirm", "no": "Cancel"},
        )

    async def process_response(self, response, context):
        if response.action == "yes":
            context["custom_confirmed"] = True
        else:
            context["workflow_cancelled"] = True
        return context

# 注册插件
registry.register(MyCustomPlugin())
```

## 交互点列表

| Hook Point | 位置 | 默认插件 |
|------------|------|----------|
| `BEFORE_PLANNING` | 生成计划前 | RequirementAnalysisPlugin |
| `AFTER_PLANNING` | 计划生成后 | PlanReviewPlugin |
| `BEFORE_IMPLEMENTATION` | 代码生成前 | (无) |
| `AFTER_IMPLEMENTATION` | 代码生成后 | (无) |

## WebSocket 消息格式

### 后端 → 前端: `interaction_required`

```json
{
  "type": "interaction_required",
  "task_id": "xxx",
  "interaction_type": "requirement_questions",
  "title": "Let's clarify your requirements",
  "description": "Answer these questions...",
  "data": {
    "questions": [...]
  },
  "options": {
    "submit": "Submit Answers",
    "skip": "Skip"
  },
  "timestamp": "2024-01-01T00:00:00Z"
}
```

### 前端 → 后端: POST `/api/v1/workflows/respond/{task_id}`

```json
{
  "action": "submit",
  "data": {
    "answers": {
      "q1": "Answer 1",
      "q2": "Answer 2"
    }
  },
  "skipped": false
}
```

## 优势

1. **无侵入** - 不修改核心工作流逻辑
2. **可插拔** - 随时启用/禁用插件
3. **可扩展** - 轻松添加新的交互点
4. **可配置** - 通过配置文件控制行为
5. **解耦合** - 交互逻辑与业务逻辑分离


================================================
FILE: workflows/plugins/__init__.py
================================================
# User-in-Loop Plugin System
#
# Public names of the plugin package. InteractionRequest and
# InteractionResponse are re-exported next to the plugin base classes so that
# plugin authors can import every type they need from `workflows.plugins`.
from .base import (
    InteractionPlugin,
    InteractionPoint,
    InteractionRequest,
    InteractionResponse,
    PluginRegistry,
)
from .requirement_analysis import RequirementAnalysisPlugin
from .plan_review import PlanReviewPlugin

__all__ = [
    "InteractionPlugin",
    "InteractionPoint",
    "InteractionRequest",
    "InteractionResponse",
    "PluginRegistry",
    "RequirementAnalysisPlugin",
    "PlanReviewPlugin",
]


================================================
FILE: workflows/plugins/base.py
================================================
"""
User-in-Loop Plugin System - Base Classes

This module provides a plugin-based architecture for adding user interaction
points to workflows without modifying core workflow code.

Design Philosophy:
- Plugins are registered at specific "hook points" in the workflow
- Each plugin decides if it should trigger based on context
- Plugins are completely optional and can be enabled/disabled via config
- Zero changes to core workflow code - just call `await plugins.run_hook(...)`

Usage:
    from workflows.plugins import PluginRegistry, InteractionPoint

    # Initialize registry with interaction callback
    plugins = PluginRegistry(interaction_callback=my_callback)

    # In workflow, call hooks at specific points
    context = await plugins.run_hook(
        InteractionPoint.BEFORE_PLANNING,
        context={"user_input": user_input, "task_id": task_id}
    )
"""

import asyncio
from abc import ABC, abstractmethod
from dataclasses import dataclass, field
from enum import Enum
from typing import Any, Callable, Dict, List, Optional, Awaitable
import logging


class InteractionPoint(Enum):
    """
    Hook points at which plugins can be attached to a workflow.

    A member's name states its position relative to a workflow phase:
    ``BEFORE_*`` is placed ahead of the phase, ``AFTER_*`` behind it.
    """

    # --- Chat Planning Pipeline hooks ---
    # Before generating implementation plan
    BEFORE_PLANNING = "before_planning"
    # After plan is generated, before implementation
    AFTER_PLANNING = "after_planning"

    # --- Paper-to-Code Pipeline hooks ---
    # Before analyzing paper
    BEFORE_RESEARCH_ANALYSIS = "before_research_analysis"
    # After paper analysis
    AFTER_RESEARCH_ANALYSIS = "after_research_analysis"
    # After code plan generated
    AFTER_CODE_PLANNING = "after_code_planning"

    # --- Common hooks ---
    # Before code generation starts
    BEFORE_IMPLEMENTATION = "before_implementation"
    # After code is generated
    AFTER_IMPLEMENTATION = "after_implementation"


@dataclass
class InteractionRequest:
    """A request for user interaction, as produced by a plugin"""

    # Type of interaction (e.g., "questions", "plan_review")
    interaction_type: str
    # Display title
    title: str
    # Description for user
    description: str
    # Interaction-specific data
    data: Dict[str, Any]
    # Available actions
    options: Dict[str, str] = field(default_factory=dict)
    # If True, cannot be skipped
    required: bool = False
    # Timeout for response (5 min default)
    timeout_seconds: int = 300


@dataclass
class InteractionResponse:
    """The user's answer to an interaction request"""

    # User's action (e.g., "confirm", "modify", "skip")
    action: str
    # Response data
    data: Dict[str, Any] = field(default_factory=dict)
    # True if user chose to skip
    skipped: bool = False


class InteractionPlugin(ABC):
    """
    Abstract base for User-in-Loop plugins.

    A concrete plugin supplies three coroutines:
    1. should_trigger() - whether the plugin runs for the given context
    2. create_interaction() - the interaction request to present
    3. process_response() - how the user's response changes the context

    ``on_skip()`` and ``on_timeout()`` have default implementations and may be
    overridden.

    Example:
        class MyPlugin(InteractionPlugin):
            name = "my_plugin"
            hook_point = InteractionPoint.AFTER_PLANNING

            async def should_trigger(self, context):
                return context.get("enable_my_plugin", True)

            async def create_interaction(self, context):
                return InteractionRequest(...)

            async def process_response(self, response, context):
                context["my_result"] = response.data
                return context
    """

    # Plugin metadata - subclasses are expected to override these
    name: str = "base_plugin"
    description: str = "Base plugin"
    hook_point: InteractionPoint = InteractionPoint.BEFORE_PLANNING
    priority: int = 100  # Lower number = higher priority (runs first)

    def __init__(self, enabled: bool = True, config: Optional[Dict] = None):
        self.enabled = enabled
        # A missing (or empty) config becomes a fresh dict owned by this plugin
        self.config = config if config else {}
        # Logger is named after the plugin's ``name`` attribute
        self.logger = logging.getLogger(f"plugin.{self.name}")

    @abstractmethod
    async def should_trigger(self, context: Dict[str, Any]) -> bool:
        """
        Decide whether this plugin runs for the given context.

        Args:
            context: Current workflow context

        Returns:
            True if plugin should run, False to skip
        """

    @abstractmethod
    async def create_interaction(self, context: Dict[str, Any]) -> InteractionRequest:
        """
        Build the interaction request that is sent to the user.

        Args:
            context: Current workflow context

        Returns:
            InteractionRequest with data for user interface
        """

    @abstractmethod
    async def process_response(
        self, response: InteractionResponse, context: Dict[str, Any]
    ) -> Dict[str, Any]:
        """
        Apply the user's response to the workflow context.

        Args:
            response: User's response
            context: Current workflow context

        Returns:
            Updated context dictionary
        """

    async def on_skip(self, context: Dict[str, Any]) -> Dict[str, Any]:
        """
        Hook invoked when the user skips the interaction.
        The default logs the skip and leaves the context untouched.

        Args:
            context: Current workflow context

        Returns:
            Updated context (default: unchanged)
        """
        self.logger.info(f"Plugin {self.name} skipped by user")
        return context

    async def on_timeout(self, context: Dict[str, Any]) -> Dict[str, Any]:
        """
        Hook invoked when the interaction times out.
        The default logs a warning and then delegates to ``on_skip``.

        Args:
            context: Current workflow context

        Returns:
            Updated context (default: same as skip)
        """
        self.logger.warning(f"Plugin {self.name} timed out")
        context_after_skip = await self.on_skip(context)
        return context_after_skip


# Type alias for interaction callback: a callable that receives the task id and
# the InteractionRequest and returns an awaitable yielding the
# InteractionResponse.
InteractionCallback = Callable[
    [str, InteractionRequest],  # (task_id, request)
    Awaitable[InteractionResponse],  # Returns response
]


class PluginRegistry:
    """
    Registry for managing and executing User-in-Loop plugins.

    Features:
    - Register plugins at specific hook points
    - Enable/disable plugins dynamically
    - Execute all plugins at a hook point in priority order
    - Handle interaction callbacks to frontend

    Usage:
        # Create registry
        registry = PluginRegistry()

        # Register plugins
        registry.register(RequirementAnalysisPlugin())
        registry.register(PlanReviewPlugin(enabled=False))

        # Set interaction callback (connects to WebSocket/API)
        registry.set_interaction_callback(my_callback)

        # Run hooks in workflow
        context = await registry.run_hook(InteractionPoint.BEFORE_PLANNING, context)
    """

    def __init__(self, interaction_callback: Optional[InteractionCallback] = None):
        """
        Create an empty registry with one plugin list per interaction point.

        Args:
            interaction_callback: Optional coroutine used to ask the user;
                can also be set later via set_interaction_callback().
        """
        self._plugins: Dict[InteractionPoint, List[InteractionPlugin]] = {
            point: [] for point in InteractionPoint
        }
        self._interaction_callback = interaction_callback
        self.logger = logging.getLogger("plugin.registry")

    def register(self, plugin: InteractionPlugin) -> None:
        """Register a plugin at its hook point, keeping the list priority-sorted."""
        hook_point = plugin.hook_point
        self._plugins[hook_point].append(plugin)
        # Sort by priority (lower number first)
        self._plugins[hook_point].sort(key=lambda p: p.priority)
        self.logger.info(f"Registered plugin '{plugin.name}' at {hook_point.value}")

    def unregister(self, plugin_name: str) -> bool:
        """
        Unregister the first plugin with the given name.

        Returns:
            True if a plugin was removed, False if no plugin has that name.
        """
        for plugins in self._plugins.values():
            for plugin in plugins:
                if plugin.name == plugin_name:
                    # Safe despite the enclosing iteration: we return right away.
                    plugins.remove(plugin)
                    self.logger.info(f"Unregistered plugin '{plugin_name}'")
                    return True
        return False

    def _set_enabled(self, plugin_name: str, enabled: bool) -> bool:
        """Set the enabled flag on the first plugin named plugin_name."""
        for plugins in self._plugins.values():
            for plugin in plugins:
                if plugin.name == plugin_name:
                    plugin.enabled = enabled
                    state = "Enabled" if enabled else "Disabled"
                    self.logger.info(f"{state} plugin '{plugin_name}'")
                    return True
        return False

    def enable(self, plugin_name: str) -> bool:
        """Enable a plugin by name; returns False if it is not registered."""
        return self._set_enabled(plugin_name, True)

    def disable(self, plugin_name: str) -> bool:
        """Disable a plugin by name; returns False if it is not registered."""
        return self._set_enabled(plugin_name, False)

    def set_interaction_callback(self, callback: InteractionCallback) -> None:
        """Set the callback function for user interactions."""
        self._interaction_callback = callback

    def get_plugins(self, hook_point: InteractionPoint) -> List[InteractionPlugin]:
        """Get all plugins registered at a hook point."""
        return self._plugins.get(hook_point, [])

    async def run_hook(
        self,
        hook_point: InteractionPoint,
        context: Dict[str, Any],
        task_id: Optional[str] = None,
    ) -> Dict[str, Any]:
        """
        Execute all enabled plugins at a hook point.

        Plugins are executed in priority order. Each plugin can:
        - Modify the context
        - Request user interaction
        - Be skipped by the user

        A plugin that raises is logged and skipped; the remaining plugins
        still run. Only a timeout of the interaction callback itself is
        routed to the plugin's on_timeout(); a TimeoutError raised while the
        plugin processes the response is treated as an ordinary failure.

        Args:
            hook_point: The hook point to execute
            context: Current workflow context
            task_id: Task ID for interaction callbacks

        Returns:
            Updated context after all plugins have run
        """
        plugins = self._plugins.get(hook_point, [])

        if not plugins:
            self.logger.debug(f"No plugins registered at {hook_point.value}")
            return context

        self.logger.info(
            f"Running hook {hook_point.value} with {len(plugins)} plugin(s)"
        )

        # Iterate over a snapshot so a plugin that (un)registers plugins while
        # running cannot disturb this loop.
        for plugin in list(plugins):
            if not plugin.enabled:
                self.logger.debug(f"Plugin '{plugin.name}' is disabled, skipping")
                continue

            try:
                # Check if plugin should trigger
                if not await plugin.should_trigger(context):
                    self.logger.debug(f"Plugin '{plugin.name}' chose not to trigger")
                    continue

                self.logger.info(f"Running plugin '{plugin.name}'")

                # Create interaction request
                interaction = await plugin.create_interaction(context)

                # If we have a callback, request user interaction
                if self._interaction_callback and task_id:
                    # Keep the try body limited to the wait itself so that a
                    # TimeoutError from the plugin's own processing is not
                    # mistaken for the user failing to answer.
                    try:
                        response = await asyncio.wait_for(
                            self._interaction_callback(task_id, interaction),
                            timeout=interaction.timeout_seconds,
                        )
                    except asyncio.TimeoutError:
                        self.logger.warning(
                            f"Plugin '{plugin.name}' interaction timed out"
                        )
                        context = await plugin.on_timeout(context)
                    else:
                        if response.skipped:
                            context = await plugin.on_skip(context)
                        else:
                            context = await plugin.process_response(response, context)
                elif not interaction.required:
                    # No callback - auto-skip non-required interactions
                    self.logger.info(
                        f"No callback, auto-skipping plugin '{plugin.name}'"
                    )
                    context = await plugin.on_skip(context)
                else:
                    raise RuntimeError(
                        f"Plugin '{plugin.name}' requires interaction but no callback provided"
                    )

            except Exception as e:
                # Best effort: one failing plugin must not block the others.
                self.logger.error(
                    f"Plugin '{plugin.name}' failed: {e}", exc_info=True
                )
                continue

        return context


# Global default registry. Stays None until get_default_registry() creates it;
# reset_registry() sets it back to None.
_default_registry: Optional[PluginRegistry] = None


def get_default_registry(auto_register: bool = True) -> PluginRegistry:
    """
    Get or create the default plugin registry.

    The default plugins are registered the first time this is called with
    ``auto_register=True``, even if the registry itself was created earlier by
    a call with ``auto_register=False``. Registration is attempted at most
    once per registry instance.

    Args:
        auto_register: If True, auto-register default plugins. Set to False to avoid
                       circular imports when called from plugin modules.

    Returns:
        The shared PluginRegistry instance.
    """
    global _default_registry
    if _default_registry is None:
        _default_registry = PluginRegistry()

    registry = _default_registry

    # Track registration separately from creation: otherwise an early
    # auto_register=False call would permanently prevent the defaults from
    # ever being registered.
    if auto_register and not getattr(registry, "_defaults_registered", False):
        # Mark before attempting so a failing import warns only once.
        registry._defaults_registered = True

        # Lazy import to avoid circular imports
        try:
            from .requirement_analysis import RequirementAnalysisPlugin
            from .plan_review import PlanReviewPlugin

            # Do not duplicate a default that was already registered by hand.
            already_registered = {
                plugin.name
                for plugins in registry._plugins.values()
                for plugin in plugins
            }
            for plugin_cls in (RequirementAnalysisPlugin, PlanReviewPlugin):
                if plugin_cls.name not in already_registered:
                    registry.register(plugin_cls())
        except ImportError as e:
            logging.getLogger("plugin.registry").warning(
                f"Could not auto-register default plugins: {e}"
            )

    return registry


def reset_registry() -> None:
    """Drop the shared default registry (handy in tests).

    After this call the module-level ``_default_registry`` is ``None`` again.
    """
    global _default_registry
    # Rebinding the module global is all that is needed to discard it.
    _default_registry = None


================================================
FILE: workflows/plugins/integration.py
================================================
"""
Plugin Integration Helper

This module shows how to integrate the User-in-Loop plugin system
into existing workflows with minimal code changes.

The key idea is to add ONE LINE at each hook point:
    context = await plugins.run_hook(InteractionPoint.XXX, context, task_id)

Example integration in execute_chat_based_planning_pipeline:

    # Before (original code):
    planning_result = await run_chat_planning_agent(user_input, logger)

    # After (with plugin):
    context = {"user_input": user_input, "task_id": task_id}
    context = await plugins.run_hook(InteractionPoint.BEFORE_PLANNING, context, task_id)
    user_input = context.get("requirements", user_input)  # May be enhanced

    planning_result = await run_chat_planning_agent(user_input, logger)

    context["planning_result"] = planning_result
    context = await plugins.run_hook(InteractionPoint.AFTER_PLANNING, context, task_id)

    if context.get("workflow_cancelled"):
        return {"status": "cancelled", "reason": context.get("cancel_reason")}
"""

import asyncio
from typing import Any, Callable, Dict, List, Optional
from datetime import datetime

from .base import (
    PluginRegistry,
    InteractionPoint,
    InteractionRequest,
    InteractionResponse,
    get_default_registry,
)


class WorkflowPluginIntegration:
    """
    Helper class for integrating plugins with workflow execution.

    This class bridges the plugin system with the workflow service,
    handling the communication between backend and frontend.

    Usage in workflow_service.py:

        from workflows.plugins.integration import WorkflowPluginIntegration

        class WorkflowService:
            def __init__(self):
                self._plugin_integration = WorkflowPluginIntegration(self)

            async def execute_chat_planning(self, task_id, requirements, ...):
                # Get context with plugin support
                context = self._plugin_integration.create_context(
                    task_id=task_id,
                    user_input=requirements,
                )

                # Run before-planning plugins
                context = await self._plugin_integration.run_hook(
                    InteractionPoint.BEFORE_PLANNING,
                    context
                )

                # Continue with (possibly enhanced) requirements
                requirements = context.get("requirements", requirements)
                ...
    """

    def __init__(
        self, workflow_service: Any, registry: Optional[PluginRegistry] = None
    ):
        """
        Initialize plugin integration.

        Args:
            workflow_service: The WorkflowService instance
            registry: Optional custom plugin registry (uses default if not provided)
        """
        self._workflow_service = workflow_service
        self._registry = registry or get_default_registry()

        # Set up interaction callback
        self._registry.set_interaction_callback(self._handle_interaction)

        # Pending interactions (task_id -> response_future)
        self._pending_interactions: Dict[str, asyncio.Future] = {}

    def create_context(self, task_id: str, **kwargs) -> Dict[str, Any]:
        """Create a workflow context dict holding task_id, a timestamp and kwargs."""
        return {
            "task_id": task_id,
            "timestamp": datetime.utcnow().isoformat(),
            **kwargs,
        }

    async def run_hook(
        self,
        hook_point: InteractionPoint,
        context: Dict[str, Any],
    ) -> Dict[str, Any]:
        """
        Run plugins at a hook point.

        This is the main entry point for plugin execution. The task ID is
        taken from ``context["task_id"]``.
        """
        task_id = context.get("task_id")
        return await self._registry.run_hook(hook_point, context, task_id)

    async def _handle_interaction(
        self,
        task_id: str,
        request: InteractionRequest,
    ) -> InteractionResponse:
        """
        Handle interaction request from a plugin.

        This method:
        1. Broadcasts the interaction request to frontend via WebSocket
        2. Waits for user response (via submit_response)
        3. Returns the response to the plugin

        The pending future and the task's waiting state are always cleaned
        up, including when the broadcast itself fails.

        Returns:
            The submitted response, or a skipped "timeout" response if the
            user does not answer within ``request.timeout_seconds``.
        """
        # Fields shared by the task's pending_interaction and the broadcast.
        details = {
            "title": request.title,
            "description": request.description,
            "data": request.data,
            "options": request.options,
            "required": request.required,
        }

        # Update task status
        task = self._workflow_service.get_task(task_id)
        if task:
            task.status = "waiting_for_input"
            task.pending_interaction = {"type": request.interaction_type, **details}

        # We are inside a coroutine, so a running loop always exists.
        response_future: asyncio.Future = asyncio.get_running_loop().create_future()
        self._pending_interactions[task_id] = response_future

        try:
            # Broadcast to frontend. Kept under the finally below so that a
            # failing broadcast cannot leave the task stuck in
            # "waiting_for_input" with an orphaned future.
            await self._workflow_service._broadcast(
                task_id,
                {
                    "type": "interaction_required",
                    "task_id": task_id,
                    "interaction_type": request.interaction_type,
                    **details,
                    "timestamp": datetime.utcnow().isoformat(),
                },
            )

            try:
                # Wait for response
                return await asyncio.wait_for(
                    response_future, timeout=request.timeout_seconds
                )
            except asyncio.TimeoutError:
                # Return timeout response
                return InteractionResponse(
                    action="timeout",
                    data={},
                    skipped=True,
                )
        finally:
            # Clean up; only drop the entry if it is still ours.
            if self._pending_interactions.get(task_id) is response_future:
                del self._pending_interactions[task_id]
            if task:
                task.status = "running"
                task.pending_interaction = None

    def submit_response(
        self,
        task_id: str,
        action: str,
        data: Optional[Dict[str, Any]] = None,
        skipped: bool = False,
    ) -> bool:
        """
        Submit user's response to a pending interaction.

        Called by the API endpoint when user responds.

        Args:
            task_id: The task ID
            action: User's action (e.g., "confirm", "modify", "skip")
            data: Response data
            skipped: Whether user chose to skip

        Returns:
            True if response was submitted, False if no pending interaction
        """
        future = self._pending_interactions.get(task_id)
        if future and not future.done():
            response = InteractionResponse(
                action=action,
                data=data or {},
                skipped=skipped,
            )
            future.set_result(response)
            return True
        return False

    def has_pending_interaction(self, task_id: str) -> bool:
        """Check if a task has a pending interaction."""
        return task_id in self._pending_interactions

    def cancel_interaction(self, task_id: str) -> bool:
        """Cancel a pending interaction (e.g., when task is cancelled)."""
        future = self._pending_interactions.get(task_id)
        if future and not future.done():
            future.cancel()
            self._pending_interactions.pop(task_id, None)
            return True
        return False


def create_plugin_enabled_wrapper(
    original_function: Callable,
    before_hooks: List[InteractionPoint],
    after_hooks: List[InteractionPoint],
    integration: WorkflowPluginIntegration,
) -> Callable:
    """
    Build an async wrapper that surrounds a function with plugin hooks.

    Lets an existing workflow coroutine gain before/after plugin hooks
    without editing its body. The wrapper accepts an extra keyword-only
    ``task_id`` which is used for the plugin context and is not forwarded
    to the wrapped function. If any hook marks the context as cancelled,
    the wrapper returns a ``{"status": "cancelled", ...}`` dict instead of
    the function's result.

    Example:
        # Original function
        async def execute_planning(requirements, logger):
            ...

        # Wrap with plugins
        execute_planning_with_plugins = create_plugin_enabled_wrapper(
            execute_planning,
            before_hooks=[InteractionPoint.BEFORE_PLANNING],
            after_hooks=[InteractionPoint.AFTER_PLANNING],
            integration=plugin_integration,
        )
    """

    def _cancelled_payload(ctx):
        # None while the workflow is still live, otherwise the early-exit result.
        if not ctx.get("workflow_cancelled"):
            return None
        return {"status": "cancelled", "reason": ctx.get("cancel_reason")}

    async def wrapper(*args, task_id: str = None, **kwargs):
        context = integration.create_context(
            task_id=task_id or "unknown",
            args=args,
            kwargs=kwargs,
        )

        # Pre-execution hooks; stop as soon as one cancels the workflow.
        for hook in before_hooks:
            context = await integration.run_hook(hook, context)
            early_exit = _cancelled_payload(context)
            if early_exit is not None:
                return early_exit

        # The wrapped coroutine itself.
        result = await original_function(*args, **kwargs)
        context["result"] = result

        # Post-execution hooks can still cancel and replace the result.
        for hook in after_hooks:
            context = await integration.run_hook(hook, context)
            early_exit = _cancelled_payload(context)
            if early_exit is not None:
                return early_exit

        return result

    return wrapper


================================================
FILE: workflows/plugins/plan_review.py
================================================
"""
Plan Review Plugin

This plugin triggers after planning to let users review and modify
the implementation plan before code generation begins.

Flow:
1. AI generates implementation plan
2. Plugin presents plan to user
3. User can: Confirm / Request modifications / Cancel
4. If modifications requested, AI updates the plan
5. Code generation proceeds with approved plan
"""

from typing import Any, Dict, Optional
from .base import (
    InteractionPlugin,
    InteractionPoint,
    InteractionRequest,
    InteractionResponse,
)


class PlanReviewPlugin(InteractionPlugin):
    """
    Plugin for reviewing and modifying implementation plans.

    This allows users to:
    - Review the generated YAML implementation plan
    - Confirm to proceed with code generation
    - Request modifications to the plan
    - Cancel the workflow entirely

    The confirmed/modified plan is then used for code generation.

    Context keys read: ``implementation_plan`` (falling back to
    ``planning_result``), ``initial_plan_path``, ``skip_plan_review``,
    ``plan_approved``, ``plan_modification_round``.
    Context keys written: ``plan_approved``, ``plan_auto_approved``,
    ``implementation_plan``, ``planning_result``, ``plan_modification_round``,
    ``last_modification_feedback``, ``plan_modification_warning``,
    ``plan_modification_error``, ``workflow_cancelled``, ``cancel_reason``.
    """

    name = "plan_review"
    description = "Review and optionally modify the implementation plan"
    hook_point = InteractionPoint.AFTER_PLANNING
    priority = 10

    def __init__(self, enabled: bool = True, config: Optional[Dict] = None):
        """
        Args:
            enabled: Whether the plugin starts enabled.
            config: Optional settings; ``max_modification_rounds`` (default 3)
                caps how many times the user may request plan changes.
        """
        super().__init__(enabled, config)
        self._max_modification_rounds = (
            config.get("max_modification_rounds", 3) if config else 3
        )

    @staticmethod
    def _current_plan(context: Dict[str, Any]) -> Any:
        """Return the plan under review, preferring implementation_plan."""
        return context.get("implementation_plan") or context.get(
            "planning_result", ""
        )

    async def should_trigger(self, context: Dict[str, Any]) -> bool:
        """
        Trigger if:
        - A plan has been generated
        - Plan review is not disabled
        - Haven't already reviewed/approved the plan

        If the context holds no plan but has ``initial_plan_path``, the plan
        is read from that file and stored in ``context["implementation_plan"]``.
        """
        # Check if disabled
        if context.get("skip_plan_review", False):
            return False

        # Check if already reviewed
        if context.get("plan_approved", False):
            return False

        # Check if we have a plan to review
        plan = context.get("implementation_plan") or context.get("planning_result")
        if not plan:
            # Try to read from file
            plan_path = context.get("initial_plan_path")
            if not plan_path:
                return False
            try:
                with open(plan_path, "r", encoding="utf-8") as f:
                    plan = f.read()
            except Exception as e:
                # Nothing to review if the plan file cannot be read.
                self.logger.debug(f"Could not read plan from '{plan_path}': {e}")
                return False
            context["implementation_plan"] = plan

        return len(str(plan).strip()) > 0

    async def create_interaction(self, context: Dict[str, Any]) -> InteractionRequest:
        """Create the plan review interaction (full plan plus a 50-line preview)."""
        plan = self._current_plan(context)
        modification_round = context.get("plan_modification_round", 0)

        # Prepare plan summary
        plan_lines = str(plan).split("\n")
        plan_preview = "\n".join(plan_lines[:50])  # First 50 lines as preview
        if len(plan_lines) > 50:
            plan_preview += f"\n... ({len(plan_lines) - 50} more lines)"

        description = "Review the implementation plan below. You can approve it, request changes, or cancel."
        if modification_round > 0:
            description = f"Plan has been modified (round {modification_round}). Please review again."

        return InteractionRequest(
            interaction_type="plan_review",
            title="🔍 Review Implementation Plan",
            description=description,
            data={
                "plan": plan,
                "plan_preview": plan_preview,
                "plan_path": context.get("initial_plan_path"),
                "modification_round": modification_round,
                "max_rounds": self._max_modification_rounds,
            },
            options={
                "confirm": "✓ Approve & Continue",
                "modify": "✎ Request Changes",
                "cancel": "✕ Cancel Workflow",
            },
            required=False,  # Can be skipped (auto-approve)
            timeout_seconds=600,  # 10 minutes for review
        )

    async def process_response(
        self, response: InteractionResponse, context: Dict[str, Any]
    ) -> Dict[str, Any]:
        """
        Process user's plan review response.

        Actions:
        - "confirm": mark the plan approved.
        - "modify": rewrite the plan from ``response.data["feedback"]`` and
          leave it unapproved so it can be reviewed again; auto-approves once
          the round limit is exceeded or if saving the plan fails.
        - "cancel": flag the workflow as cancelled.
        - anything else: treated as confirm.

        Returns:
            The updated context.
        """
        action = response.action.lower()

        if action == "confirm":
            # Plan approved, proceed
            context["plan_approved"] = True
            self.logger.info("Implementation plan approved by user")

        elif action == "modify":
            # User wants modifications
            feedback = response.data.get("feedback", "")
            modification_round = context.get("plan_modification_round", 0) + 1

            if modification_round > self._max_modification_rounds:
                self.logger.warning(
                    f"Max modification rounds ({self._max_modification_rounds}) reached"
                )
                context["plan_approved"] = True
                context["plan_modification_warning"] = (
                    "Maximum modification rounds reached"
                )
                return context

            # Modify the plan based on feedback
            try:
                # Use the same lookup as should_trigger/create_interaction so
                # a plan supplied only as "planning_result" is not replaced
                # by a modification of an empty string.
                modified_plan = await self._modify_plan(
                    self._current_plan(context), feedback, context
                )

                context["implementation_plan"] = modified_plan
                context["planning_result"] = modified_plan
                context["plan_modification_round"] = modification_round
                context["last_modification_feedback"] = feedback

                # Save modified plan to file
                plan_path = context.get("initial_plan_path")
                if plan_path:
                    with open(plan_path, "w", encoding="utf-8") as f:
                        f.write(modified_plan)

                self.logger.info(f"Plan modified (round {modification_round})")

                # Note: The workflow should loop back to show the modified plan
                # This is handled by NOT setting plan_approved = True

            except Exception as e:
                self.logger.error(f"Failed to modify plan: {e}")
                context["plan_modification_error"] = str(e)
                # Auto-approve to continue
                context["plan_approved"] = True

        elif action == "cancel":
            # User wants to cancel
            context["workflow_cancelled"] = True
            context["cancel_reason"] = response.data.get(
                "reason", "User cancelled at plan review"
            )
            self.logger.info("Workflow cancelled by user at plan review")

        else:
            # Unknown action, treat as confirm
            self.logger.warning(f"Unknown action '{action}', treating as confirm")
            context["plan_approved"] = True

        return context

    async def _modify_plan(
        self, current_plan: str, feedback: str, context: Dict[str, Any]
    ) -> str:
        """
        Modify the implementation plan based on user feedback.
        Uses RequirementAnalysisAgent's modify_requirements method.

        If the agent cannot be imported or fails, the original plan is
        returned with the feedback appended as a comment block, every
        feedback line prefixed with ``# ``.
        """
        try:
            from workflows.agents.requirement_analysis_agent import (
                RequirementAnalysisAgent,
            )

            async with RequirementAnalysisAgent() as agent:
                modified = await agent.modify_requirements(current_plan, feedback)
                return modified

        except Exception as e:
            self.logger.error(f"Plan modification failed: {e}")
            # Comment out every line of the feedback; multi-line feedback
            # would otherwise leak uncommented text into the plan.
            commented_feedback = (
                "\n".join(f"# {line}" for line in str(feedback).splitlines())
                or "# "
            )
            # Return original plan with feedback appended as comment
            return "\n".join(
                [
                    f"{current_plan}",
                    "",
                    "# ==========================================",
                    "# User Modification Request (not applied automatically):",
                    commented_feedback,
                    "# ==========================================",
                    "",
                ]
            )

    async def on_skip(self, context: Dict[str, Any]) -> Dict[str, Any]:
        """Handle skip - auto-approve the plan."""
        context["plan_approved"] = True
        context["plan_auto_approved"] = True
        self.logger.info("Plan auto-approved (user skipped review)")
        return context

    async def on_timeout(self, context: Dict[str, Any]) -> Dict[str, Any]:
        """Handle timeout - auto-approve."""
        self.logger.warning("Plan review timed out, auto-approving")
        return await self.on_skip(context)


================================================
FILE: workflows/plugins/requirement_analysis.py
================================================
"""
Requirement Analysis Plugin

This plugin triggers before planning to gather more detailed requirements
from the user through guided questions.

Flow:
1. User submits initial requirements
2. Plugin generates 1-3 targeted questions
3. User answers questions (or skips)
4. Plugin creates enhanced requirements document
5. Enhanced requirements passed to planning phase
"""

from typing import Any, Dict, Optional
from .base import (
    InteractionPlugin,
    InteractionPoint,
    InteractionRequest,
    InteractionResponse,
)


class RequirementAnalysisPlugin(InteractionPlugin):
    """
    Plugin for enhanced requirement gathering through AI-generated questions.

    This plugin uses the existing RequirementAnalysisAgent to:
    1. Generate targeted questions based on initial requirements
    2. Collect user answers
    3. Create a detailed requirements document

    The enhanced requirements lead to better implementation plans and code.

    The agent is created lazily and released again on every path that ends
    the interaction (answers processed, no answers given, skip, timeout).
    """

    name = "requirement_analysis"
    description = "Gather detailed requirements through guided questions"
    hook_point = InteractionPoint.BEFORE_PLANNING
    priority = 10  # High priority - runs first

    def __init__(self, enabled: bool = True, config: Optional[Dict] = None):
        """
        Create the plugin without instantiating the agent.

        Args:
            enabled: Forwarded to the base plugin constructor.
            config: Optional plugin configuration, forwarded to the base
                plugin constructor.
        """
        super().__init__(enabled, config)
        self._agent = None

    @staticmethod
    def _get_user_input(context: Dict[str, Any]) -> str:
        """
        Return the requirement text stored in the context.

        ``user_input`` takes precedence over ``requirements``; an empty
        string is returned when neither key holds a truthy value, so callers
        never receive ``None``.
        """
        return context.get("user_input") or context.get("requirements") or ""

    async def _get_agent(self):
        """
        Lazily create and initialize the RequirementAnalysisAgent.

        Returns:
            The cached, initialized agent.

        Raises:
            Whatever the agent import, construction or ``initialize()``
            raises; in that case nothing is cached.
        """
        if self._agent is None:
            from workflows.agents.requirement_analysis_agent import (
                RequirementAnalysisAgent,
            )

            agent = RequirementAnalysisAgent()
            await agent.initialize()
            # Cache only after initialize() succeeded, so a failed attempt is
            # retried next time instead of handing out a half-built agent.
            self._agent = agent
        return self._agent

    async def _cleanup_agent(self):
        """
        Release the cached agent, if any.

        The reference is dropped before ``cleanup()`` is awaited so that a
        failing cleanup cannot leave a stale agent behind for reuse. Errors
        raised by ``cleanup()`` still propagate to the caller.
        """
        agent, self._agent = self._agent, None
        if agent is not None:
            await agent.cleanup()

    async def should_trigger(self, context: Dict[str, Any]) -> bool:
        """
        Trigger if:
        - User has provided initial requirements
        - Requirement analysis is not disabled in config
        - User hasn't already answered questions for this session

        Args:
            context: Workflow context to inspect.

        Returns:
            ``True`` when the interaction should be shown, else ``False``.
        """
        # Check if disabled in context
        if context.get("skip_requirement_analysis", False):
            return False

        # Check if already processed
        if context.get("requirements_enhanced", False):
            return False

        # Check if we have user input to analyze; fewer than 10 characters
        # (after stripping whitespace) is treated as nothing to analyze.
        user_input = self._get_user_input(context)
        if len(user_input.strip()) < 10:
            return False

        return True

    async def create_interaction(self, context: Dict[str, Any]) -> InteractionRequest:
        """
        Generate questions based on user's initial requirements.

        Args:
            context: Workflow context holding the initial requirements.

        Returns:
            An optional ``requirement_questions`` interaction. If question
            generation fails, a single generic fallback question is returned
            instead of raising.
        """
        user_input = self._get_user_input(context)

        try:
            agent = await self._get_agent()
            questions = await agent.generate_guiding_questions(user_input)

            return InteractionRequest(
                interaction_type="requirement_questions",
                title="📋 Let's clarify your requirements",
                description="Answer these questions to help generate better code (or skip to continue)",
                data={
                    "questions": questions,
                    "original_input": user_input,
                },
                options={
                    "submit": "Submit Answers",
                    "skip": "Skip and Continue",
                },
                required=False,
                timeout_seconds=300,  # 5 minutes
            )
        except Exception as e:
            self.logger.error(f"Failed to generate questions: {e}")
            # Return a simple fallback interaction
            return InteractionRequest(
                interaction_type="requirement_questions",
                title="📋 Add more details?",
                description="Would you like to provide any additional details about your requirements?",
                data={
                    "questions": [
                        {
                            "id": "additional_details",
                            "category": "General",
                            "question": "Is there anything else you'd like to add about your project requirements?",
                            "importance": "Medium",
                            "hint": "Any technical preferences, constraints, or specific features",
                        }
                    ],
                    "original_input": user_input,
                },
                options={
                    "submit": "Submit",
                    "skip": "Skip",
                },
                required=False,
                timeout_seconds=300,
            )

    async def process_response(
        self, response: InteractionResponse, context: Dict[str, Any]
    ) -> Dict[str, Any]:
        """
        Process user's answers and create enhanced requirements.

        Args:
            response: The user's response; ``response.data["answers"]`` is
                read if present.
            context: Workflow context; it is updated in place.

        Returns:
            The same context with ``requirements_enhanced`` set to ``True``.
            When answers were given and summarization succeeded, it also
            carries ``original_requirements``, ``user_answers`` and the
            enhanced text under both ``requirements`` and ``user_input``.
        """
        user_input = self._get_user_input(context)
        # Tolerate a response without a data payload.
        answers = (response.data or {}).get("answers") or {}

        if not answers:
            # No answers provided, use original input. The agent created for
            # question generation is no longer needed, so release it here too.
            context["requirements_enhanced"] = True
            await self._cleanup_agent()
            return context

        try:
            agent = await self._get_agent()

            # Generate detailed requirements document
            enhanced_requirements = await agent.summarize_detailed_requirements(
                user_input, answers
            )

            # Update context with enhanced requirements
            context["original_requirements"] = user_input
            context["user_answers"] = answers
            context["requirements"] = enhanced_requirements
            context["user_input"] = enhanced_requirements  # For chat pipeline
            context["requirements_enhanced"] = True

            self.logger.info("Requirements enhanced with user answers")

        except Exception as e:
            self.logger.error(f"Failed to enhance requirements: {e}")
            # Keep original requirements
            context["requirements_enhanced"] = True

        finally:
            await self._cleanup_agent()

        return context

    async def on_skip(self, context: Dict[str, Any]) -> Dict[str, Any]:
        """
        Handle skip - mark as processed but don't modify requirements.

        Sets ``requirements_enhanced`` and ``requirements_skipped`` on the
        context, releases the agent, and returns the context.
        """
        context["requirements_enhanced"] = True
        context["requirements_skipped"] = True
        await self._cleanup_agent()
        return context

    async def on_timeout(self, context: Dict[str, Any]) -> Dict[str, Any]:
        """Handle timeout - log a warning, then behave exactly like a skip."""
        self.logger.warning(
            "Requirement analysis timed out, continuing with original requirements"
        )
        return await self.on_skip(context)