gitextract_qsg5gbbh/

├── .github/
│   ├── dependabot.yml
│   └── workflows/
│       ├── claude-code-review.yml
│       └── claude.yml
├── .gitignore
├── CLAUDE.md
├── LICENSE
├── README.md
├── examples/
│   ├── arxiv.md
│   ├── inference-market-gpt45.md
│   ├── inference-market.md
│   └── pubmed.md
├── langgraph.json
├── pyproject.toml
├── src/
│   ├── legacy/
│   │   ├── CLAUDE.md
│   │   ├── __init__.py
│   │   ├── configuration.py
│   │   ├── files/
│   │   │   └── vibe_code.md
│   │   ├── graph.ipynb
│   │   ├── graph.py
│   │   ├── legacy.md
│   │   ├── multi_agent.ipynb
│   │   ├── multi_agent.py
│   │   ├── prompts.py
│   │   ├── state.py
│   │   ├── tests/
│   │   │   ├── conftest.py
│   │   │   ├── run_test.py
│   │   │   └── test_report_quality.py
│   │   └── utils.py
│   ├── open_deep_research/
│   │   ├── configuration.py
│   │   ├── deep_researcher.py
│   │   ├── prompts.py
│   │   ├── state.py
│   │   └── utils.py
│   └── security/
│       └── auth.py
└── tests/
    ├── evaluators.py
    ├── expt_results/
    │   ├── deep_research_bench_claude4-sonnet.jsonl
    │   ├── deep_research_bench_gpt-4.1.jsonl
    │   └── deep_research_bench_gpt-5.jsonl
    ├── extract_langsmith_data.py
    ├── pairwise_evaluation.py
    ├── prompts.py
    ├── run_evaluate.py
    └── supervisor_parallel_evaluation.py